[ { "id": "0074qaufB6", "title": "InfoNet: Missing Information Retrieval in Multi-Stream Sensing Systems", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Faulty sensors in a multiple input stream setup are more prone to corrupted input data streams, hindering the performance of Deep Neural Networks (DNN), which focus on deducing information from data. However, the relevant information among multiple input streams has correlations and contains mutual information. This paper utilizes this opportunity to retrieve perturbed information caused by corrupted input streams. We propose InfoNet, which estimates the information entropy at every element of the input feature to the network and retrieves the missing information in the input feature matrix. Finally, using the estimated information entropy and retrieved data, we introduce a novel guided replacement procedure to recover the complete information that is the input to the downstream DNN task. We evaluate the proposed algorithm for sound localization where audio streams from the microphone array are corrupted. We have recovered the performance drop due to the corrupted input stream and reduced the localization error with non-corrupted input streams. Finally, we assess the potential of using the proposed algorithm for retrieving information in other sensing modalities, e.g., wireless signal-based source localization.", "keywords": "Early attention;Feature Recovery;Information theory;Entropy;Multi-stream sensing system", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Subrata Kumar Biswas;Bashima Islam", "authorids": "~Subrata_Kumar_Biswas1;~Bashima_Islam1", "gender": "M;F", "homepage": "https://users.wpi.edu/~sbiswas/;https://users.wpi.edu/~bislam/", "dblp": ";188/6243", "google_scholar": "xuMQYBgAAAAJ;SxAZLx8AAAAJ", "orcid": "0000-0002-2670-0115;", "linkedin": "subrata-biswas-433247142/;bashimaislam", "or_profile": "~Subrata_Kumar_Biswas1;~Bashima_Islam1", "aff": "Meta Facebook;Worcester Polytechnic Institute", "aff_domain": "meta.com;wpi.edu", "position": "Intern;Assistant Professor", "bibtex": "@misc{\nbiswas2024infonet,\ntitle={InfoNet: Missing Information Retrieval in Multi-Stream Sensing Systems},\nauthor={Subrata Kumar Biswas and Bashima Islam},\nyear={2024},\nurl={https://openreview.net/forum?id=0074qaufB6}\n}", "github": "", "project": "", "reviewers": "fMm6;tZQw;9qjF", "site": "https://openreview.net/forum?id=0074qaufB6", "pdf_size": 4860378, "rating": "1;3;5", "confidence": "4;3;4", "soundness": "2;3;2", "contribution": "1;2;2", "presentation": "2;2;3", "wc_summary": "97;80;124", "wc_strengths": "49;53;168", "wc_weaknesses": "350;172;196", "wc_questions": "48;41;182", "wc_review": "544;346;670", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 3.0, 1.632993161855452 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 1.6666666666666667, 0.4714045207910317 ], "presentation_avg": [ 2.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 100.33333333333333, 18.116904322268255 ], "wc_strengths_avg": [ 90.0, 55.17849822772152 ], "wc_weaknesses_avg": [ 239.33333333333334, 78.86415887813396 ], "wc_questions_avg": [ 90.33333333333333, 64.88108781112996 ], "wc_review_avg": [ 520.0, 133.3566646253572 ], "wc_reply_reviewers_avg": [ 0, 0 ], 
"wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 3, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:Ao_75FN8juAJ:scholar.google.com/&scioq=InfoNet:+Missing+Information+Retrieval+in+Multi-Stream+Sensing+Systems&hl=en&as_sdt=0,31", "gs_version_total": 0, "aff_unique_index": "0;1", "aff_unique_norm": "Meta;Worcester Polytechnic Institute", "aff_unique_dep": "Meta Platforms, Inc.;", "aff_unique_url": "https://meta.com;https://www.wpi.edu", "aff_unique_abbr": "Meta;WPI", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "id": "014CgNPAGy", "title": "On the Role of Momentum in the Implicit Bias of Gradient Descent for Diagonal Linear Networks", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Momentum is a widely adopted and crucial modification to gradient descent when training modern deep neural networks. In this paper, we target on the regularization effect of momentum-based methods in regression settings and analyze a popular proxy model, diagonal linear networks, to precisely characterize the implicit bias of heavy-ball (HB) and Nesterov's method of accelerated gradients (NAG). We show that, HB and NAG exhibit different implicit bias compared to GD for diagonal linear networks, which is different from the one for classic linear regression problem where momentum-based methods share the same implicit bias with GD. Specifically, the role of momentum in the implicit bias of GD is twofold. On one hand, HB and NAG induce extra initialization mitigation effects similar to SGD that are beneficial for generalization of sparse regression. On the other hand, besides the initialization of parameters, the implicit regularization effects of HB and NAG also depend on the initialization of gradients explicitly, which may not be benign for generalization. As a consequence, whether HB and NAG have better generalization properties than GD jointly depends on the aforementioned twofold effects determined by various parameters such as learning rate, momentum factor, data matrix, and integral of gradients. Particularly, the difference between the implicit bias of GD and that of HB and NAG disappears for small learning rate. 
Our findings highlight the potential beneficial role of momentum and can help understand its advantages in practice from the perspective of generalization.", "keywords": "GD;momentum;implicit bias;linear networks", "primary_area": "optimization", "supplementary_material": "", "author": "Bochen Lyu;Zhanxing Zhu", "authorids": "~Bochen_Lyu1;~Zhanxing_Zhu1", "gender": ";M", "homepage": ";https://zhanxingzhu.github.io/", "dblp": ";87/7756.html", "google_scholar": ";a2sHceIAAAAJ", "orcid": ";", "linkedin": ";", "or_profile": "~Bochen_Lyu1;~Zhanxing_Zhu1", "aff": ";University of Southampton", "aff_domain": ";soton.ac.uk", "position": ";Associate Professor", "bibtex": "@misc{\nanonymous2024on,\ntitle={On the Role of Momentum in the Implicit Bias of Gradient Descent for Diagonal Linear Networks},\nauthor={Anonymous},\nyear={2024},\nurl={https://openreview.net/forum?id=014CgNPAGy}\n}", "github": "", "project": "", "reviewers": "oaZ7;YbMr;vt7i;wNfT", "site": "https://openreview.net/forum?id=014CgNPAGy", "pdf_size": 537004, "rating": "3;5;5;6", "confidence": "4;5;4;3", "soundness": "1;1;3;3", "contribution": "1;1;2;3", "presentation": "2;3;3;3", "wc_summary": "47;156;94;104", "wc_strengths": "31;8;15;95", "wc_weaknesses": "219;937;242;65", "wc_questions": "6;53;5;6", "wc_review": "303;1154;356;270", "wc_reply_reviewers": "198;899;68;10", "wc_reply_authors": "514;2139;1249;161", "reply_reviewers": "1;2;1;1", "reply_authors": "1;4;3;1", "rating_avg": [ 4.75, 1.0897247358851685 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.0, 1.0 ], "contribution_avg": [ 1.75, 0.82915619758885 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 100.25, 38.71934271136327 ], "wc_strengths_avg": [ 37.25, 34.368408458932166 ], "wc_weaknesses_avg": [ 365.75, 336.7590941607962 ], "wc_questions_avg": [ 17.5, 20.5 ], "wc_review_avg": [ 520.75, 366.8919289109533 ], "wc_reply_reviewers_avg": [ 293.75, 356.01009466024976 ], "wc_reply_authors_avg": [ 1015.75, 758.0314554818949 ], "reply_reviewers_avg": [ 1.25, 0.4330127018922193 ], "reply_authors_avg": [ 2.25, 1.299038105676658 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.3244428422615251, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:G_DlNajnXBEJ:scholar.google.com/&scioq=On+the+Role+of+Momentum+in+the+Implicit+Bias+of+Gradient+Descent+for+Diagonal+Linear+Networks&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0", "aff_unique_norm": "University of Southampton", "aff_unique_dep": "", "aff_unique_url": "https://www.southampton.ac.uk", "aff_unique_abbr": "Southampton", "aff_country_unique_index": "0", "aff_country_unique": "United Kingdom" }, { "id": "01Yi8rzoNs", "title": "Visual Chain of Thought: Bridging Logical Gaps with Multimodal Infillings", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Recent advances in large language models elicit reasoning in a chain-of-thought that allows models to decompose problems in a human-like fashion. Though this paradigm improves multi-step reasoning ability in language models, it is limited by being unimodal and applied mainly to question-answering tasks. We claim that incorporating visual augmentation into reasoning is essential, especially for complex, imaginative tasks. Consequently, we introduce VCoT, a novel method that leverages chain-of-thought prompting with vision-language grounding to recursively bridge the logical gaps within sequential data. 
Our method uses visual guidance to generate synthetic multimodal infillings that add consistent and novel information to reduce the logical gaps for downstream tasks that can benefit from temporal reasoning, as well as provide interpretability into models' multi-step reasoning. We apply VCoT to the Visual Storytelling and WikiHow summarization datasets and demonstrate through human evaluation that VCoT offers novel and consistent synthetic data augmentation beating chain-of-thought baselines, which can be used to enhance downstream performance.", "keywords": "chain of thought;vision and language;large language models;reasoning", "primary_area": "generative models", "supplementary_material": "", "author": "Daniel Philip Rose;Vaishnavi Himakunthala;Andy Ouyang;Ryan He;Alex Mei;Yujie Lu;Michael Saxon;Chinmay Sonar;Diba Mirza;William Yang Wang", "authorids": "~Daniel_Philip_Rose1;~Vaishnavi_Himakunthala1;~Andy_Ouyang1;~Ryan_He1;~Alex_Mei1;~Yujie_Lu1;~Michael_Saxon1;~Chinmay_Sonar1;~Diba_Mirza1;~William_Yang_Wang2", "gender": "M;F;M;;;;M;M;F;M", "homepage": ";;;;http://sites.cs.ucsb.edu/~alexmei/;https://yujielu10.github.io/;https://saxon.me;https://chinmaysonar.github.io/;https://sites.cs.ucsb.edu/~dimirza/;https://www.cs.ucsb.edu/~william/", "dblp": ";;;;;;222/6656;207/0890;;08/9282", "google_scholar": ";;;;GOrfNGAAAAAJ;pcmr6GMAAAAJ;pAlwjdgAAAAJ;-6Rg0WcAAAAJ;https://scholar.google.com/citations?hl=en;gf8Ms_8AAAAJ", "orcid": ";;;;;;;;;", "linkedin": "danny-rose-2075651a7/;vaishnavihimakunthala/;andy--ouyang/;ryanhe02/;alexmeigz/;;;;diba-mirza-b3150914b/;", "or_profile": "~Daniel_Philip_Rose1;~Vaishnavi_Himakunthala1;~Andy_Ouyang1;~Ryan_He1;~Alex_Mei1;~Yujie_Lu1;~Michael_Saxon1;~Chinmay_Sonar1;~Diba_Mirza1;~William_Wang1", "aff": ", University of California, Santa Barbara;, University of California, Santa Barbara;University of California, Santa Barbara;University of California, Santa Barbara;;UC Santa Barbara;Advanced Micro Devices;University of California, Santa Barbara;University of California, Santa Barbara;UC Santa Barbara", "aff_domain": "cs.ucsb.edu;cs.ucsb.edu;ucsb.edu;ucsb.edu;;ucsb.edu;amd.com;ucsb.edu;ucsb.edu;ucsb.edu", "position": "Undergrad student;Undergrad student;Undergrad student;Intern;;PhD student;Intern;PhD student;Associate Professor;Full Professor", "bibtex": "@misc{\nrose2024visual,\ntitle={Visual Chain of Thought: Bridging Logical Gaps with Multimodal Infillings},\nauthor={Daniel Philip Rose and Vaishnavi Himakunthala and Andy Ouyang and Ryan He and Alex Mei and Yujie Lu and Michael Saxon and Chinmay Sonar and Diba Mirza and William Yang Wang},\nyear={2024},\nurl={https://openreview.net/forum?id=01Yi8rzoNs}\n}", "github": "", "project": "", "reviewers": "E16R;a5oz;dqPG;BRKH", "site": "https://openreview.net/forum?id=01Yi8rzoNs", "pdf_size": 6739734, "rating": "3;3;5;6", "confidence": "4;4;4;4", "soundness": "2;2;2;3", "contribution": "2;2;2;3", "presentation": "2;3;2;3", "wc_summary": "136;55;76;74", "wc_strengths": "27;31;117;55", "wc_weaknesses": "285;261;411;235", "wc_questions": "4;21;109;52", "wc_review": "452;368;713;416", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.25, 1.299038105676658 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 85.25, 30.425112982534674 ], "wc_strengths_avg": [ 57.5, 35.98263470064414 ], "wc_weaknesses_avg": [ 
298.0, 67.59437846448475 ], "wc_questions_avg": [ 46.5, 39.978119015281344 ], "wc_review_avg": [ 487.25, 133.69999065071022 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 10, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 18, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=4674612661234009738&as_sdt=80005&sciodt=0,11&hl=en", "gs_version_total": 3, "aff_unique_index": "0;0;0;0;0;1;0;0;0", "aff_unique_norm": "University of California, Santa Barbara;Advanced Micro Devices, Inc.", "aff_unique_dep": ";", "aff_unique_url": "https://www.ucsb.edu;https://www.amd.com", "aff_unique_abbr": "UCSB;AMD", "aff_campus_unique_index": "0;0;0;0;0;0;0;0", "aff_campus_unique": "Santa Barbara;", "aff_country_unique_index": "0;0;0;0;0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "01ep65umEr", "title": "TeLLMe what you see: Using LLMs to Explain Neurons in Vision Models", "track": "main", "status": "Reject", "tldr": "", "abstract": "As the role of machine learning models continues to expand across diverse fields, the demand for model interpretability grows. This is particularly crucial for deep learning models, which are often referred to as black boxes, due to their highly nonlinear nature. This paper proposes a novel method for generating and evaluating concise explanations for the behavior of specific neurons in trained vision models. Doing so signifies an important step towards better understanding the decision making in neural networks. Our technique draws inspiration from a recently published framework that utilized GPT-4 for interpretability of language models. Here, we extend and expand the method to vision models, offering interpretations based on both neuron activations and weights in the network. We illustrate our approach using an AlexNet model and ViT trained on ImageNet, generating clear, human-readable explanations. Our method outperforms the current state-of-the-art in both quantitative and qualitative assessments, while also demonstrating superior capacity in capturing polysemic neuron behavior. The findings hold promise for enhancing transparency, trust and understanding in the deployment of deep learning vision models across various domains. 
The relevant code can be found in our GitHub repository.", "keywords": "Explainable AI;Explaining Neurons in Vision Models", "primary_area": "visualization or interpretation of learned representations", "supplementary_material": "", "author": "Leon Guertler;M Ganesh Kumar;Anh Tuan Luu;Cheston Tan", "authorids": "~Leon_Guertler1;~M_Ganesh_Kumar1;~Anh_Tuan_Luu2;~Cheston_Tan1", "gender": "M;M;M;M", "homepage": ";https://mgkumar138.github.io/;https://tuanluu.github.io/;", "dblp": ";230/0379;81/8329.html;136/9366", "google_scholar": ";sFfy1q4AAAAJ;https://scholar.google.com.sg/citations?hl=en;Up0UYEYAAAAJ", "orcid": ";0000-0001-5559-6428;;", "linkedin": "leon-gurtler-6b3847165/;m-ganesh-kumar-28682792/;;cheston-tan/", "or_profile": "~Leon_Guertler1;~M_Ganesh_Kumar1;~Anh_Tuan_Luu2;~Cheston_Tan1", "aff": "Nanyang Technological University;Harvard University;Nanyang Technological University;Singapore University of Technology and Design", "aff_domain": "ntu.edu.sg;harvard.edu;ntu.edu.sg;sutd.edu.sg", "position": "Undergrad student;Postdoc;Assistant Professor;Assistant Professor", "bibtex": "@misc{\nguertler2024tellme,\ntitle={Te{LLM}e what you see: Using {LLM}s to Explain Neurons in Vision Models},\nauthor={Leon Guertler and M Ganesh Kumar and Anh Tuan Luu and Cheston Tan},\nyear={2024},\nurl={https://openreview.net/forum?id=01ep65umEr}\n}", "github": "", "project": "", "reviewers": "1NcR;KpfM;xVYG;NqpP", "site": "https://openreview.net/forum?id=01ep65umEr", "pdf_size": 4504693, "rating": "5;5;5;6", "confidence": "3;4;3;5", "soundness": "2;3;2;2", "contribution": "2;3;2;3", "presentation": "2;3;2;3", "wc_summary": "96;37;46;90", "wc_strengths": "104;13;59;51", "wc_weaknesses": "196;184;86;250", "wc_questions": "1;4;98;6", "wc_review": "397;238;289;397", "wc_reply_reviewers": "0;0;0;86", "wc_reply_authors": "499;672;771;668", "reply_reviewers": "0;0;0;1", "reply_authors": "1;1;1;1", "rating_avg": [ 5.25, 0.4330127018922193 ], "confidence_avg": [ 3.75, 0.82915619758885 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 67.25, 26.03243169586737 ], "wc_strengths_avg": [ 56.75, 32.34482184214345 ], "wc_weaknesses_avg": [ 179.0, 59.16924876994806 ], "wc_questions_avg": [ 27.25, 40.88627520330019 ], "wc_review_avg": [ 330.25, 69.14251586397475 ], "wc_reply_reviewers_avg": [ 21.5, 37.239092362730865 ], "wc_reply_authors_avg": [ 652.5, 97.75607398008576 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.8703882797784891, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:0-7pBnGKwxQJ:scholar.google.com/&scioq=TeLLMe+what+you+see:+Using+LLMs+to+Explain+Neurons+in+Vision+Models&hl=en&as_sdt=0,33", "gs_version_total": 2, "aff_unique_index": "0;1;0;2", "aff_unique_norm": "Nanyang Technological University;Harvard University;Singapore University of Technology and Design", "aff_unique_dep": ";;", "aff_unique_url": "https://www.ntu.edu.sg;https://www.harvard.edu;https://www.sutd.edu.sg", "aff_unique_abbr": "NTU;Harvard;SUTD", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;0;0", "aff_country_unique": "Singapore;United States" }, { "id": "02Ug9N8DCI", "title": "GateLoop: Fully Data-Controlled Linear Recurrence for Sequence Modeling", "track": "main", "status": "Reject", "tldr": "", "abstract": "Linear Recurrence has proven to be a powerful 
tool for modeling long sequences efficiently. In this work, we show that existing models fail to take full advantage of its potential. Motivated by this finding, we develop GateLoop, a foundational sequence model that generalizes linear recurrent models such as S4, S5, LRU and RetNet, by employing data-controlled state transitions. \nUtilizing this theoretical advance, GateLoop empirically outperforms existing models for auto-regressive language modeling. Our method comes with a low-cost $O(l)$ recurrent mode and an efficient $O(l \\log_{2} l)$ parallel mode making use of highly optimized associative scan implementations. Furthermore, we derive an $O(l^2)$ surrogate-attention mode, revealing remarkable implications for Transformer and recently proposed architectures. \nSpecifically, we prove that our approach can be interpreted as providing data-controlled relative-positional information to Attention. \nWhile many existing models solely rely on data-controlled cumulative sums for context aggregation, our findings suggest that incorporating data-controlled complex cumulative products may be a crucial step towards more powerful sequence models.", "keywords": "Data-controlled;Linear Recurrence;Sequence Modeling;GateLoop;Linear;RNN;State Space Model;SSM;S4;S5;LRU;RetNet;generalization", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Tobias Katsch", "authorids": "~Tobias_Katsch1", "gender": "M", "homepage": "https://github.com/tobiaskatsch", "dblp": "", "google_scholar": "", "orcid": "", "linkedin": "", "or_profile": "~Tobias_Katsch1", "aff": "", "aff_domain": "", "position": "", "bibtex": "@misc{\nkatsch2024gateloop,\ntitle={GateLoop: Fully Data-Controlled Linear Recurrence for Sequence Modeling},\nauthor={Tobias Katsch},\nyear={2024},\nurl={https://openreview.net/forum?id=02Ug9N8DCI}\n}", "github": "", "project": "", "reviewers": "kCvT;BbYv;3RS5;gLYa", "site": "https://openreview.net/forum?id=02Ug9N8DCI", "pdf_size": 7626103, "rating": "3;3;3;5", "confidence": "4;4;4;5", "soundness": "2;1;1;3", "contribution": "1;2;3;2", "presentation": "2;2;2;2", "wc_summary": "110;38;40;104", "wc_strengths": "72;15;38;94", "wc_weaknesses": "275;9;167;159", "wc_questions": "2;310;33;278", "wc_review": "459;372;278;635", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 3.5, 0.8660254037844386 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 1.75, 0.82915619758885 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 2.0, 0.0 ], "wc_summary_avg": [ 73.0, 34.07345007480164 ], "wc_strengths_avg": [ 54.75, 30.408674749156695 ], "wc_weaknesses_avg": [ 152.5, 94.67180150393253 ], "wc_questions_avg": [ 155.75, 139.1444842600669 ], "wc_review_avg": [ 436.0, 131.51996046228115 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 6, 0 ], "authors#_avg": [ 1, 0 ], "corr_rating_confidence": 1.0, "gs_citation": 22, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12199180100342829511&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3 }, { "title": "Hybrid LLM: Cost-Efficient and Quality-Aware Query Routing", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19625", "id": "02f3mUtqnM", "author_site": "Dujian Ding, Ankur Mallick, Chi Wang, Robert Sim, 
Subhabrata Mukherjee, Victor R\u00fchle, Laks Lakshmanan, Ahmed H Awadallah", "tldr": "", "abstract": "Large language models (LLMs) excel in most NLP tasks but also require expensive cloud servers for deployment due to their size, while smaller models that can be deployed on lower cost (e.g., edge) devices, tend to lag behind in terms of response quality. Therefore in this work we propose a hybrid inference approach which combines their respective strengths to save cost and maintain quality. Our approach uses a router that assigns queries to the small or large model based on the predicted query difficulty and the desired quality level. The desired quality level can be tuned dynamically at test time to seamlessly trade quality for cost as per the scenario requirements. In experiments our approach allows us to make up to 40% fewer calls to the large model, with no drop in response quality.", "keywords": "Large language models;Efficient ML;Query Routing", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Dujian Ding;Ankur Mallick;Chi Wang;Robert Sim;Subhabrata Mukherjee;Victor R\u00fchle;Laks V. S. Lakshmanan;Ahmed Hassan Awadallah", "authorids": "~Dujian_Ding1;~Ankur_Mallick1;~Chi_Wang3;~Robert_Sim1;~Subhabrata_Mukherjee2;~Victor_R\u00fchle1;~Laks_V._S._Lakshmanan1;~Ahmed_Hassan_Awadallah1", "gender": ";M;M;M;;;M;M", "homepage": ";https://ankurmallick.github.io/;http://chiwang.cc;;https://subhomukherjee.com/;https://www.cs.ubc.ca/~laks;https://www.microsoft.com/en-us/research/people/hassanam/publications/;https://www.microsoft.com/en-us/research/people/virueh/", "dblp": "244/8792;180/2636;09/404-1;47/1233;37/11030.html;l/LVSLakshmanan;147/9148;277/8100", "google_scholar": "https://scholar.google.ca/citations?user=1-FsZPQAAAAJ;6SYGK8cAAAAJ;https://scholar.google.com/citations?hl=en;uT8sPt8AAAAJ;T4iBN5cAAAAJ;https://scholar.google.ca/citations?user=_RCsaOsAAAAJ;sNGk-9MAAAAJ;", "orcid": ";;;;;0000-0002-9775-4241;;0000-0002-8957-7628", "linkedin": "dujian-ding-250123133/;ankurmallick/;chi-wang-autogen/;simra/;subho87;laksvslakshmanan/;ahmed-hassan-awadallah-a355a27/;victor-r%C3%BChle-bb752195", "or_profile": "~Dujian_Ding1;~Ankur_Mallick1;~Chi_Wang3;~Robert_Sim1;~Subhabrata_Mukherjee2;~Laks_V._S._Lakshmanan1;~Ahmed_Hassan_Awadallah1;~Victor_Ruehle1", "aff": "Computing Science, University of British Columbia;Microsoft;Microsoft Research;Microsoft;Hippocratic AI;University of British Columbia;Microsoft Research;Microsoft", "aff_domain": "cs.ubc.ca;microsoft.com;microsoft.com;microsoft.com;hippocraticai.com;ubc.ca;microsoft.com;microsoft.com", "position": "PhD student;Researcher;Principal Researcher;Principal Researcher;Chief Scientist;Professor;Principal Researcher;Principal Researcher", "bibtex": "@inproceedings{\nding2024hybrid,\ntitle={Hybrid {LLM}: Cost-Efficient and Quality-Aware Query Routing},\nauthor={Dujian Ding and Ankur Mallick and Chi Wang and Robert Sim and Subhabrata Mukherjee and Victor R{\\\"u}hle and Laks V. S. 
Lakshmanan and Ahmed Hassan Awadallah},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=02f3mUtqnM}\n}", "github": "", "project": "", "reviewers": "uyT6;ZnPu;VA7E;9pHQ", "pdf_size": 4420090, "rating": "3;6;6;8", "confidence": "4;2;2;5", "soundness": "2;2;3;4", "contribution": "2;2;2;3", "presentation": "2;3;3;4", "wc_summary": "85;94;101;59", "wc_strengths": "47;62;136;51", "wc_weaknesses": "189;73;64;39", "wc_questions": "4;34;30;64", "wc_review": "325;263;331;213", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "1426;539;953;814", "reply_reviewers": "0;0;0;0", "reply_authors": "3;2;2;2", "rating_avg": [ 5.75, 1.7853571071357126 ], "confidence_avg": [ 3.25, 1.299038105676658 ], "soundness_avg": [ 2.75, 0.82915619758885 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 84.75, 15.911866640969563 ], "wc_strengths_avg": [ 74.0, 36.21463792446364 ], "wc_weaknesses_avg": [ 91.25, 57.79435526069999 ], "wc_questions_avg": [ 33.0, 21.283796653792763 ], "wc_review_avg": [ 283.0, 48.394214530251446 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 933.0, 321.2654665537521 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 2.25, 0.4330127018922193 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": 0.13474201390907387, "gs_citation": 80, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14692033895568743922&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=02f3mUtqnM", "pdf": "https://openreview.net/pdf?id=02f3mUtqnM", "email": "cs.ubc.ca;microsoft.com;microsoft.com;microsoft.com;hippocraticai.com;ubc.ca;microsoft.com;microsoft.com", "author_num": 8, "aff_unique_index": "0;1;1;1;2;0;1;1", "aff_unique_norm": "University of British Columbia;Microsoft;Hippocratic AI", "aff_unique_dep": "Department of Computing Science;Microsoft Corporation;", "aff_unique_url": "https://www.ubc.ca;https://www.microsoft.com;https://www.hippocratic.ai", "aff_unique_abbr": "UBC;Microsoft;Hippocratic AI", "aff_campus_unique_index": "0", "aff_campus_unique": "Vancouver;", "aff_country_unique_index": "0;1;1;1;1;0;1;1", "aff_country_unique": "Canada;United States" }, { "id": "030cjlZm4a", "title": "Learning Predictive Checklists with Probabilistic Logic Programming", "track": "main", "status": "Reject", "tldr": "", "abstract": "Checklists have been widely recognized as effective tools for completing complex tasks in a systematic manner. Although originally intended for use in procedural tasks, their interpretability and ease of use have led to their adoption for predictive tasks as well, including in clinical settings. However, designing checklists can be challenging, often requiring expert knowledge and manual rule design based on available data. Recent work has attempted to address this issue by using machine learning to automatically generate predictive checklists from data, although these approaches have been limited to Boolean data. We propose a novel method for learning predictive checklists from diverse data modalities, such as images, time series, and text, by combining the power of dedicated deep learning architectures with the interpretability and conciseness of checklists. Our approach relies on probabilistic logic programming, a learning paradigm that enables matching the discrete nature of a checklist with continuous-valued data. 
We propose a regularization technique to tradeoff between the information captured in discrete concepts of continuous data and permit a tunable level of interpretability for the learned checklist concepts. We demonstrate that our method outperforms various explainable machine learning techniques on prediction tasks involving image sequences, clinical notes, and time series.", "keywords": "Predictive Checklists;Interpretability;Fairness;Probabilistic Logic Programming", "primary_area": "neurosymbolic & hybrid AI systems (physics-informed, logic & formal reasoning, etc.)", "supplementary_material": "/attachment/4a671c91b008d335242a0a7a33b2ee48de06144b.pdf", "author": "Yukti Makhija;Edward De Brouwer;Rahul G Krishnan", "authorids": "~Yukti_Makhija1;~Edward_De_Brouwer1;~Rahul_G_Krishnan1", "gender": ";M;M", "homepage": ";https://edwarddebrouwer.xyz;http://www.cs.toronto.edu/~rahulgk/index.html", "dblp": ";;172/0880", "google_scholar": ";-Pm4XtAAAAAJ;ilJgXHkAAAAJ", "orcid": ";;", "linkedin": ";edwarddebrouwer/;rahulgk/", "or_profile": "~Yukti_Makhija1;~Edward_De_Brouwer1;~Rahul_G_Krishnan1", "aff": ";Yale University;Department of Computer Science, University of Toronto", "aff_domain": ";yale.edu;cs.toronto.edu", "position": ";Postdoc;Assistant Professor", "bibtex": "@misc{\nmakhija2024learning,\ntitle={Learning Predictive Checklists with Probabilistic Logic Programming},\nauthor={Yukti Makhija and Edward De Brouwer and Rahul G Krishnan},\nyear={2024},\nurl={https://openreview.net/forum?id=030cjlZm4a}\n}", "github": "", "project": "", "reviewers": "Ucnh;eMqU;SxKf", "site": "https://openreview.net/forum?id=030cjlZm4a", "pdf_size": 1262744, "rating": "3;6;8", "confidence": "4;4;4", "soundness": "2;2;3", "contribution": "2;2;3", "presentation": "2;2;2", "wc_summary": "34;225;54", "wc_strengths": "51;88;37", "wc_weaknesses": "223;172;861", "wc_questions": "65;28;213", "wc_review": "373;513;1165", "wc_reply_reviewers": "0;40;93", "wc_reply_authors": "636;1034;2045", "reply_reviewers": "0;1;1", "reply_authors": "2;3;3", "rating_avg": [ 5.666666666666667, 2.0548046676563256 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.0, 0.0 ], "wc_summary_avg": [ 104.33333333333333, 85.71399470850072 ], "wc_strengths_avg": [ 58.666666666666664, 21.514852750806565 ], "wc_weaknesses_avg": [ 418.6666666666667, 313.4691195140103 ], "wc_questions_avg": [ 102.0, 79.92913528036361 ], "wc_review_avg": [ 683.6666666666666, 345.11962499335726 ], "wc_reply_reviewers_avg": [ 44.333333333333336, 38.09053542402481 ], "wc_reply_authors_avg": [ 1238.3333333333333, 593.0903997049878 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 2.6666666666666665, 0.4714045207910317 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:UK5bP4Z4SfgJ:scholar.google.com/&scioq=Learning+Predictive+Checklists+with+Probabilistic+Logic+Programming&hl=en&as_sdt=0,44", "gs_version_total": 3, "aff_unique_index": "0;1", "aff_unique_norm": "Yale University;University of Toronto", "aff_unique_dep": ";Department of Computer Science", "aff_unique_url": "https://www.yale.edu;https://www.utoronto.ca", "aff_unique_abbr": "Yale;U of T", "aff_campus_unique_index": "1", "aff_campus_unique": ";Toronto", "aff_country_unique_index": "0;1", "aff_country_unique": "United 
States;Canada" }, { "id": "04ARmqba4z", "title": "Adaptive Multi-head Contrastive Learning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "In contrastive learning, two views of an original image generated by different augmentations are considered as a positive pair whose similarity is required to be high. Moreover, two views of two different images are considered as a negative pair, and their similarity is encouraged to be low. Normally, a single similarity measure given by a single projection head is used to evaluate positive and negative sample pairs, respectively. However, due to the various augmentation strategies and varying intra-sample similarity, augmented views from the same image are often not similar. Moreover, due to inter-sample similarity, augmented views of two different images may be more similar than augmented views from the same image. As such, enforcing a high similarity for positive pairs and a low similarity for negative pairs may not always be achievable, and in the case of some pairs, forcing so may be detrimental to the performance. To address this issue, we propose to use multiple projection heads, each producing a separate set of features. Our loss function for pre-training emerges from a solution to the maximum likelihood estimation over head-wise posterior distributions of positive samples given observations. The loss contains the similarity measure over positive and negative pairs, each re-weighted by an individual adaptive temperature that is regularized to prevent ill solutions. Our adaptive multi-head contrastive learning (AMCL) can be applied to and experimentally improves several popular contrastive learning methods such as SimCLR, MoCo and Barlow Twins. Such improvement is consistent under various backbones and linear probing epoches and is more significant when multiple augmentation methods are used.", "keywords": "adaptive temperature;contrastive learning", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Lei Wang;Piotr Koniusz;Tom Gedeon;Liang Zheng", "authorids": "~Lei_Wang20;~Piotr_Koniusz1;~Tom_Gedeon1;~Liang_Zheng4", "gender": "M;;M;M", "homepage": "https://leiwangr.github.io/;https://www.koniusz.com;https://cs.anu.edu.au/people/Tom.Gedeon/;http://zheng-lab.cecs.anu.edu.au/", "dblp": "181/2817-108;25/8616;g/TamasDGedeon.html;61/7360-1", "google_scholar": "VWCZLXgAAAAJ;https://scholar.google.co.uk/citations?user=wZ7-1tUAAAAJ;https://scholar.google.com.tw/citations?user=lPTjWIkAAAAJ;https://scholar.google.com.au/citations?user=vNHqr3oAAAAJ", "orcid": "0000-0002-8600-7099;0000-0002-6340-5289;0000-0001-8356-4909;", "linkedin": "lei-l-wang/;;tom-gedeon;liang-zheng-76341311a/", "or_profile": "~Lei_Wang20;~Piotr_Koniusz1;~Tom_Gedeon1;~Liang_Zheng4", "aff": "Australian National University;Data61, CSIRO;Curtin University of Technology;Australian National University", "aff_domain": "anu.edu.au;data61.csiro.au;curtin.edu.au;anu.edu.au", "position": "Postdoc;Principal Researcher;Full Professor;Associate Professor", "bibtex": "@misc{\nwang2024adaptive,\ntitle={Adaptive Multi-head Contrastive Learning},\nauthor={Lei Wang and Piotr Koniusz and Tom Gedeon and Liang Zheng},\nyear={2024},\nurl={https://openreview.net/forum?id=04ARmqba4z}\n}", "github": "", "project": "", "reviewers": "HgQy;pd1e;YrZy", "site": "https://openreview.net/forum?id=04ARmqba4z", "pdf_size": 2912051, "rating": "3;3;5", "confidence": "4;4;4", "soundness": "2;2;3", "contribution": "2;2;3", "presentation": "2;1;3", 
"wc_summary": "16;68;94", "wc_strengths": "25;44;31", "wc_weaknesses": "154;249;159", "wc_questions": "12;108;5", "wc_review": "207;469;289", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 3.6666666666666665, 0.9428090415820634 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.0, 0.816496580927726 ], "wc_summary_avg": [ 59.333333333333336, 32.42769735204082 ], "wc_strengths_avg": [ 33.333333333333336, 7.93025150224688 ], "wc_weaknesses_avg": [ 187.33333333333334, 43.65266951236265 ], "wc_questions_avg": [ 41.666666666666664, 46.99172503986444 ], "wc_review_avg": [ 321.6666666666667, 109.42678932611621 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 3, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 5, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11122893215011527354&as_sdt=5,47&sciodt=0,47&hl=en", "gs_version_total": 9, "aff_unique_index": "0;1;2;0", "aff_unique_norm": "Australian National University;CSIRO;Curtin University", "aff_unique_dep": ";Data61;", "aff_unique_url": "https://www.anu.edu.au;https://www.csiro.au;https://www.curtin.edu.au", "aff_unique_abbr": "ANU;CSIRO;Curtin", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "Australia" }, { "id": "04UvXg4CvW", "title": "EPIC: Compressing Deep GNNs via Expressive Power Gap-Induced Knowledge Distillation", "track": "main", "status": "Reject", "tldr": "", "abstract": "The teacher-student paradigm-based knowledge distillation (KD) has recently emerged as a promising technique for compressing graph neural networks (GNNs). Despite the great success in compressing moderate-sized GNNs, distilling deep GNNs (e.g., with over 100 layers) remains a tough challenge. A widely recognized reason is the *teacher-student expressive power gap*, i.e., the embeddings of a deep teacher may be extremely hard for a shallow student to approximate. Besides, the theoretical analysis and measurement of this gap are currently missing, resulting in a difficult trade-off between the needs of being \"lightweight'' and being \"expressive'' when selecting a student for the deep teacher. To bridge the theoretical gap and address the challenge of distilling deep GNNs, we propose the *first* GNN KD framework that quantitatively analyzes the teacher-student expressive power gap, namely **E**xpressive **P**ower gap-**I**ndu**C**ed knowledge distillation (**EPIC**). Our key idea is to formulate the estimation of the expressive power gap as an embedding regression problem based on the theory of polynomial approximation. Then, we show that the minimum approximation error has an upper bound, which decreases rapidly with respect to the number of student layers. Furthermore, we empirically demonstrate that the upper bound exponentially converges to zero as the number of student layers increases. Moreover, we propose to select an appropriate value for the number of student layers based on the upper bound, and propose an expressive power gap-induced loss term to further encourage the student to generate embeddings similar to those of the teacher. 
Experiments on large-scale benchmarks demonstrate that EPIC can effectively reduce the numbers of layers of deep GNNs, while achieving comparable or superior performance. Specifically, for the 1,001-layer RevGNN-Deep, we reduce the number of layers by 94\\% and accelerate inference by roughly eight times, while achieving comparable performance in terms of ROC-AUC on the large-scale benchmark ogbn-proteins.", "keywords": "deep graph neural networks;knowledge distillation;expressive power gap", "primary_area": "learning on graphs and other geometries & topologies", "supplementary_material": "/attachment/75d2e1ed2ecc8c5b690aa40be7552716025b268a.zip", "author": "Xize Liang;Jie Wang;Zhihao Shi;Hanzhu Chen;Bin Li;Feng Wu", "authorids": "~Xize_Liang1;~Jie_Wang1;~Zhihao_Shi3;~Hanzhu_Chen1;~Bin_Li8;~Feng_Wu1", "gender": ";M;M;;M;M", "homepage": ";http://staff.ustc.edu.cn/~jwangx;https://miralab.ai/people/zhihao-shi/;;http://staff.ustc.edu.cn/~binli;", "dblp": ";29/5259-5;;;89/6764-25;25/3972-1", "google_scholar": ";OugG4dUAAAAJ;https://scholar.google.com.hk/citations?user=u2Ffj60AAAAJ;;;5bInRDEAAAAJ", "orcid": ";;;;0000-0002-2332-3959;", "linkedin": ";;;;;", "or_profile": "~Xize_Liang1;~Jie_Wang1;~Zhihao_Shi3;~Hanzhu_Chen1;~Bin_Li8;~Feng_Wu1", "aff": ";University of Science and Technology of China;University of Science and Technology of China;;University of Science and Technology of China;University of Science and Technology of China", "aff_domain": ";ustc.edu.cn;ustc.edu.cn;;ustc.edu.cn;ustc.edu.cn", "position": ";Full Professor;PhD student;;Full Professor;Full Professor", "bibtex": "@misc{\nliang2024epic,\ntitle={{EPIC}: Compressing Deep {GNN}s via Expressive Power Gap-Induced Knowledge Distillation},\nauthor={Xize Liang and Jie Wang and Zhihao Shi and Hanzhu Chen and Bin Li and Feng Wu},\nyear={2024},\nurl={https://openreview.net/forum?id=04UvXg4CvW}\n}", "github": "", "project": "", "reviewers": "G7rf;8ZML;ZSeG", "site": "https://openreview.net/forum?id=04UvXg4CvW", "pdf_size": 0, "rating": "3;5;5", "confidence": "4;4;4", "soundness": "2;3;3", "contribution": "2;2;2", "presentation": "2;3;2", "wc_summary": "49;54;116", "wc_strengths": "20;38;79", "wc_weaknesses": "86;171;433", "wc_questions": "4;19;77", "wc_review": "159;282;705", "wc_reply_reviewers": "0;0;134", "wc_reply_authors": "460;1188;1459", "reply_reviewers": "0;0;1", "reply_authors": "2;3;2", "rating_avg": [ 4.333333333333333, 0.9428090415820634 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 73.0, 30.474032661705056 ], "wc_strengths_avg": [ 45.666666666666664, 24.689178916188272 ], "wc_weaknesses_avg": [ 230.0, 147.67757672262456 ], "wc_questions_avg": [ 33.333333333333336, 31.47838764754143 ], "wc_review_avg": [ 382.0, 233.8503795164763 ], "wc_reply_reviewers_avg": [ 44.666666666666664, 63.168205785998246 ], "wc_reply_authors_avg": [ 1035.6666666666667, 421.8248715073854 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 2.3333333333333335, 0.4714045207910317 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:FTkpozQc7hsJ:scholar.google.com/&scioq=EPIC:+Compressing+Deep+GNNs+via+Expressive+Power+Gap-Induced+Knowledge+Distillation&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;0;0", 
"aff_unique_norm": "University of Science and Technology of China", "aff_unique_dep": "", "aff_unique_url": "http://www.ustc.edu.cn", "aff_unique_abbr": "USTC", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "China" }, { "id": "05gc31KWpz", "title": "DISPEL: Domain Generalization via Domain-Specific Liberating", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Domain generalization aims to learn a generalization model that can perform well on unseen test domains by only training on limited source domains. However, existing domain generalization approaches often bring in prediction-irrelevant noise or require the collection of domain labels. To address these challenges, we consider the domain generalization problem from a different perspective by categorizing the underlying feature groups into domain-shared and domain-specific features. Nevertheless, domain-specific features are difficult to be identified and distinguished from the input data. In this work, we propose $\\underline{\\mathrm{D}}$oma$\\underline{\\mathrm{I}}$n-$\\underline{\\mathrm{SPE}}$cific $\\underline{\\mathrm{L}}$iberating (DISPEL), a post-processing fine-grained masking approach that can filter out undefined and indistinguishable domain-specific features in the embedding space. Specifically, DISPEL utilizes a mask generator that produces a unique mask for each input data to filter domain-specific features. The DISPEL framework is highly flexible to apply to fine-tuned models. We derive a generalization error bound to guarantee the generalization performance by optimizing a designed objective loss. The experimental results on five benchmarks demonstrate that DISPEL outperforms existing methods and can further generalize various algorithms.", "keywords": "Domain Generalization;Transfer Learning", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/2a61e76f56ef1f9c15a426084797e74fe0060d7e.zip", "author": "Chia-Yuan Chang;Yu-Neng Chuang;Guanchu Wang;Samson Zhou;Vladimir Braverman;Mengnan Du;Na Zou", "authorids": "~Chia-Yuan_Chang3;~Yu-Neng_Chuang1;~Guanchu_Wang1;~Samson_Zhou1;~Vladimir_Braverman1;~Mengnan_Du1;~Na_Zou2", "gender": "Not Specified;M;M;;Unspecified;;F", "homepage": "https://z76316.github.io/;;https://guanchuwang.github.io/home;https://samsonzhou.github.io/;http://www.cs.jhu.edu/~vova/;https://mengnandu.com/;https://nzou1.github.io/", "dblp": "03/1382-2.html;207/7875;213/0985;179/2683;14/4758;183/5606;152/0090-1.html", "google_scholar": "EO595aMAAAAJ;;_QL5218AAAAJ;NpjsgocAAAAJ;https://scholar.google.com.tw/citations?user=DTthB48AAAAJ;0i-Js2gAAAAJ;https://scholar.google.com/citations?hl=en", "orcid": "0009-0001-1889-612X;;;;;;0000-0003-1984-795X", "linkedin": "chia-yuan-chang/;ync/;;;;;na-zou-a1721535/", "or_profile": "~Chia-Yuan_Chang3;~Yu-Neng_Chuang1;~Guanchu_Wang1;~Samson_Zhou1;~Vladimir_Braverman1;~Mengnan_Du1;~Na_Zou2", "aff": "Texas A&M University - College Station;Rice University;Rice University;Texas A&M University - College Station;Department of Computer Science, Whiting School of Engineering;New Jersey Institute of Technology;University of Houston", "aff_domain": "tamu.edu;rice.edu;rice.edu;tamu.edu;cs.jhu.edu;njit.edu;uh.edu", "position": "PhD student;PhD student;PhD student;Assistant Professor;Full Professor;Assistant Professor;Assistant Professor", "bibtex": "@misc{\nchang2024dispel,\ntitle={{DISPEL}: Domain Generalization via Domain-Specific 
Liberating},\nauthor={Chia-Yuan Chang and Yu-Neng Chuang and Guanchu Wang and Samson Zhou and Vladimir Braverman and Mengnan Du and Na Zou},\nyear={2024},\nurl={https://openreview.net/forum?id=05gc31KWpz}\n}", "github": "", "project": "", "reviewers": "Mwon;StPi;u3X2;zEDH", "site": "https://openreview.net/forum?id=05gc31KWpz", "pdf_size": 3150064, "rating": "3;3;5;6", "confidence": "5;4;3;4", "soundness": "2;3;2;3", "contribution": "2;2;2;3", "presentation": "3;2;3;3", "wc_summary": "75;51;67;172", "wc_strengths": "40;29;68;75", "wc_weaknesses": "59;43;53;236", "wc_questions": "227;270;242;46", "wc_review": "401;393;430;529", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.25, 1.299038105676658 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 91.25, 47.415055625824166 ], "wc_strengths_avg": [ 53.0, 19.06567596493762 ], "wc_weaknesses_avg": [ 97.75, 80.02304355621573 ], "wc_questions_avg": [ 196.25, 88.10895243957903 ], "wc_review_avg": [ 438.25, 54.172756067972024 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.5443310539518174, "gs_citation": 5, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12868005047063878227&as_sdt=5,31&sciodt=0,31&hl=en", "gs_version_total": 4, "aff_unique_index": "0;1;1;0;2;3;4", "aff_unique_norm": "Texas A&M University;Rice University;Johns Hopkins University;New Jersey Institute of Technology;University of Houston", "aff_unique_dep": ";;Department of Computer Science;;", "aff_unique_url": "https://www.tamu.edu;https://www.rice.edu;https://www.jhu.edu;https://www.njit.edu;https://www.uh.edu", "aff_unique_abbr": "TAMU;Rice;JHU;NJIT;UH", "aff_campus_unique_index": "0;0;2", "aff_campus_unique": "College Station;;Baltimore", "aff_country_unique_index": "0;0;0;0;0;0;0", "aff_country_unique": "United States" }, { "title": "Dropout Enhanced Bilevel Training", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19624", "id": "06lrITXVAx", "author_site": "Peiran Yu, Junyi Li, Heng Huang", "tldr": "", "abstract": "Bilevel optimization problems appear in many widely used machine learning tasks. Bilevel optimization models are sensitive to small changes, and bilevel training tasks typically involve limited datasets. Therefore, overfitting is a common challenge in bilevel training tasks. This paper considers the use of dropout to address this problem. We propose a bilevel optimization model that depends on the distribution of dropout masks. We investigate how the dropout rate affects the hypergradient of this model. We propose a dropout bilevel method to solve the dropout bilevel optimization model. Subsequently, we analyze the resulting dropout bilevel method from an optimization perspective. Analyzing the optimization properties of methods with dropout is essential because it provides convergence guarantees for methods using dropout. However, there has been limited investigation in this research direction. We provide the complexity of the resulting dropout bilevel method in terms of reaching an $\\epsilon$ stationary point of the proposed stochastic bilevel model. 
Empirically, we demonstrate that overfitting occurs in data cleaning problems, and the method proposed in this work mitigates this issue.", "keywords": "Bilevel Optimization;Overfitting", "primary_area": "optimization", "supplementary_material": "/attachment/3f2da4776df25e60924b0709b573e4fe323b121d.pdf", "author": "Peiran Yu;Junyi Li;Heng Huang", "authorids": "~Peiran_Yu1;~Junyi_Li1;~Heng_Huang1", "gender": "F;M;M", "homepage": "https://sites.google.com/view/yupeiran/;;https://www.cs.umd.edu/~heng/", "dblp": "240/3145;;03/281", "google_scholar": "SXJ4R24AAAAJ;MzvZSs0AAAAJ;4OqLaDwAAAAJ", "orcid": ";;", "linkedin": ";;", "or_profile": "~Peiran_Yu1;~Junyi_Li1;~Heng_Huang1", "aff": "University of Maryland;University of Maryland, College Park;Department of Computer Science, University of Maryland, College Park", "aff_domain": "umd.edu;umd.edu;cs.umd.edu", "position": "Postdoc;PhD student;Full Professor", "bibtex": "@inproceedings{\nyu2024dropout,\ntitle={Dropout Enhanced Bilevel Training},\nauthor={Peiran Yu and Junyi Li and Heng Huang},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=06lrITXVAx}\n}", "github": "", "project": "", "reviewers": "mkUf;Kt41;fs9w;hA9j", "pdf_size": 837802, "rating": "6;6;8;8", "confidence": "4;4;3;3", "soundness": "3;3;4;3", "contribution": "2;3;3;3", "presentation": "2;3;4;3", "wc_summary": "50;39;89;80", "wc_strengths": "21;38;79;59", "wc_weaknesses": "158;110;28;108", "wc_questions": "23;80;21;2", "wc_review": "252;267;217;249", "wc_reply_reviewers": "17;153;0;0", "wc_reply_authors": "177;758;20;175", "reply_reviewers": "1;2;0;0", "reply_authors": "2;3;1;1", "rating_avg": [ 7.0, 1.0 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 64.5, 20.62159062730128 ], "wc_strengths_avg": [ 49.25, 21.821720830401986 ], "wc_weaknesses_avg": [ 101.0, 46.65833258915282 ], "wc_questions_avg": [ 31.5, 29.176188921790317 ], "wc_review_avg": [ 246.25, 18.21228980661136 ], "wc_reply_reviewers_avg": [ 42.5, 64.17359269980138 ], "wc_reply_authors_avg": [ 282.5, 281.82130863368013 ], "reply_reviewers_avg": [ 0.75, 0.82915619758885 ], "reply_authors_avg": [ 1.75, 0.82915619758885 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -1.0, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12300902621179201195&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 2, "openreview": "https://openreview.net/forum?id=06lrITXVAx", "pdf": "https://openreview.net/pdf?id=06lrITXVAx", "email": "umd.edu;umd.edu;cs.umd.edu", "author_num": 3, "aff_unique_index": "0;0;1", "aff_unique_norm": "University of Maryland;University of Maryland, College Park", "aff_unique_dep": ";Department of Computer Science", "aff_unique_url": "https://www/umd.edu;https://www/umd.edu", "aff_unique_abbr": "UMD;UMD", "aff_campus_unique_index": "1;1", "aff_campus_unique": ";College Park", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "06mzMua9Rw", "title": "A Trust Region Approach for Few-Shot Sim-to-Real Reinforcement Learning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Simulation-to-Reality Reinforcement Learning (Sim-to-Real RL) seeks to use simulations to minimize the need for extensive real-world interactions. 
Specifically, in the few-shot off-dynamics setting, the goal is to acquire a simulator-based policy despite a dynamics mismatch that can be effectively transferred to the real-world using only a handful of real-world transitions. In this context, conventional RL agents tend to exploit simulation inaccuracies resulting in policies that excel in the simulator but underperform in the real environment. To address this challenge, we introduce a novel approach that incorporates a penalty to constrain the trajectories induced by the simulator-trained policy inspired by recent advances in Imitation Learning and Trust Region based RL algorithms. We evaluate our method across various environments representing diverse Sim-to-Real conditions, where access to the real environment is extremely limited. These experiments include high-dimensional systems relevant to real-world applications. Across most tested scenarios, our proposed method demonstrates performance improvements compared to existing baselines.", "keywords": "Reinforcement Learning;Simulation-to-Reality;Off-Dynamics", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/9c8b8be7e3ad45c2c20a21fa323c539b4a8d5f3f.pdf", "author": "Paul Daoudi;Bogdan Robu;CHRISTOPHE PRIEUR;Ludovic Dos Santos;Merwan Barlier", "authorids": "~Paul_Daoudi2;~Bogdan_Robu1;~CHRISTOPHE_PRIEUR1;~Ludovic_Dos_Santos1;~Merwan_Barlier1", "gender": "M;M;;;M", "homepage": ";http://www.gipsa-lab.fr/~bogdan.robu/;http://www.gipsa-lab.grenoble-inp.fr/~christophe.prieur/index.html;;https://scholar.google.com/citations?user=TNPp0cwAAAAJ", "dblp": "347/7716;74/8134;62/3525;185/0155;167/4759", "google_scholar": ";;https://scholar.google.com/citations?hl=en;;TNPp0cwAAAAJ", "orcid": "0009-0004-2784-952X;0000-0001-7568-007X;0000-0002-4456-2019;;", "linkedin": "paul-daoudi-83101a126/;;;;", "or_profile": "~Paul_Daoudi2;~Bogdan_Robu1;~CHRISTOPHE_PRIEUR1;~Merwan_Barlier1;~Ludovic_DOS_SANTOS3", "aff": "Huawei Technologies Ltd.;;CNRS;Huawei Technologies Ltd.;Criteo AI Lab", "aff_domain": "huawei.com;;cnrs.fr;huawei.com;criteo.com", "position": "PhD student;;Full Professor;Researcher;Researcher", "bibtex": "@misc{\nanonymous2024a,\ntitle={A Trust Region Approach for Few-Shot Sim-to-Real Reinforcement Learning},\nauthor={Anonymous},\nyear={2024},\nurl={https://openreview.net/forum?id=06mzMua9Rw}\n}", "github": "", "project": "", "reviewers": "mwPX;u2wg;iBdd;agZp", "site": "https://openreview.net/forum?id=06mzMua9Rw", "pdf_size": 1354416, "rating": "3;3;5;5", "confidence": "4;3;4;3", "soundness": "2;2;2;3", "contribution": "2;1;2;2", "presentation": "3;2;2;3", "wc_summary": "40;101;121;107", "wc_strengths": "60;30;32;61", "wc_weaknesses": "1028;164;49;220", "wc_questions": "2;33;170;7", "wc_review": "1130;328;372;395", "wc_reply_reviewers": "400;189;56;384", "wc_reply_authors": "983;579;559;760", "reply_reviewers": "2;1;1;1", "reply_authors": "2;2;2;2", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 92.25, 31.027205803939225 ], "wc_strengths_avg": [ 45.75, 14.771171246722448 ], "wc_weaknesses_avg": [ 365.25, 387.5728157391847 ], "wc_questions_avg": [ 53.0, 68.56748500564973 ], "wc_review_avg": [ 556.25, 332.1282696489415 ], "wc_reply_reviewers_avg": [ 257.25, 142.83097528197447 ], "wc_reply_authors_avg": [ 720.25, 170.71229451917046 ], "reply_reviewers_avg": [ 1.25, 0.4330127018922193 ], "reply_authors_avg": 
[ 2.0, 0.0 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=7674579431628756951&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 0, "aff_unique_index": "0;1;0;2", "aff_unique_norm": "Huawei;Centre National de la Recherche Scientifique;Criteo", "aff_unique_dep": "Huawei Technologies;;Criteo AI Lab", "aff_unique_url": "https://www.huawei.com;https://www.cnrs.fr;https://www.criteo.com", "aff_unique_abbr": "Huawei;CNRS;Criteo", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;0;1", "aff_country_unique": "China;France" }, { "id": "070DFUdNh7", "title": "GraphGPT: Graph Learning with Generative Pre-trained Transformers", "track": "main", "status": "Reject", "tldr": "", "abstract": "We introduce GraphGPT, a novel model for Graph learning by self-supervised Generative Pre-training Transformers. Our model transforms each graph or sampled subgraph into a sequence of tokens representing the node, edge and attributes reversibly using the Eulerian path first. Then we feed the tokens into a standard transformer decoder and pre-train it with the next-token-prediction (NTP) task. Lastly, we fine-tune the GraphGPT model with the supervised tasks. This intuitive, yet effective model achieves superior or close results to the state-of-the-art methods for the graph-, edge- and node-level tasks on the large scale molecular dataset PCQM4Mv2, the protein-protein association dataset ogbl-ppa and the ogbn-proteins dataset from the Open Graph Benchmark (OGB). Furthermore, the generative pre-training enables us to train GraphGPT up to 400M+ parameters with consistently increasing performance, which is beyond the capability of GNNs and previous graph transformers. 
The source code and pre-trained checkpoints will be released soon to pave the way for the graph foundation model research, and also to assist the scientific discovery in pharmaceutical, chemistry, material and bio-informatics domains, etc.", "keywords": "Graph;GPT;Generative;Pre-train;Fine-tune;Transformer;GraphGPT", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Qifang Zhao;Weidong Ren;Tianyu Li;Xiaoxiao Xu;Hong Liu", "authorids": "~Qifang_Zhao1;~Weidong_Ren2;~Tianyu_Li2;~Xiaoxiao_Xu1;~Hong_Liu10", "gender": ";M;M;M;M", "homepage": ";;;https://orcid.org/0000-0003-0189-8601;https://c.liepin.com/resume/getdefaultresume/", "dblp": ";https://dblp.org/rec/conf/ijcnn/RenZLH21.html;;;", "google_scholar": ";;bsCWGaEAAAAJ;;", "orcid": ";;;0000-0003-0189-8601;", "linkedin": "zhaoqf123/;;;;", "or_profile": "~Qifang_Zhao1;~Weidong_Ren2;~Tianyu_Li2;~Xiaoxiao_Xu1;~Hong_Liu10", "aff": "Alibaba Group;;Alibaba Group;;", "aff_domain": "alibaba-inc.com;;alibaba-inc.com;;", "position": "Researcher;;Applied Scientist;;", "bibtex": "@misc{\nzhao2024graphgpt,\ntitle={Graph{GPT}: Graph Learning with Generative Pre-trained Transformers},\nauthor={Qifang Zhao and Weidong Ren and Tianyu Li and Xiaoxiao Xu and Hong Liu},\nyear={2024},\nurl={https://openreview.net/forum?id=070DFUdNh7}\n}", "github": "", "project": "", "reviewers": "2YEp;kAz1;VKoy;v4XD", "site": "https://openreview.net/forum?id=070DFUdNh7", "pdf_size": 1885052, "rating": "3;5;5;5", "confidence": "3;4;3;3", "soundness": "2;2;3;3", "contribution": "2;3;3;2", "presentation": "3;2;3;3", "wc_summary": "77;75;125;55", "wc_strengths": "51;43;49;48", "wc_weaknesses": "38;203;200;79", "wc_questions": "52;50;2;2", "wc_review": "218;371;376;184", "wc_reply_reviewers": "0;97;73;0", "wc_reply_authors": "975;789;541;415", "reply_reviewers": "0;1;1;0", "reply_authors": "2;2;1;1", "rating_avg": [ 4.5, 0.8660254037844386 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 83.0, 25.729360660537214 ], "wc_strengths_avg": [ 47.75, 2.947456530637899 ], "wc_weaknesses_avg": [ 130.0, 72.96231904209186 ], "wc_questions_avg": [ 26.5, 24.510201957552287 ], "wc_review_avg": [ 287.25, 87.10159298198857 ], "wc_reply_reviewers_avg": [ 42.5, 43.33878170876519 ], "wc_reply_authors_avg": [ 680.0, 217.05529249479267 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.3333333333333333, "gs_citation": 15, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=17618659319024588280&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 3, "aff_unique_index": "0;0", "aff_unique_norm": "Alibaba Group", "aff_unique_dep": "", "aff_unique_url": "https://www.alibaba.com", "aff_unique_abbr": "Alibaba", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "China" }, { "id": "07xuZw59uB", "title": "Bridging the Fairness Divide: Achieving Group and Individual Fairness in Graph Neural Networks", "track": "main", "status": "Reject", "tldr": "", "abstract": "Graph neural networks (GNNs) have emerged as a powerful tool for analyzing and learning from complex data structured as graphs, demonstrating remarkable effectiveness in various applications, such as social network analysis, recommendation systems, and drug 
discovery. However, despite their impressive performance, the fairness problem has increasingly gained attention as a crucial aspect to consider. Existing research on fairness in graph learning primarily emphasizes either group fairness or individual fairness; however, to the best of our knowledge, none of these studies comprehensively address both individual and group fairness simultaneously. In this paper, we propose a new concept of individual fairness within groups and a novel framework named Fairness for Group and Individual (FairGI), which considers both group fairness and individual fairness within groups in the context of graph learning. FairGI employs the similarity matrix of individuals to achieve individual fairness within groups, while leveraging adversarial learning to address group fairness in terms of both Equal Opportunity and Statistical Parity. The experimental results demonstrate that our approach not only outperforms other state-of-the-art models in terms of group fairness and individual fairness within groups, but also exhibits excellent performance in population-level individual fairness, while maintaining comparable prediction accuracy.", "keywords": "Graph Neural Networks;Fairness in Graph Learning;Individual Fairness;Group Fairness", "primary_area": "learning on graphs and other geometries & topologies", "supplementary_material": "", "author": "Duna Zhan;Dongliang Guo;Pengsheng Ji;Sheng Li", "authorids": "~Duna_Zhan1;~Dongliang_Guo1;~Pengsheng_Ji1;~Sheng_Li3", "gender": "F;M;;M", "homepage": "https://www.stat.uga.edu/directory/people/duna-zhan;https://donglgcn.github.io/;https://www.stat.uga.edu/directory/people/pengsheng-ji;http://sheng-li.org", "dblp": ";48/7696-2.html;153/2224;23/3439-1", "google_scholar": ";;Wwl-gO0AAAAJ;DEncVcYAAAAJ", "orcid": ";0000-0003-2856-4011;0000-0003-1439-5819;0000-0003-1205-8632", "linkedin": "dunazhan;;;sheng-li-15a70022/", "or_profile": "~Duna_Zhan1;~Dongliang_Guo1;~Pengsheng_Ji1;~Sheng_Li3", "aff": ";University of Virginia, Charlottesville;University of Georgia;University of Virginia, Charlottesville", "aff_domain": ";virginia.edu;uga.edu;virginia.edu", "position": ";PhD student;Associate Professor;Associate Professor", "bibtex": "@misc{\nzhan2024bridging,\ntitle={Bridging the Fairness Divide: Achieving Group and Individual Fairness in Graph Neural Networks},\nauthor={Duna Zhan and Dongliang Guo and Pengsheng Ji and Sheng Li},\nyear={2024},\nurl={https://openreview.net/forum?id=07xuZw59uB}\n}", "github": "", "project": "", "reviewers": "uySt;dYzA;n2zH;9gSh", "site": "https://openreview.net/forum?id=07xuZw59uB", "pdf_size": 487658, "rating": "1;3;3;5", "confidence": "4;4;4;4", "soundness": "1;2;2;2", "contribution": "2;1;1;3", "presentation": "2;3;3;2", "wc_summary": "106;51;150;85", "wc_strengths": "89;17;34;63", "wc_weaknesses": "489;94;147;321", "wc_questions": "265;4;2;73", "wc_review": "949;166;333;542", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 3.0, 1.4142135623730951 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 1.75, 0.4330127018922193 ], "contribution_avg": [ 1.75, 0.82915619758885 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 98.0, 35.86781286892191 ], "wc_strengths_avg": [ 50.75, 27.535204738661378 ], "wc_weaknesses_avg": [ 262.75, 155.28743510020377 ], "wc_questions_avg": [ 86.0, 107.2263960039691 ], "wc_review_avg": [ 497.5, 292.73921841803156 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 
0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 6, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=15362928413863393123&as_sdt=80005&sciodt=0,11&hl=en", "gs_version_total": 4, "aff_unique_index": "0;1;0", "aff_unique_norm": "University of Virginia;University of Georgia", "aff_unique_dep": ";", "aff_unique_url": "https://www.virginia.edu;https://www.uga.edu", "aff_unique_abbr": "UVA;UGA", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Charlottesville;", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "title": "Sheared LLaMA: Accelerating Language Model Pre-training via Structured Pruning", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19623", "id": "09iOdaeOzp", "author_site": "Mengzhou Xia, Tianyu Gao, Zhiyuan Zeng, Danqi Chen", "tldr": "", "abstract": "The popularity of LLaMA (Touvron et al., 2023a;b) and other recently emerged moderate-sized large language models (LLMs) highlights the potential of building smaller yet powerful LLMs. Regardless, the cost of training such models from scratch on trillions of tokens remains high. In this work, we study structured pruning as an effective means to develop smaller LLMs from pre-trained, larger models. Our approach employs two key techniques: (1) targeted structured pruning, which prunes a larger model to a specified target shape by removing layers, heads, and intermediate and hidden dimensions in an end-to-end manner, and (2) dynamic batch loading, which dynamically updates the composition of sampled data in each training batch based on varying losses across different domains. We demonstrate the efficacy of our approach by presenting the Sheared-LLaMA series, pruning the LLaMA2-7B model down to 1.3B and 2.7B parameters. Sheared-LLaMA models outperform state-of-the-art open-source models of equivalent sizes, such as Pythia, INCITE, OpenLLaMA and the concurrent TinyLlama models, on a wide range of downstream and instruction tuning evaluations, while requiring only 3% of compute compared to training such models from scratch. 
This work provides compelling evidence that leveraging existing LLMs with structured pruning is a far more cost-effective approach for building competitive small-scale LLMs", "keywords": "pruning;efficiency;large language models;pre-training", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Mengzhou Xia;Tianyu Gao;Zhiyuan Zeng;Danqi Chen", "authorids": "~Mengzhou_Xia1;~Tianyu_Gao1;~Zhiyuan_Zeng3;~Danqi_Chen1", "gender": "F;M;M;F", "homepage": "https://xiamengzhou.github.io/;https://gaotianyu.xyz/about/;https://zhiyuan-zeng.github.io/;https://www.cs.princeton.edu/~danqic/", "dblp": "241/9329;207/8893-1.html;;87/7949", "google_scholar": "zyJn1IcAAAAJ;il-F8YYAAAAJ;qLJqCqsAAAAJ;sVR8ktkAAAAJ", "orcid": ";0000-0002-5178-0866;;", "linkedin": ";;;", "or_profile": "~Mengzhou_Xia1;~Tianyu_Gao1;~Zhiyuan_Zeng3;~Danqi_Chen1", "aff": "Princeton University;Princeton University;Tsinghua University;Princeton University", "aff_domain": "princeton.edu;princeton.edu;tsinghua.edu.cn;cs.princeton.edu", "position": "PhD student;PhD student;Undergrad student;Assistant Professor", "bibtex": "@inproceedings{\nxia2024sheared,\ntitle={Sheared {LL}a{MA}: Accelerating Language Model Pre-training via Structured Pruning},\nauthor={Mengzhou Xia and Tianyu Gao and Zhiyuan Zeng and Danqi Chen},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=09iOdaeOzp}\n}", "github": "", "project": "", "reviewers": "bT2X;wgpN;urdF;qt4Y", "pdf_size": 739472, "rating": "5;5;6;8", "confidence": "4;4;4;4", "soundness": "3;3;2;4", "contribution": "3;2;2;4", "presentation": "2;3;3;3", "wc_summary": "78;57;138;102", "wc_strengths": "37;54;95;224", "wc_weaknesses": "349;337;386;30", "wc_questions": "5;13;72;398", "wc_review": "469;461;691;754", "wc_reply_reviewers": "0;0;0;15", "wc_reply_authors": "475;436;869;815", "reply_reviewers": "0;0;0;1", "reply_authors": "2;2;3;2", "rating_avg": [ 6.0, 1.224744871391589 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 2.75, 0.82915619758885 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 93.75, 30.102948360584218 ], "wc_strengths_avg": [ 102.5, 73.24786686313807 ], "wc_weaknesses_avg": [ 275.5, 142.88544362530425 ], "wc_questions_avg": [ 122.0, 161.43574573185455 ], "wc_review_avg": [ 593.75, 130.6931042557334 ], "wc_reply_reviewers_avg": [ 3.75, 6.49519052838329 ], "wc_reply_authors_avg": [ 648.75, 194.67970490012564 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 2.25, 0.4330127018922193 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 270, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=9713425200262995197&as_sdt=80000005&sciodt=0,23&hl=en", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=09iOdaeOzp", "pdf": "https://openreview.net/pdf?id=09iOdaeOzp", "email": "princeton.edu;princeton.edu;tsinghua.edu.cn;cs.princeton.edu", "author_num": 4, "aff_unique_index": "0;0;1;0", "aff_unique_norm": "Princeton University;Tsinghua University", "aff_unique_dep": ";", "aff_unique_url": "https://www.princeton.edu;https://www.tsinghua.edu.cn", "aff_unique_abbr": "Princeton;THU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;1;0", "aff_country_unique": "United States;China" }, { "title": "AutoLoRa: An 
Automated Robust Fine-Tuning Framework", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19622", "id": "09xFexjhqE", "author_site": "Xilie Xu, Jingfeng Zhang, Mohan Kankanhalli", "tldr": "", "abstract": "Robust Fine-Tuning (RFT) is a low-cost strategy to obtain adversarial robustness in downstream applications, without requiring a lot of computational resources and collecting significant amounts of data. This paper uncovers an issue with the existing RFT, \nwhere optimizing both adversarial and natural objectives through the feature extractor (FE) yields significantly divergent gradient directions. This divergence introduces instability in the optimization process, thereby hindering the attainment of adversarial robustness and rendering RFT highly sensitive to hyperparameters. To mitigate this issue, we propose a low-rank (LoRa) branch that disentangles RFT into two distinct components: optimizing natural objectives via the LoRa branch and adversarial objectives via the FE. Besides, we introduce heuristic strategies for automating the scheduling of the learning rate and the scalars of loss terms. Extensive empirical evaluations demonstrate that our proposed automated RFT disentangled via the LoRa branch (AutoLoRa) achieves new state-of-the-art results across a range of downstream tasks. AutoLoRa holds significant practical utility, as it automatically converts a pre-trained FE into an adversarially robust model for downstream tasks without the need for searching hyperparameters. Our source code is available at [the GitHub](https://github.com/GodXuxilie/RobustSSL_Benchmark/tree/main/Finetuning_Methods/AutoLoRa).", "keywords": "robust fine-tuning;adversarial robustness", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "Xilie Xu;Jingfeng Zhang;Mohan Kankanhalli", "authorids": "~Xilie_Xu1;~Jingfeng_Zhang1;~Mohan_Kankanhalli1", "gender": "M;M;M", "homepage": "https://godxuxilie.github.io/;https://zjfheart.github.io;https://www.comp.nus.edu.sg/~mohan", "dblp": "259/2327;227/2664.html;09/3613.html", "google_scholar": "https://scholar.google.com/citations?hl=en;NS0P1FkAAAAJ;6Lx_eowAAAAJ", "orcid": ";0000-0003-3491-8074;0000-0002-4846-2015", "linkedin": ";;mohan-kankanhalli-583417221", "or_profile": "~Xilie_Xu1;~Jingfeng_Zhang1;~Mohan_Kankanhalli1", "aff": "National University of Singapore;University of Auckland;National University of Singapore", "aff_domain": "nus.edu.sg;auckland.ac.nz;nus.edu.sg", "position": "PhD student;Assistant Professor;Full Professor", "bibtex": "@inproceedings{\nxu2024autolora,\ntitle={AutoLoRa: An Automated Robust Fine-Tuning Framework},\nauthor={Xilie Xu and Jingfeng Zhang and Mohan Kankanhalli},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=09xFexjhqE}\n}", "github": "", "project": "", "reviewers": "qytY;4DPH;pJnK;kvxv", "pdf_size": 552186, "rating": "5;6;6;8", "confidence": "4;4;3;4", "soundness": "2;2;3;3", "contribution": "2;3;2;2", "presentation": "3;3;3;3", "wc_summary": "83;228;114;104", "wc_strengths": "53;92;41;80", "wc_weaknesses": "116;288;191;48", "wc_questions": "5;164;47;3", "wc_review": "257;772;393;235", "wc_reply_reviewers": "0;128;346;81", "wc_reply_authors": "812;954;1010;298", "reply_reviewers": "0;2;2;1", "reply_authors": "3;3;4;2", "rating_avg": [ 6.25, 1.0897247358851685 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], 
"contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 132.25, 56.40201680791211 ], "wc_strengths_avg": [ 66.5, 20.402205763103165 ], "wc_weaknesses_avg": [ 160.75, 89.19466071464143 ], "wc_questions_avg": [ 54.75, 65.47661796397246 ], "wc_review_avg": [ 414.25, 215.2293834493794 ], "wc_reply_reviewers_avg": [ 138.75, 128.11591431200108 ], "wc_reply_authors_avg": [ 768.5, 281.0671627920985 ], "reply_reviewers_avg": [ 1.25, 0.82915619758885 ], "reply_authors_avg": [ 3.0, 0.7071067811865476 ], "replies_avg": [ 24, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.13245323570650439, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=18117461636957153722&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 2, "openreview": "https://openreview.net/forum?id=09xFexjhqE", "pdf": "https://openreview.net/pdf?id=09xFexjhqE", "email": "nus.edu.sg;auckland.ac.nz;nus.edu.sg", "author_num": 3, "aff_unique_index": "0;1;0", "aff_unique_norm": "National University of Singapore;University of Auckland", "aff_unique_dep": ";", "aff_unique_url": "https://www.nus.edu.sg;https://www.auckland.ac.nz", "aff_unique_abbr": "NUS;UoA", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;0", "aff_country_unique": "Singapore;New Zealand" }, { "id": "0A5o6dCKeK", "title": "NExT-GPT: Any-to-Any Multimodal LLM", "track": "main", "status": "Reject", "tldr": "", "abstract": "While recently Multimodal Large Language Models (MM-LLMs) have made exciting strides, they mostly fall prey to the limitation of only input-side multimodal understanding, without the ability to produce content in multiple modalities. As we humans always perceive the world and communicate with people through various modalities, developing any-to-any MM-LLMs capable of accepting and delivering content in any modality becomes essential to human-level AI. To fill the gap, we present an end-to-end general-purpose any-to-any MM-LLM system, NExT-GPT. We connect an LLM with multimodal adaptors and different diffusion decoders, enabling NExT-GPT to perceive inputs and generate outputs in arbitrary combinations of text, images, videos, and audio. By leveraging the existing well-trained highly-performing encoders and decoders, NExT-GPT is tuned with only a small amount of parameter (1%) of certain projection layers, which not only benefits low-cost training but also facilitates convenient expansion to more potential modalities. Moreover, we introduce a modality-switching instruction tuning (MosIT) and manually curate a high-quality dataset for MosIT, based on which NExT-GPT is empowered with complex cross-modal semantic understanding and content generation. 
Overall, our research showcases the promising possibility of building a unified AI agent capable of modeling universal modalities, paving the way for more human-like AI research in the community.", "keywords": "Large Language Model;Diffusion Model", "primary_area": "generative models", "supplementary_material": "/attachment/270675d02e3504834cbfd92ecf17614841e9db3f.zip", "author": "Shengqiong Wu;Hao Fei;Leigang Qu;Wei Ji;Tat-Seng Chua", "authorids": "~Shengqiong_Wu2;~Hao_Fei1;~Leigang_Qu1;~Wei_Ji1;~Tat-Seng_Chua2", "gender": "F;M;M;M;M", "homepage": "https://chocowu.github.io/;https://haofei.vip/;https://leigang-qu.github.io/;https://jiwei0523.github.io/;http://www.comp.nus.edu.sg/~chuats/", "dblp": "274/7191;81/3569-1;276/3150;52/3220-8;", "google_scholar": "RJJLKR0AAAAJ;YGDX46AAAAAJ;1W2Tio4AAAAJ;69OFB-AAAAAJ;https://scholar.google.com.tw/citations?user=Z9DWCBEAAAAJ", "orcid": "0000-0001-6192-1194;0000-0003-3026-6347;0009-0004-6555-3834;0000-0002-8106-9768;0000-0001-6097-7807", "linkedin": ";;;;", "or_profile": "~Shengqiong_Wu2;~Hao_Fei1;~Leigang_Qu1;~Wei_Ji1;~Tat-seng_Chua1", "aff": "National University of Singapore;National University of Singapore;National University of Singapore;Nanjing University;National University of Singapore", "aff_domain": "u.nus.edu;nus.edu.sg;u.nus.edu;nju.edu.cn;nus.edu.sg", "position": "PhD student;Postdoc;PhD student;Associate Professor;Full Professor", "bibtex": "@misc{\nwu2024nextgpt,\ntitle={{NE}xT-{GPT}: Any-to-Any Multimodal {LLM}},\nauthor={Shengqiong Wu and Hao Fei and Leigang Qu and Wei Ji and Tat-Seng Chua},\nyear={2024},\nurl={https://openreview.net/forum?id=0A5o6dCKeK}\n}", "github": "", "project": "", "reviewers": "NwS3;ijPL;7uQJ;mDkx", "site": "https://openreview.net/forum?id=0A5o6dCKeK", "pdf_size": 8145815, "rating": "5;5;6;8", "confidence": "4;5;4;4", "soundness": "3;3;3;3", "contribution": "3;2;3;3", "presentation": "4;3;4;3", "wc_summary": "68;49;78;21", "wc_strengths": "39;35;64;22", "wc_weaknesses": "127;200;82;47", "wc_questions": "3;2;11;64", "wc_review": "237;286;235;154", "wc_reply_reviewers": "99;0;0;0", "wc_reply_authors": "1443;1773;771;397", "reply_reviewers": "1;0;0;0", "reply_authors": "4;4;2;1", "rating_avg": [ 6.0, 1.224744871391589 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.5, 0.5 ], "wc_summary_avg": [ 54.0, 21.714050750608465 ], "wc_strengths_avg": [ 40.0, 15.215124054702938 ], "wc_weaknesses_avg": [ 114.0, 57.17954179599553 ], "wc_questions_avg": [ 20.0, 25.64176280991617 ], "wc_review_avg": [ 228.0, 47.3550419702063 ], "wc_reply_reviewers_avg": [ 24.75, 42.868257487329714 ], "wc_reply_authors_avg": [ 1096.0, 541.5173127426306 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 2.75, 1.299038105676658 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.4714045207910316, "gs_citation": 616, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=174615942206434624&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 6, "aff_unique_index": "0;0;0;1;0", "aff_unique_norm": "National University of Singapore;Nanjing University", "aff_unique_dep": ";", "aff_unique_url": "https://www.nus.edu.sg;https://www.nju.edu.cn", "aff_unique_abbr": "NUS;Nanjing U", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;1;0", "aff_country_unique": "Singapore;China" }, { "id": "0AYosSFETw", "title": "Towards human-like spoken dialogue 
generation between AI agents from written dialogue", "track": "main", "status": "Reject", "tldr": "", "abstract": "The advent of large language models (LLMs) has made it possible to generate natural written dialogues between two agents.\nHowever, generating human-like spoken dialogues from these written dialogues remains challenging.\nSpoken dialogues have several unique characteristics: they frequently include backchannels and laughter, and the smoothness of turn-taking significantly influences the fluidity of conversation.\nThis study proposes CHATS \u2015 CHatty Agents Text-to-Speech \u2015 a discrete token-based system designed to generate spoken dialogues based on written dialogues.\nOur system can generate speech for both the speaker side and the listener side simultaneously, using only the transcription from the speaker side, which eliminates the need for transcriptions of backchannels or laughter.\nMoreover, CHATS facilitates natural turn-taking; it determines the appropriate duration of silence after each utterance in the absence of overlap, and it initiates the generation of overlapping speech based on the phoneme sequence of the next utterance in case of overlap.\nExperimental evaluations indicate that CHATS outperforms the text-to-speech baseline, producing spoken dialogues that are more interactive and fluid while retaining clarity and intelligibility.", "keywords": "spoken dialogue modeling;text-to-speech synthesis;backchannel generation;turn-taking", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Kentaro Mitsui;Yukiya Hono;Kei Sawada", "authorids": "~Kentaro_Mitsui1;~Yukiya_Hono1;~Kei_Sawada1", "gender": "M;M;", "homepage": ";;", "dblp": "247/6422;;", "google_scholar": "https://scholar.google.co.jp/citations?user=RMIT5OQAAAAJ;SU5SLdUAAAAJ;", "orcid": ";;", "linkedin": ";;", "or_profile": "~Kentaro_Mitsui1;~Yukiya_Hono1;~Kei_Sawada1", "aff": "rinna Co., Ltd.;Nagoya Institute of Technology;", "aff_domain": "rinna.co.jp;nitech.ac.jp;", "position": "Researcher;Postdoc;", "bibtex": "@misc{\nmitsui2024towards,\ntitle={Towards human-like spoken dialogue generation between {AI} agents from written dialogue},\nauthor={Kentaro Mitsui and Yukiya Hono and Kei Sawada},\nyear={2024},\nurl={https://openreview.net/forum?id=0AYosSFETw}\n}", "github": "", "project": "", "reviewers": "Kha2;FEtd;yc8m", "site": "https://openreview.net/forum?id=0AYosSFETw", "pdf_size": 1229911, "rating": "5;6;8", "confidence": "3;4;4", "soundness": "2;4;4", "contribution": "3;2;3", "presentation": "2;3;3", "wc_summary": "204;50;154", "wc_strengths": "52;57;129", "wc_weaknesses": "175;76;94", "wc_questions": "20;74;17", "wc_review": "451;257;394", "wc_reply_reviewers": "39;0;0", "wc_reply_authors": "1071;519;1443", "reply_reviewers": "1;0;0", "reply_authors": "3;1;3", "rating_avg": [ 6.333333333333333, 1.247219128924647 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 3.3333333333333335, 0.9428090415820634 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 136.0, 64.14566755959959 ], "wc_strengths_avg": [ 79.33333333333333, 35.178907822096406 ], "wc_weaknesses_avg": [ 115.0, 43.05810028322197 ], "wc_questions_avg": [ 37.0, 26.19160170741759 ], "wc_review_avg": [ 367.3333333333333, 81.41389452803632 ], "wc_reply_reviewers_avg": [ 13.0, 18.384776310850235 ], "wc_reply_authors_avg": [ 
1011.0, 379.5997892517855 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 2.3333333333333335, 0.9428090415820634 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.7559289460184545, "gs_citation": 19, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=9835558836471678525&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "aff_unique_index": "0;1", "aff_unique_norm": "rinna Co., Ltd.;Nagoya Institute of Technology", "aff_unique_dep": ";", "aff_unique_url": ";https://www.nitech.ac.jp", "aff_unique_abbr": ";NIT", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "Japan" }, { "title": "One-shot Empirical Privacy Estimation for Federated Learning", "status": "Oral", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19621", "id": "0BqyZSWfzo", "author_site": "Galen Andrew, Peter Kairouz, Sewoong Oh, Alina Oprea, H. Brendan McMahan, Vinith Suriyakumar", "tldr": "", "abstract": "Privacy estimation techniques for differentially private (DP) algorithms are useful for comparing against analytical bounds, or to empirically measure privacy loss in settings where known analytical bounds are not tight. However, existing privacy auditing techniques usually make strong assumptions on the adversary (e.g., knowledge of intermediate model iterates or the training data distribution), are tailored to specific tasks, model architectures, or DP algorithm, and/or require retraining the model many times (typically on the order of thousands). These shortcomings make deploying such techniques at scale difficult in practice, especially in federated settings where model training can take days or weeks. In this work, we present a novel \u201cone-shot\u201d approach that can systematically address these challenges, allowing efficient auditing or estimation of the privacy loss of a model during the same, single training run used to fit model parameters, and without requiring any a priori knowledge about the model architecture, task, or DP algorithm. 
We show that our method provides provably correct estimates for the privacy loss under the Gaussian mechanism, and we demonstrate its performance on a well-established FL benchmark dataset under several adversarial threat models.", "keywords": "differential privacy;federated learning;empirical privacy", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "Galen Andrew;Peter Kairouz;Sewoong Oh;Alina Oprea;Hugh Brendan McMahan;Vinith Menon Suriyakumar", "authorids": "~Galen_Andrew1;~Peter_Kairouz1;~Sewoong_Oh3;~Alina_Oprea1;~Hugh_Brendan_McMahan1;~Vinith_Menon_Suriyakumar1", "gender": "M;M;;F;M;M", "homepage": ";https://kairouzp.github.io/;;http://www.ccs.neu.edu/home/alina/;;", "dblp": "31/1971;129/1254;;35/3425;;", "google_scholar": ";m8NUgw0AAAAJ;;https://scholar.google.com.tw/citations?user=16J3izoAAAAJ;;https://scholar.google.com/citations?hl=en", "orcid": ";;;0000-0002-4979-5292;;", "linkedin": ";kayrouzp;;alina-oprea-9588bb1;;vsuriyakumar", "or_profile": "~Galen_Andrew1;~Peter_Kairouz1;~Sewoong_Oh3;~Alina_Oprea1;~Hugh_Brendan_McMahan1;~Vinith_Menon_Suriyakumar1", "aff": "Google;Google;;Northeastern University;Google;Massachusetts Institute of Technology", "aff_domain": "google.com;google.com;;northeastern.edu;google.com;mit.edu", "position": "Researcher;Research Scientist;;Associate Professor;Research Scientist;PhD student", "bibtex": "@inproceedings{\nandrew2024oneshot,\ntitle={One-shot Empirical Privacy Estimation for Federated Learning},\nauthor={Galen Andrew and Peter Kairouz and Sewoong Oh and Alina Oprea and Hugh Brendan McMahan and Vinith Menon Suriyakumar},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=0BqyZSWfzo}\n}", "github": "", "project": "", "reviewers": "ZyjW;zCeQ;LDHu", "pdf_size": 599734, "rating": "8;8;8", "confidence": "4;3;3", "soundness": "4;3;4", "contribution": "3;2;3", "presentation": "3;3;4", "wc_summary": "144;69;66", "wc_strengths": "74;56;116", "wc_weaknesses": "655;142;169", "wc_questions": "112;152;39", "wc_review": "985;419;390", "wc_reply_reviewers": "775;108;24", "wc_reply_authors": "2205;1400;906", "reply_reviewers": "4;1;1", "reply_authors": "5;4;2", "rating_avg": [ 8.0, 0.0 ], "confidence_avg": [ 3.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 3.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 3.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 93.0, 36.08323710533743 ], "wc_strengths_avg": [ 82.0, 25.13961017995307 ], "wc_weaknesses_avg": [ 322.0, 235.7244153667583 ], "wc_questions_avg": [ 101.0, 46.783187863447985 ], "wc_review_avg": [ 598.0, 273.9063100161562 ], "wc_reply_reviewers_avg": [ 302.3333333333333, 335.980488851494 ], "wc_reply_authors_avg": [ 1503.6666666666667, 535.3567865348201 ], "reply_reviewers_avg": [ 2.0, 1.4142135623730951 ], "reply_authors_avg": [ 3.6666666666666665, 1.247219128924647 ], "replies_avg": [ 23, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 40, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=2844245160919175035&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=0BqyZSWfzo", "pdf": "https://openreview.net/pdf?id=0BqyZSWfzo", "email": "google.com;google.com;;northeastern.edu;google.com;mit.edu", "author_num": 6, "aff_unique_index": "0;0;1;0;2", "aff_unique_norm": 
"Google;Northeastern University;Massachusetts Institute of Technology", "aff_unique_dep": "Google;;", "aff_unique_url": "https://www.google.com;https://www.northeastern.edu;https://web.mit.edu", "aff_unique_abbr": "Google;NEU;MIT", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Mountain View;", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "0Ce3c9l7G1", "title": "Learning Multi-Agent Communication using Regularized Attention Messages", "track": "main", "status": "Reject", "tldr": "", "abstract": "Learning how to communicate in Multi-Agent Reinforcement Learning (MARL) can be key to solve complex cooperative tasks. Recent approaches have shown the advantages of using an efficient communication architecture, tackling problems such as what, when, or whom to communicate. However, these methods still fail to solve some complex scenarios, and some of them do not evaluate the implications of having limited communication channels. In this paper, we propose Attentive Regularized Communication (ARCOMM), a new method for communication in MARL. The proposed method uses an attention module to evaluate the weight of the messages generated by the agents, together with a message regularizer that facilitates learning more meaningful messages, improving the performance of the team. We further analyse how ARCOMM reacts to situations where the messages must be compressed before being sent to other agents. Our results show that the proposed method helps, through the power of communication, to improve the performances of the agents in complex domains when compared to other methods. Furthermore, we show that, although there is a decrease of performance, agents are still capable of learning even with lossy communication. 
The messages learned by the agents also support the motivations for our method.", "keywords": "Multi-Agent Reinforcement Learning;Communication;Attention;Message Compression", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Rafael Moreira Pina;Varuna De SIlva De SIlva;Corentin Artaud", "authorids": "~Rafael_Moreira_Pina1;~Varuna_De_SIlva_De_SIlva1;~Corentin_Artaud1", "gender": "M;Non-Binary;", "homepage": ";https://www.lborolondon.ac.uk/about/staff/dr-varuna-de-silva/;https://corentinartaud.github.io", "dblp": "310/3161;;333/5155", "google_scholar": ";;https://scholar.google.co.uk/citations?user=702BRhkAAAAJ", "orcid": "0000-0003-1304-3539;;0009-0002-0387-235X", "linkedin": "rafael-pina-b26913194/;;corentinartaud/", "or_profile": "~Rafael_Moreira_Pina1;~Varuna_De_SIlva_De_SIlva1;~Corentin_Artaud1", "aff": "Loughborough University London;Loughborough University;Loughborough University London", "aff_domain": "lboro.ac.uk;lboro.ac.uk;lboro.ac.uk", "position": "PhD student;Associate Professor;PhD student", "bibtex": "@misc{\npina2024learning,\ntitle={Learning Multi-Agent Communication using Regularized Attention Messages},\nauthor={Rafael Moreira Pina and Varuna De SIlva De SIlva and Corentin Artaud},\nyear={2024},\nurl={https://openreview.net/forum?id=0Ce3c9l7G1}\n}", "github": "", "project": "", "reviewers": "cGtd;j1DY;eV4L;FWnu", "site": "https://openreview.net/forum?id=0Ce3c9l7G1", "pdf_size": 28872842, "rating": "3;3;5;5", "confidence": "4;5;4;4", "soundness": "2;1;2;2", "contribution": "2;2;2;2", "presentation": "3;2;2;2", "wc_summary": "57;21;71;96", "wc_strengths": "9;10;27;54", "wc_weaknesses": "157;144;252;70", "wc_questions": "58;9;26;70", "wc_review": "281;184;376;290", "wc_reply_reviewers": "0;0;54;37", "wc_reply_authors": "652;530;1205;758", "reply_reviewers": "0;0;1;2", "reply_authors": "2;2;3;3", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 1.75, 0.4330127018922193 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 61.25, 27.11434122378783 ], "wc_strengths_avg": [ 25.0, 18.207141456033124 ], "wc_weaknesses_avg": [ 155.75, 64.72393297691357 ], "wc_questions_avg": [ 40.75, 24.38621536852326 ], "wc_review_avg": [ 282.75, 68.01240695637819 ], "wc_reply_reviewers_avg": [ 22.75, 23.53056522908024 ], "wc_reply_authors_avg": [ 786.25, 254.87092321408497 ], "reply_reviewers_avg": [ 0.75, 0.82915619758885 ], "reply_authors_avg": [ 2.5, 0.5 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:weN9GJto7N4J:scholar.google.com/&scioq=Learning+Multi-Agent+Communication+using+Regularized+Attention+Messages&hl=en&as_sdt=0,31", "gs_version_total": 0, "aff_unique_index": "0;0;0", "aff_unique_norm": "Loughborough University", "aff_unique_dep": "", "aff_unique_url": "https://www.lborolondon.ac.uk", "aff_unique_abbr": "Lboro", "aff_campus_unique_index": "0;0", "aff_campus_unique": "London;", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United Kingdom" }, { "id": "0D6mUZTWoF", "title": "A Topology-aware Graph Coarsening Framework for Continual Graph Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "Continual learning on graphs tackles the problem of training a graph neural network (GNN) where graph data arrive in a streaming fashion and the model tends to forget knowledge from previous tasks 
when updating with new data.\nTraditional continual learning strategies such as Experience Replay can be adapted to streaming graphs; however, these methods often face challenges such as inefficiency in preserving graph topology and an inability to capture the correlation between old and new tasks.\nTo address these challenges, we propose TA$\\mathbb{CO}$, a topology-aware graph coarsening and continual learning framework that stores information from previous tasks as a reduced graph. \nAt each time period, this reduced graph expands by combining with a new graph and aligning shared nodes, and then it undergoes a ``zoom out'' process by reduction to maintain a stable size. \nWe design a graph coarsening algorithm based on node representation proximities to efficiently reduce a graph and preserve topological information. We empirically demonstrate that the learning process on the reduced graph can approximate that of the original graph.\nOur experiments validate the effectiveness of the proposed framework on three real-world datasets using different backbone GNN models.", "keywords": "Continual Graph Learning;Catastrophic Forgetting;Graph Coarsening", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "/attachment/660a4731ebe4deeeadf25c4f5443ce61f19453f8.zip", "author": "Xiaoxue Han;Zhuo Feng;Yue Ning", "authorids": "~Xiaoxue_Han1;~Zhuo_Feng3;~Yue_Ning1", "gender": "F;M;F", "homepage": "https://hanxiaoxue114.github.io/;https://web.stevens.edu/facultyprofile/?id=2371;https://yue-ning.github.io/", "dblp": "219/1935;81/4441.html;74/9990-1.html", "google_scholar": ";;https://scholar.google.com/citations?hl=en", "orcid": ";;", "linkedin": ";;", "or_profile": "~Xiaoxue_Han1;~Zhuo_Feng3;~Yue_Ning1", "aff": "Stevens Institute of Technology;;Stevens Institute of Technology", "aff_domain": "stevens.edu;;stevens.edu", "position": "PhD student;;Assistant Professor", "bibtex": "@misc{\nhan2024a,\ntitle={A Topology-aware Graph Coarsening Framework for Continual Graph Learning},\nauthor={Xiaoxue Han and Zhuo Feng and Yue Ning},\nyear={2024},\nurl={https://openreview.net/forum?id=0D6mUZTWoF}\n}", "github": "", "project": "", "reviewers": "9rSM;sD2m;Tw7D;A9ak", "site": "https://openreview.net/forum?id=0D6mUZTWoF", "pdf_size": 937313, "rating": "3;5;6;8", "confidence": "5;4;3;3", "soundness": "3;3;3;3", "contribution": "2;2;3;3", "presentation": "3;2;3;3", "wc_summary": "136;68;88;98", "wc_strengths": "31;26;32;99", "wc_weaknesses": "184;35;66;78", "wc_questions": "36;253;25;156", "wc_review": "387;382;211;431", "wc_reply_reviewers": "0;223;22;0", "wc_reply_authors": "1061;948;432;1186", "reply_reviewers": "0;1;1;0", "reply_authors": "3;3;1;3", "rating_avg": [ 5.5, 1.8027756377319946 ], "confidence_avg": [ 3.75, 0.82915619758885 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 97.5, 24.713356712514795 ], "wc_strengths_avg": [ 47.0, 30.108138434649195 ], "wc_weaknesses_avg": [ 90.75, 56.07751331861997 ], "wc_questions_avg": [ 117.5, 93.59620718811206 ], "wc_review_avg": [ 352.75, 84.03087230298159 ], "wc_reply_reviewers_avg": [ 61.25, 93.81730917053633 ], "wc_reply_authors_avg": [ 906.75, 286.73278065125373 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 2.5, 0.8660254037844386 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.9198662110077999, "gs_citation": 3, "gs_cited_by_link":
"https://scholar.google.com/scholar?cites=17516262532202830926&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 10, "aff_unique_index": "0;0", "aff_unique_norm": "Stevens Institute of Technology", "aff_unique_dep": "", "aff_unique_url": "https://www.stevens.edu", "aff_unique_abbr": "SIT", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "id": "0GZ1Bq4Tfr", "title": "Layer-wise Pre-weight Decay", "track": "main", "status": "Reject", "tldr": "", "abstract": "In deep learning, weight decay is a regularization mechanism been widely adopted to improve the generalization performance. Previously, a common understanding of the role of weight decay was that it contributes by pushing the model weights to approach 0 at each time step. \nHowever, our findings challenge this notion and argue the objective of weight decay is to make the weights approach the negative value of the update term instead of 0, thereby indicating a delay defect in certain steps that results in opposing penalties. In addition, we study the negative side effect of weight decay, revealing it will damage the inter-layer connectivity of the network while reducing weight magnitude.\nTo address these issues, we first propose real-time weight decay to fix the delay defect by penalizing both the weights and the gradients at each time step. \nThen, we advance the decay step before the update function as pre-weight decay to mitigate the performance drop raised by the side effect.\nTo further improve the general performance and enhance model robustness towards the decay rate, we finally introduce a layer-wise pre-weight decay to adjust the decay rate based on the layer index. \nExtensive analytical and comparative experiments demonstrate that the proposed $\\textit{layer-wise pre-weight decay}$ (LPWD) (i) exhibits remarkable robustness to the decay rate, and (ii) significantly improves the generalization performance across various conditions.", "keywords": "deep learning;regularization;generalization;weight decay", "primary_area": "optimization", "supplementary_material": "", "author": "Xiaolong Huang;Qiankun Li;Hanguang Xiao;Gao Xuesong;Xueran Li", "authorids": "~Xiaolong_Huang3;~Qiankun_Li1;~Hanguang_Xiao1;~Gao_Xuesong1;~Xueran_Li1", "gender": "M;M;M;M;M", "homepage": ";https://orcid.org/0000-0001-5121-1682;https://ai.cqut.edu.cn/info/1052/1679.htm;https://github.com/Mr-GaoXueSong;https://github.com/lxr-1204", "dblp": ";228/7339;;;", "google_scholar": "https://scholar.google.com.hk/citations?hl=zh-CN;https://scholar.google.com/citations?hl=en;;;", "orcid": ";0000-0001-5121-1682;;;", "linkedin": ";;;;", "or_profile": "~Xiaolong_Huang3;~Qiankun_Li1;~Hanguang_Xiao1;~Gao_Xuesong1;~Xueran_Li1", "aff": "Mila - Quebec Artificial Intelligence Institute;University of Science and Technology of China;Chongqing University of Technology;;Anhui University", "aff_domain": "mila.quebec;ustc.edu.cn;cuqt.edu.cn;;ahu.edu.cn", "position": "MS student;PhD student;Full Professor;;MS student", "bibtex": "@misc{\nhuang2024layerwise,\ntitle={Layer-wise Pre-weight Decay},\nauthor={Xiaolong Huang and Qiankun Li and Hanguang Xiao and Gao Xuesong and Xueran Li},\nyear={2024},\nurl={https://openreview.net/forum?id=0GZ1Bq4Tfr}\n}", "github": "", "project": "", "reviewers": "QiZQ;AMDG;hMNw;51Q7", "site": "https://openreview.net/forum?id=0GZ1Bq4Tfr", "pdf_size": 3289142, "rating": "3;3;3;6", "confidence": "4;4;5;3", "soundness": "2;2;1;3", "contribution": "2;2;1;3", "presentation": 
"2;2;2;2", "wc_summary": "127;107;55;56", "wc_strengths": "22;51;13;58", "wc_weaknesses": "224;149;125;175", "wc_questions": "63;28;79;31", "wc_review": "436;335;272;320", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 3.75, 1.299038105676658 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.0, 0.7071067811865476 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 2.0, 0.0 ], "wc_summary_avg": [ 86.25, 31.554516317002864 ], "wc_strengths_avg": [ 36.0, 18.934096228761486 ], "wc_weaknesses_avg": [ 168.25, 36.72448093574639 ], "wc_questions_avg": [ 50.25, 21.533404282648853 ], "wc_review_avg": [ 340.75, 59.713377898089135 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 6, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.816496580927726, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:6NAF6PFAlzQJ:scholar.google.com/&scioq=Layer-wise+Pre-weight+Decay&hl=en&as_sdt=0,48", "gs_version_total": 0, "aff_unique_index": "0;1;2;3", "aff_unique_norm": "Quebec Artificial Intelligence Institute;University of Science and Technology of China;Chongqing University of Technology;Anhui University", "aff_unique_dep": "Artificial Intelligence;;;", "aff_unique_url": "https://mila.quebec;http://www.ustc.edu.cn;http://www.cqut.edu.cn;http://www.ahu.edu.cn/", "aff_unique_abbr": "Mila;USTC;;AHU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;1;1", "aff_country_unique": "Canada;China" }, { "title": "Language Control Diffusion: Efficiently Scaling through Space, Time, and Tasks", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19620", "id": "0H6DFoZZXZ", "author_site": "Edwin Zhang, Yujie Lu, Shinda Huang, William Wang, Amy Zhang", "tldr": "", "abstract": "Training generalist agents is difficult across several axes, requiring us to deal with high-dimensional inputs (space), long horizons (time), and generalization to novel tasks. Recent advances with architectures have allowed for improved scaling along one or two of these axes, but are still computationally prohibitive to use. In this paper, we propose to address all three axes by leveraging Language to Control Diffusion models as a hierarchical planner conditioned on language (LCD). We effectively and efficiently scale diffusion models for planning in extended temporal, state, and task dimensions to tackle long horizon control problems conditioned on natural language instructions, as a step towards generalist agents. Comparing LCD with other state-of-the-art models on the CALVIN language benchmark finds that LCD outperforms other SOTA methods in multi-task success rates, whilst improving inference speed over other comparable diffusion models by 3.3x~15x. 
We show that LCD can successfully leverage the unique strength of diffusion models to produce coherent long range plans while addressing their weakness in generating low-level details and control.", "keywords": "planning;diffusion;language;RL;reinforcement", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/f73f5eb9525f55dc681390f230a073bff76cbce3.zip", "author": "Edwin Zhang;Yujie Lu;Shinda Huang;William Yang Wang;Amy Zhang", "authorids": "~Edwin_Zhang2;~Yujie_Lu1;~Shinda_Huang1;~William_Yang_Wang2;~Amy_Zhang1", "gender": ";;;F;M", "homepage": "https://eddie.win;https://yujielu10.github.io/;;;https://www.cs.ucsb.edu/~william/", "dblp": ";;;43/2754;08/9282", "google_scholar": ";pcmr6GMAAAAJ;;;gf8Ms_8AAAAJ", "orcid": ";;;;", "linkedin": ";;shinda-huang/;;", "or_profile": "~Edwin_Zhang2;~Yujie_Lu1;~Shinda_Huang1;~Amy_Zhang2;~William_Wang1", "aff": "Harvard University;UC Santa Barbara;University of California, Santa Barbara;Meta Facebook;UC Santa Barbara", "aff_domain": "harvard.edu;ucsb.edu;ucsb.edu;facebook.com;ucsb.edu", "position": "PhD student;PhD student;MS student;Research Scientist;Full Professor", "bibtex": "@inproceedings{\nzhang2024language,\ntitle={Language Control Diffusion: Efficiently Scaling through Space, Time, and Tasks},\nauthor={Edwin Zhang and Yujie Lu and Shinda Huang and William Yang Wang and Amy Zhang},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=0H6DFoZZXZ}\n}", "github": "", "project": "", "reviewers": "z6e9;74cS;FYfw;fAWH", "pdf_size": 2758481, "rating": "5;6;6;6", "confidence": "4;3;3;3", "soundness": "3;3;3;3", "contribution": "2;3;2;3", "presentation": "3;3;3;3", "wc_summary": "71;46;34;44", "wc_strengths": "21;82;34;71", "wc_weaknesses": "94;172;223;76", "wc_questions": "2;87;5;73", "wc_review": "188;387;296;264", "wc_reply_reviewers": "0;137;12;0", "wc_reply_authors": "1014;1285;1093;685", "reply_reviewers": "0;1;1;0", "reply_authors": "4;4;2;1", "rating_avg": [ 5.75, 0.4330127018922193 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 48.75, 13.626720074911644 ], "wc_strengths_avg": [ 52.0, 25.228951623085727 ], "wc_weaknesses_avg": [ 141.25, 59.41117319158072 ], "wc_questions_avg": [ 41.75, 38.58351331851468 ], "wc_review_avg": [ 283.75, 71.35956488096042 ], "wc_reply_reviewers_avg": [ 37.25, 57.798680780792914 ], "wc_reply_authors_avg": [ 1019.25, 216.6868420093846 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 2.75, 1.299038105676658 ], "replies_avg": [ 22, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -1.0, "gs_citation": 14, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12290706867650507132&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=0H6DFoZZXZ", "pdf": "https://openreview.net/pdf?id=0H6DFoZZXZ", "email": "harvard.edu;ucsb.edu;ucsb.edu;facebook.com;ucsb.edu", "author_num": 5, "aff_unique_index": "0;1;1;2;1", "aff_unique_norm": "Harvard University;University of California, Santa Barbara;Meta", "aff_unique_dep": ";;Meta Platforms, Inc.", "aff_unique_url": "https://www.harvard.edu;https://www.ucsb.edu;https://meta.com", "aff_unique_abbr": "Harvard;UCSB;Meta", "aff_campus_unique_index": "1;1;1", "aff_campus_unique": ";Santa Barbara", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "United States" }, { "id": 
"0HIMHjYhYe", "title": "Diffusion Model-Augmented Behavioral Cloning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Imitation learning addresses the challenge of learning by observing an expert\u2019s demonstrations without access to reward signals from environments. Most existing imitation learning methods that do not require interacting with environments either model the expert distribution as the conditional probability p(a|s) (e.g., behavioral cloning, BC) or the joint probability p(s, a) Despite its simplicity, modeling the conditional probability with BC usually struggles with generalization. While modeling the joint probability can lead to improved generalization performance, the inference procedure is often time-consuming and the model can suffer from manifold overfitting. This work proposes an imitation learning framework that benefits from modeling both the conditional and joint probability of the expert distribution. Our proposed diffusion model-augmented behavioral cloning (DBC) employs a diffusion model trained to model expert behaviors and learns a policy to optimize both the BC loss (conditional) and our proposed diffusion model loss (joint). DBC outperforms baselines in various continuous control tasks in navigation, robot arm manipulation, dexterous manipulation, and locomotion. We design additional experiments to verify the limitations of modeling either the conditional probability or the joint probability of the expert distribution as well as compare different generative models. Ablation studies justify the effectiveness of our design choices.", "keywords": "Imitation Learning;Learning from Demonstration;Diffusion Models;Behavioral Cloning", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/ce67a7bb74506963876163cf4b308455c4027d26.pdf", "author": "Hsiang-Chun Wang;Shang-Fu Chen;Ming-Hao Hsu;Chun-Mao Lai;Shao-Hua Sun", "authorids": "~Hsiang-Chun_Wang1;~Shang-Fu_Chen2;~Ming-Hao_Hsu1;~Chun-Mao_Lai1;~Shao-Hua_Sun1", "gender": ";M;M;M;M", "homepage": "https://hsiangchun0205.github.io/;https://www.linkedin.com/in/shang-fu-chen-354914199/;https://qaz159qaz159.github.io/;https://mecoli1219.github.io/;http://shaohua0116.github.io", "dblp": ";203/9102;325/4631;325/4767;158/9680", "google_scholar": "https://scholar.google.com.tw/citations?user=vpJMSjMAAAAJ;https://scholar.google.com.tw/citations?user=ZKOpgs4AAAAJ;;;uXsfnaQAAAAJ", "orcid": ";;;;0000-0001-7579-6734", "linkedin": "https://tw.linkedin.com/in/hsiang-chun-wang-8a4798269;;;;shaohua0116/", "or_profile": "~Hsiang-Chun_Wang1;~Shang-Fu_Chen2;~Ming-Hao_Hsu1;~Chun-Mao_Lai1;~Shao-Hua_Sun1", "aff": "National Taiwan University;National Taiwan University;National Taiwan University;National Taiwan University;National Taiwan University", "aff_domain": "ntu.edu.tw;ntu.edu.tw;ntu.edu.tw;ntu.edu.tw;ntu.edu.tw", "position": "MS student;PhD student;Undergrad student;Undergrad student;Assistant Professor", "bibtex": "@misc{\nwang2024diffusion,\ntitle={Diffusion Model-Augmented Behavioral Cloning},\nauthor={Hsiang-Chun Wang and Shang-Fu Chen and Ming-Hao Hsu and Chun-Mao Lai and Shao-Hua Sun},\nyear={2024},\nurl={https://openreview.net/forum?id=0HIMHjYhYe}\n}", "github": "", "project": "", "reviewers": "dYN2;bGrV;8bWB;Mkdd", "site": "https://openreview.net/forum?id=0HIMHjYhYe", "pdf_size": 2354520, "rating": "3;3;3;6", "confidence": "4;5;4;4", "soundness": "2;2;1;3", "contribution": "2;1;2;3", "presentation": "3;2;2;3", "wc_summary": "54;70;77;58", "wc_strengths": "28;37;45;116", 
"wc_weaknesses": "2;506;153;61", "wc_questions": "98;3;6;36", "wc_review": "182;616;281;271", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 3.75, 1.299038105676658 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 2.0, 0.7071067811865476 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 64.75, 9.202581159652981 ], "wc_strengths_avg": [ 56.5, 34.87477598494362 ], "wc_weaknesses_avg": [ 180.5, 195.4795385711763 ], "wc_questions_avg": [ 35.75, 38.18622133702155 ], "wc_review_avg": [ 337.5, 165.34584966064313 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.3333333333333333, "gs_citation": 25, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=499986354715790633&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 9, "aff_unique_index": "0;0;0;0;0", "aff_unique_norm": "National Taiwan University", "aff_unique_dep": "", "aff_unique_url": "https://www.ntu.edu.tw", "aff_unique_abbr": "NTU", "aff_campus_unique_index": "0;0;0;0;0", "aff_campus_unique": "Taiwan", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "China" }, { "id": "0IaTFNJner", "title": "On the Embedding Collapse When Scaling up Recommendation Models", "track": "main", "status": "Reject", "tldr": "", "abstract": "Recent advances in deep foundation models have led to a promising trend of developing large recommendation models to leverage vast amounts of available data. However, we experiment to scale up existing recommendation models and observe that the enlarged models do not improve satisfactorily. In this context, we investigate the embedding layers of enlarged models and identify a phenomenon of *embedding collapse*, which ultimately hinders scalability, wherein the embedding matrix tends to reside in a low-dimensional subspace. Through empirical and theoretical analysis, we demonstrate that the feature interaction module specific to recommendation models has a *two-sided effect*. On the one hand, the interaction restricts embedding learning when interacting with collapsed embeddings, exacerbating the collapse issue. On the other hand, feature interaction is crucial in mitigating the fitting of spurious features, thereby improving scalability. Based on this analysis, we propose a simple yet effective *multi-embedding* design incorporating embedding-set-specific interaction modules to capture diverse patterns and reduce collapse. 
Extensive experiments demonstrate that this proposed design provides consistent scalability for various recommendation models.", "keywords": "machine learning;representation learning;recommender system;collapse", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Xingzhuo Guo;Junwei Pan;Ximei Wang;Baixu Chen;Jie Jiang;Mingsheng Long", "authorids": "~Xingzhuo_Guo1;~Junwei_Pan1;~Ximei_Wang1;~Baixu_Chen2;~Jie_Jiang3;~Mingsheng_Long5", "gender": "M;M;M;M;M;M", "homepage": ";https://junwei-pan.github.io/;https://wxm17.github.io/;https://github.com/tsingcbx99;https://baike.baidu.com/item/%E8%92%8B%E6%9D%B0/58674740;http://ise.thss.tsinghua.edu.cn/~mlong", "dblp": ";210/6440;89/8876;279/4076;32/7018-15.html;74/9023", "google_scholar": "Cbinj9QAAAAJ;sUaBkFkAAAAJ;WmOCCVgAAAAJ;;;_MjXpXkAAAAJ", "orcid": ";0009-0003-2697-7012;;;0000-0001-9658-5127;0000-0002-5412-9120", "linkedin": ";;;;;", "or_profile": "~Xingzhuo_Guo1;~Junwei_Pan1;~Ximei_Wang1;~Baixu_Chen2;~jie_jiang3;~Mingsheng_Long2", "aff": "Tsinghua University;Tencent;Tencent;Tsinghua University;Tencent AI Lab;Tsinghua University", "aff_domain": "tsinghua.edu.cn;tencent.com;tencent.com;tsinghua.edu.cn;tencent.com;tsinghua.edu.cn", "position": "PhD student;Researcher;Researcher;MS student;VP;Associate Professor", "bibtex": "@misc{\nguo2024on,\ntitle={On the Embedding Collapse When Scaling up Recommendation Models},\nauthor={Xingzhuo Guo and Junwei Pan and Ximei Wang and Baixu Chen and Jie Jiang and Mingsheng Long},\nyear={2024},\nurl={https://openreview.net/forum?id=0IaTFNJner}\n}", "github": "", "project": "", "reviewers": "DK5H;JdNi;9BGA;eFdv", "site": "https://openreview.net/forum?id=0IaTFNJner", "pdf_size": 2016960, "rating": "5;5;5;6", "confidence": "4;3;4;3", "soundness": "3;3;2;3", "contribution": "3;1;2;2", "presentation": "3;2;3;3", "wc_summary": "132;46;118;166", "wc_strengths": "127;31;155;55", "wc_weaknesses": "140;107;171;180", "wc_questions": "67;46;8;36", "wc_review": "466;230;452;437", "wc_reply_reviewers": "0;0;0;16", "wc_reply_authors": "1019;1126;1191;1016", "reply_reviewers": "0;0;0;1", "reply_authors": "3;3;3;3", "rating_avg": [ 5.25, 0.4330127018922193 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 115.5, 43.75785643744447 ], "wc_strengths_avg": [ 92.0, 50.70502933634887 ], "wc_weaknesses_avg": [ 149.5, 28.674901917879335 ], "wc_questions_avg": [ 39.25, 21.22940178149163 ], "wc_review_avg": [ 396.25, 96.53075934643837 ], "wc_reply_reviewers_avg": [ 4.0, 6.928203230275509 ], "wc_reply_authors_avg": [ 1088.0, 74.15861379502721 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 3.0, 0.0 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 18, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14239355219505619999&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 9, "aff_unique_index": "0;1;1;0;1;0", "aff_unique_norm": "Tsinghua University;Tencent", "aff_unique_dep": ";Tencent Holdings Limited", "aff_unique_url": "https://www.tsinghua.edu.cn;https://www.tencent.com", "aff_unique_abbr": "THU;Tencent", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "China" }, { "id": "0JTwZ30qPH", "title": "Task-Oriented Multi-View 
Representation Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "Multi-view representation learning aims to learn a high-quality unified representation for an entity from its multiple observable views to facilitate the performance of downstream tasks. A typical multi-view representation learning framework consists of four main components: View-specific encoding, Single-view learning (SVL), Multi-view learning (MVL), and Fusion. Recent studies achieve promising performance by carefully designing SVL and MVL constraints, but almost all of them ignore the basic fact that \\textit{effective representations are different for different tasks, even for the same entity}. To bridge this gap, this work proposes a \\textbf{T}ask-\\textbf{O}riented \\textbf{M}ulti-\\textbf{V}iew \\textbf{R}epresentation \\textbf{L}earning (TOMRL) method, where the key idea is to modulate features in the View-specific encoding and Fusion modules according to the task guidance. To this end, we first design a gradient-based embedding strategy to flexibly represent multi-view tasks. After that, a meta-learner is trained to map the task embedding into a set of view-specific parameters and a view-shared parameter for modulation in the Encoding and Fusion modules, respectively. This whole process is formalized as a nested optimization problem and ultimately solved by a bi-level optimization scheme. Extensive experiments on four multi-view datasets validate that our TOMRL consistently improves the performance of most existing multi-view representation learning approaches.", "keywords": "Multi-view learning; Meta learning; Feature modulation; Task adaptation", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Ren Wang;Haoliang Sun;Yuxiu Lin;Yongshun Gong;Xiushan Nie;Yilong Yin", "authorids": "~Ren_Wang5;~Haoliang_Sun2;~Yuxiu_Lin1;~Yongshun_Gong1;~Xiushan_Nie1;~Yilong_Yin1", "gender": "M;M;F;M;M;M", "homepage": "https://time.sdu.edu.cn/info/1071/2586.htm;https://haolsun.github.io/;;https://faculty.sdu.edu.cn/gongyongshun/en/index.htm;http://niexsh.sdufe.edu.cn;https://faculty.sdu.edu.cn/ylyin", "dblp": "29/50-11;117/5673;275/7309;194/1824;03/8117;", "google_scholar": "hkHRff8AAAAJ;s5FAQ5wAAAAJ;;WIHqungAAAAJ;;", "orcid": "0000-0002-5877-5023;0000-0001-7715-5682;0000-0003-1809-0828;0000-0003-3948-4471;0000-0001-9644-9723;", "linkedin": ";haoliang-sun-357a5a11a;;;;", "or_profile": "~Ren_Wang5;~Haoliang_Sun2;~Yuxiu_Lin1;~Yongshun_Gong1;~Xiushan_Nie1;~Yilong_Yin1", "aff": "Shandong University;Shandong University;Shandong University of Finance and Economics;Shandong University;Shandong Jianzhu University;Shandong University", "aff_domain": "sdu.edu.cn;sdu.edu.cn;sdufe.edu.cn;sdu.edu.cn;sdjzu.edu.cn;sdu.edu.cn", "position": "PhD student;Associate Professor;PhD student;Full Professor;Full Professor;Full Professor", "bibtex": "@misc{\nwang2024taskoriented,\ntitle={Task-Oriented Multi-View Representation Learning},\nauthor={Ren Wang and Haoliang Sun and Yuxiu Lin and Yongshun Gong and Xiushan Nie and Yilong Yin},\nyear={2024},\nurl={https://openreview.net/forum?id=0JTwZ30qPH}\n}", "github": "", "project": "", "reviewers": "d8EV;caBF;aCu2;fqyn;V7F6", "site": "https://openreview.net/forum?id=0JTwZ30qPH", "pdf_size": 681589, "rating": "3;3;3;5;6", "confidence": "5;4;4;3;4", "soundness": "3;2;2;3;3", "contribution": "1;2;1;2;3", "presentation": "2;2;2;3;4", "wc_summary": "46;78;46;73;43", "wc_strengths": "6;68;35;68;30", 
"wc_weaknesses": "148;167;127;175;138", "wc_questions": "26;5;75;35;37", "wc_review": "226;318;283;351;248", "wc_reply_reviewers": "0;0;0;0;0", "wc_reply_authors": "617;631;0;556;223", "reply_reviewers": "0;0;0;0;0", "reply_authors": "1;1;0;1;1", "rating_avg": [ 4.0, 1.2649110640673518 ], "confidence_avg": [ 4.0, 0.6324555320336759 ], "soundness_avg": [ 2.6, 0.4898979485566356 ], "contribution_avg": [ 1.8, 0.7483314773547883 ], "presentation_avg": [ 2.6, 0.8 ], "wc_summary_avg": [ 57.2, 15.065191668213185 ], "wc_strengths_avg": [ 41.4, 23.829393613770367 ], "wc_weaknesses_avg": [ 151.0, 17.81010948871455 ], "wc_questions_avg": [ 35.6, 22.729716232280598 ], "wc_review_avg": [ 285.2, 45.384578878733684 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 405.4, 251.38384991880446 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0.8, 0.4 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.49999999999999994, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:D-bjX91-YE4J:scholar.google.com/&scioq=Task-Oriented+Multi-View+Representation+Learning&hl=en&as_sdt=0,48", "gs_version_total": 0, "aff_unique_index": "0;0;1;0;2;0", "aff_unique_norm": "Shandong University;Shandong University of Finance and Economics;Shandong Jianzhu University", "aff_unique_dep": ";;", "aff_unique_url": "http://www.sdu.edu.cn;http://www.sdufe.edu.cn;http://www.sdjzu.edu.cn", "aff_unique_abbr": "SDU;SDUFE;SDJU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "China" }, { "id": "0JWVWUlobv", "title": "4D Tensor Multi-task Continual Learning for Disease Dynamic Prediction", "track": "main", "status": "Reject", "tldr": "", "abstract": "Machine learning techniques for predicting Alzheimer's disease (AD) progression can substantially help researchers and clinicians establish strong AD preventive and treatment strategies. However, current research on AD prediction algorithms encounters challenges with monotonic data form, small dataset and scarcity of time-continuous data. To address all three of these problems at once, we propose a novel machine learning approach that implements the 4D tensor multi-task continual learning algorithm to predict AD progression by quantifying multi-dimensional information on brain structural variation and knowledge sharing between patients. To meet real-world application scenarios, the method can integrate knowledge from all available data as patient data increases to continuously update and optimise prediction results. To evaluate the performance of the proposed approach, we conducted extensive experiments utilising data from the Alzheimer's Disease Neuroimaging Initiative (ADNI). The results demonstrate that the proposed approach has superior accuracy and stability in predicting various cognitive scores of AD progression compared to single-task learning, benchmarks and state-of-the-art multi-task regression methods. 
The proposed approach identifies structural brain variations in patients and utilises it to accurately predict and diagnose AD progression from magnetic resonance imaging (MRI) data alone, and the performance of the model improves as the MRI data increases.", "keywords": "Alzheimer\u2019s disease progression;tensor multi-task learning;continual learning;amalgamated magnitude-direction quantification;brain structure variation", "primary_area": "applications to neuroscience & cognitive science", "supplementary_material": "/attachment/9181459918592259ae5a65200764a826cd796d12.zip", "author": "Yu Zhang;Xulong Wang;Vitaveska Lanfranchi;Po Yang", "authorids": "~Yu_Zhang46;~Xulong_Wang2;~Vitaveska_Lanfranchi1;~Po_Yang1", "gender": ";M;F;M", "homepage": ";https://www.sheffield.ac.uk/cs/people/research-staff/xulong-wang;;https://www.sheffield.ac.uk/dcs/people/academic/pyang/profile", "dblp": ";211/7318-1;15/6230;88/5343-1", "google_scholar": "4gEGS8gAAAAJ;-oNwqtgAAAAJ;BiF44ewAAAAJ;RdK3cwgAAAAJ", "orcid": ";0000-0002-7385-4926;;0000-0002-6604-4298", "linkedin": ";;;po-yang-83a03043/", "or_profile": "~Yu_Zhang46;~Xulong_Wang2;~Vitaveska_Lanfranchi1;~Po_Yang1", "aff": "University of Sheffield;University of Sheffield;University of Sheffield;University of Sheffield", "aff_domain": "sheffield.ac.uk;shef.ac.uk;sheffield.ac.uk;sheffield.ac.uk", "position": "PhD student;PhD student;Full Professor;Associate Professor", "bibtex": "@misc{\nzhang2024d,\ntitle={4D Tensor Multi-task Continual Learning for Disease Dynamic Prediction},\nauthor={Yu Zhang and Xulong Wang and Vitaveska Lanfranchi and Po Yang},\nyear={2024},\nurl={https://openreview.net/forum?id=0JWVWUlobv}\n}", "github": "", "project": "", "reviewers": "ZWzC;6zjs;Zsj5;vwzZ", "site": "https://openreview.net/forum?id=0JWVWUlobv", "pdf_size": 5511212, "rating": "5;5;5;6", "confidence": "2;4;4;4", "soundness": "3;2;3;2", "contribution": "2;2;2;3", "presentation": "1;2;2;2", "wc_summary": "81;93;27;92", "wc_strengths": "18;10;23;58", "wc_weaknesses": "93;192;265;216", "wc_questions": "90;2;270;78", "wc_review": "282;297;585;444", "wc_reply_reviewers": "0;92;1060;187", "wc_reply_authors": "424;742;1652;748", "reply_reviewers": "0;1;2;2", "reply_authors": "1;1;4;4", "rating_avg": [ 5.25, 0.4330127018922193 ], "confidence_avg": [ 3.5, 0.8660254037844386 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 1.75, 0.4330127018922193 ], "wc_summary_avg": [ 73.25, 27.11434122378783 ], "wc_strengths_avg": [ 27.25, 18.34904629674251 ], "wc_weaknesses_avg": [ 191.5, 62.659795722616266 ], "wc_questions_avg": [ 110.0, 98.34632682515398 ], "wc_review_avg": [ 402.0, 123.16452411307405 ], "wc_reply_reviewers_avg": [ 334.75, 423.9111787863113 ], "wc_reply_authors_avg": [ 891.5, 458.2191069783101 ], "reply_reviewers_avg": [ 1.25, 0.82915619758885 ], "reply_authors_avg": [ 2.5, 1.5 ], "replies_avg": [ 22, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.3333333333333333, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:D1R4C8RTFFwJ:scholar.google.com/&scioq=4D+Tensor+Multi-task+Continual+Learning+for+Disease+Dynamic+Prediction&hl=en&as_sdt=0,48", "gs_version_total": 0, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "University of Sheffield", "aff_unique_dep": "", "aff_unique_url": "https://www.sheffield.ac.uk", "aff_unique_abbr": "Sheffield", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United Kingdom" }, 
{ "id": "0JnaN0Crlz", "title": "Enhancing Adversarial Robustness on Categorical Data via Attribution Smoothing", "track": "main", "status": "Reject", "tldr": "", "abstract": "Many efforts have been contributed to alleviate the adversarial risk of deep neural networks on continuous inputs.\nAdversarial robustness on general categorical inputs, especially tabular categorical attributes, has received much less attention. To echo this challenge, our work aims to enhance the robustness of classification over categorical attributes against adversarial perturbations. We establish an information-theoretic upper bound on the expected adversarial risk. Based on it,\nwe propose an adversarially robust learning method, named Integrated Gradient-Smoothed Gradient (IGSG)-based regularization. It is designed to smooth the attributional sensitivity of each feature and the decision boundary of the classifier to achieve lower adversarial risk, i.e., desensitizing the categorical attributes in the classifier. We conduct an extensive empirical study over categorical datasets of various application domains. The experimental results confirm the effectiveness of IGSG, which surpasses the state-of-the-art robust training methods by a margin of approximately 0.4\\% to 12.2\\% on average in terms of adversarial accuracy, especially on high-dimension datasets.", "keywords": "Adversarial Robustness;Categorical Data;Attribution Smoothing;Information Theory", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/506e78e21660053fe2a0625a76f2b36263fd14fc.pdf", "author": "Yujun Zhou;Yufei Han;Hongyan Bao;Xiangliang Zhang", "authorids": "~Yujun_Zhou1;~Yufei_Han1;~Hongyan_Bao1;~Xiangliang_Zhang1", "gender": "M;M;;F", "homepage": "https://yujunzhou.github.io/;;https://mine.kaust.edu.sa/Pages/Hongyan.aspx;https://sites.nd.edu/xiangliang-zhang/", "dblp": "162/3265-2;74/2507;234/6902;74/1890-1", "google_scholar": "t0c7rQQAAAAJ;xdCvBg0AAAAJ;;BhRJe4wAAAAJ", "orcid": "0000-0003-1376-5187;;;0000-0002-3574-5665", "linkedin": "yujun-zhou-zyj/;;;", "or_profile": "~Yujun_Zhou1;~Yufei_Han1;~Hongyan_Bao1;~Xiangliang_Zhang1", "aff": "University of Notre Dame;INRIA;KAUST;University of Notre Dame", "aff_domain": "nd.edu;inria.fr;kaust.edu.sa;nd.edu", "position": "PhD student;Researcher;PhD student;Associate Professor", "bibtex": "@misc{\nzhou2024enhancing,\ntitle={Enhancing Adversarial Robustness on Categorical Data via Attribution Smoothing},\nauthor={Yujun Zhou and Yufei Han and Hongyan Bao and Xiangliang Zhang},\nyear={2024},\nurl={https://openreview.net/forum?id=0JnaN0Crlz}\n}", "github": "", "project": "", "reviewers": "oxAy;KxJ6;eEhS;rFyD;Bx5T;iddk", "site": "https://openreview.net/forum?id=0JnaN0Crlz", "pdf_size": 1463516, "rating": "3;5;5;6;6;6", "confidence": "4;4;4;3;2;4", "soundness": "2;2;2;3;3;3", "contribution": "2;2;2;3;3;3", "presentation": "1;2;3;3;3;3", "wc_summary": "15;20;60;95;31;145", "wc_strengths": "34;9;97;24;40;41", "wc_weaknesses": "119;170;159;15;8;143", "wc_questions": "44;2;30;47;188;1", "wc_review": "212;201;346;181;267;330", "wc_reply_reviewers": "0;0;0;11;0;0", "wc_reply_authors": "1707;1002;1917;706;869;718", "reply_reviewers": "0;0;0;1;0;0", "reply_authors": "7;4;4;4;6;3", "rating_avg": [ 5.166666666666667, 1.0671873729054746 ], "confidence_avg": [ 3.5, 0.7637626158259734 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.5, 0.7637626158259734 ], "wc_summary_avg": [ 61.0, 46.38606112472438 ], 
"wc_strengths_avg": [ 40.833333333333336, 27.382577591518945 ], "wc_weaknesses_avg": [ 102.33333333333333, 66.14042300708059 ], "wc_questions_avg": [ 52.0, 63.46915261237803 ], "wc_review_avg": [ 256.1666666666667, 63.61712732345661 ], "wc_reply_reviewers_avg": [ 1.8333333333333333, 4.099457958749614 ], "wc_reply_authors_avg": [ 1153.1666666666667, 480.1220041706992 ], "reply_reviewers_avg": [ 0.16666666666666666, 0.372677996249965 ], "reply_authors_avg": [ 4.666666666666667, 1.3743685418725535 ], "replies_avg": [ 40, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.5111986324432478, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:IAeeVQInNRYJ:scholar.google.com/&scioq=Enhancing+Adversarial+Robustness+on+Categorical+Data+via+Attribution+Smoothing&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1;2;0", "aff_unique_norm": "University of Notre Dame;INRIA;King Abdullah University of Science and Technology", "aff_unique_dep": ";;", "aff_unique_url": "https://www.nd.edu;https://www.inria.fr;https://www.kaust.edu.sa", "aff_unique_abbr": "Notre Dame;INRIA;KAUST", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;2;0", "aff_country_unique": "United States;France;Saudi Arabia" }, { "title": "From Latent Graph to Latent Topology Inference: Differentiable Cell Complex Module", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19619", "id": "0JsRZEGZ7L", "author_site": "Claudio Battiloro, Indro Spinelli, Lev Telyatinkov, Michael Bronstein, Simone Scardapane, Paolo Di Lorenzo", "tldr": "", "abstract": "Latent Graph Inference (LGI) relaxed the reliance of Graph Neural Networks (GNNs) on a given graph topology by dynamically learning it. However, most of LGI methods assume to have a (noisy, incomplete, improvable, ...) input graph to rewire and can solely learn regular graph topologies. In the wake of the success of Topological Deep Learning (TDL), we study Latent Topology Inference (LTI) for learning higher-order cell complexes (with sparse and not regular topology) describing multi-way interactions between data points. To this aim, we introduce the Differentiable Cell Complex Module (DCM), a novel learnable function that computes cell probabilities in the complex to improve the downstream task. We show how to integrate DCM with cell complex message-passing networks layers and train it in an end-to-end fashion, thanks to a two-step inference procedure that avoids an exhaustive search across all possible cells in the input, thus maintaining scalability. Our model is tested on several homophilic and heterophilic graph datasets and it is shown to outperform other state-of-the-art techniques, offering significant improvements especially in cases where an input graph is not provided.", "keywords": "Topological Deep Learning;Geometric Deep Learning;Latent Topology Inference;Latent Graph Inference;Cell Complexes", "primary_area": "learning on graphs and other geometries & topologies", "supplementary_material": "", "author": "Claudio Battiloro;Indro Spinelli;Lev Telyatnikov;Michael M. 
Bronstein;Simone Scardapane;Paolo Di Lorenzo", "authorids": "~Claudio_Battiloro1;~Indro_Spinelli1;~Lev_Telyatnikov1;~Michael_M._Bronstein1;~Simone_Scardapane1;~Paolo_Di_Lorenzo1", "gender": "M;M;M;M;M;M", "homepage": ";;;http://www.inf.usi.ch/bronstein/;http://ispac.diet.uniroma1.it/scardapane/;https://sites.google.com/site/paolodilorenzohp/", "dblp": "243/6640;241/5134;;07/2668;144/2184;42/9879", "google_scholar": "_J11o_IAAAAJ;0glmB_UAAAAJ;MzFz-tcAAAAJ;UU3N6-UAAAAJ;https://scholar.google.it/citations?user=aSuosYoAAAAJ;https://scholar.google.it/citations?user=VZYvspQAAAAJ", "orcid": ";0000-0003-1963-3548;;;0000-0003-0881-8344;", "linkedin": "claudio-battiloro-b4390b175;;;mbronstein/;simonescardapane;", "or_profile": "~Claudio_Battiloro1;~Indro_Spinelli1;~Lev_Telyatnikov1;~Michael_M._Bronstein1;~Simone_Scardapane1;~Paolo_Di_Lorenzo1", "aff": "University of Roma \"La Sapienza\";Sapienza University of Rome;University of Roma \"La Sapienza\";University of Oxford;Sapienza University of Rome;University of Roma \"La Sapienza\"", "aff_domain": "uniroma1.it;uniroma1.it;uniroma1.it;ox.ac.uk;uniroma1.it;uniroma1.it", "position": "PhD student;Assistant Professor;PhD student;Full Professor;Assistant Professor;Associate Professor", "bibtex": "@inproceedings{\nbattiloro2024from,\ntitle={From Latent Graph to Latent Topology Inference: Differentiable Cell Complex Module},\nauthor={Claudio Battiloro and Indro Spinelli and Lev Telyatnikov and Michael M. Bronstein and Simone Scardapane and Paolo Di Lorenzo},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=0JsRZEGZ7L}\n}", "github": "", "project": "", "reviewers": "EucF;XizW;ims6", "pdf_size": 2416075, "rating": "8;8;8", "confidence": "4;3;2", "soundness": "3;4;2", "contribution": "3;3;3", "presentation": "2;3;3", "wc_summary": "88;191;64", "wc_strengths": "57;68;42", "wc_weaknesses": "90;54;9", "wc_questions": "186;105;11", "wc_review": "421;418;126", "wc_reply_reviewers": "32;37;0", "wc_reply_authors": "766;807;646", "reply_reviewers": "1;1;0", "reply_authors": "1;1;1", "rating_avg": [ 8.0, 0.0 ], "confidence_avg": [ 3.0, 0.816496580927726 ], "soundness_avg": [ 3.0, 0.816496580927726 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 114.33333333333333, 55.089825638577665 ], "wc_strengths_avg": [ 55.666666666666664, 10.656244908763853 ], "wc_weaknesses_avg": [ 51.0, 33.13608305156178 ], "wc_questions_avg": [ 100.66666666666667, 71.50912917631955 ], "wc_review_avg": [ 321.6666666666667, 138.36264749643317 ], "wc_reply_reviewers_avg": [ 23.0, 16.391054470858997 ], "wc_reply_authors_avg": [ 739.6666666666666, 68.31463158715627 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 20, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14758672841525436027&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 7, "openreview": "https://openreview.net/forum?id=0JsRZEGZ7L", "pdf": "https://openreview.net/pdf?id=0JsRZEGZ7L", "email": "uniroma1.it;uniroma1.it;uniroma1.it;ox.ac.uk;uniroma1.it;uniroma1.it", "author_num": 6, "aff_unique_index": "0;1;0;2;1;0", "aff_unique_norm": "University of Rome La Sapienza;Sapienza University of Rome;University of Oxford", "aff_unique_dep": ";;", "aff_unique_url": 
"https://www.uniroma1.it;https://www.uniroma1.it;https://www.ox.ac.uk", "aff_unique_abbr": "La Sapienza;Sapienza;Oxford", "aff_campus_unique_index": "0;0;0;0;0", "aff_campus_unique": "Rome;", "aff_country_unique_index": "0;0;0;1;0;0", "aff_country_unique": "Italy;United Kingdom" }, { "id": "0KVkTDB6KZ", "title": "EFFL: Egalitarian Fairness in Federated Learning for Mitigating Matthew Effect", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Recent advances in federated learning (FL) enable collaborative training of machine learning (ML) models from large-scale and widely dispersed clients while protecting their privacy. However, when different clients' datasets are heterogeneous, traditional FL mechanisms produce a global model that does not adequately represent the poorer clients with limited data resources, resulting in lower accuracy and higher bias on their local data. According to the Matthew effect, which describes how the advantaged gain more advantage and the disadvantaged lose more over time, deploying such a global model in client applications may worsen the resource disparity among the clients and harm the principles of social welfare and fairness. To mitigate the Matthew effect, we propose Egalitarian Fairness Federated Learning (EFFL), where egalitarian fairness refers to the global model learned from FL has: (1) equal accuracy among clients; (2) equal decision bias among clients. Besides achieving egalitarian fairness among the clients, EFFL also aims for performance optimality, minimizing the empirical risk loss and the bias for each client; both are essential for any ML model training, whether centralized or decentralized. We formulate EFFL as a multi-constrained multi-objectives optimization (MCMOO) problem, with the decision bias and egalitarian fairness as constraints and the minimization of the empirical risk losses on all clients as multiple objectives to be optimized. We propose a gradient-based three-stage algorithm to obtain the Pareto optimal solutions within the constraint space. 
Extensive experiments demonstrate that EFFL outperforms other state-of-the-art FL algorithms in achieving a high-performance global model with enhanced egalitarian fairness among all clients.", "keywords": "Egalitarian Fairness;Federated Learning;AI Ethics", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/ccf13bad6278e0703c22b8b7c0ac0c638ad97767.zip", "author": "Jiashi Gao;Changwu Huang;Ming Tang;Shin Hwei Tan;Xin Yao;Xuetao Wei", "authorids": "~Jiashi_Gao1;~Changwu_Huang1;~Ming_Tang5;~Shin_Hwei_Tan1;~Xin_Yao1;~Xuetao_Wei2", "gender": "F;M;F;F;;M", "homepage": ";;http://mingtang.site;https://www.shinhwei.com/;http://www.cs.bham.ac.uk/~xin;https://cse.sustech.edu.cn/faculty/~weixt/", "dblp": "221/1810;227/6536;73/4373-6;16/9656;;09/5916", "google_scholar": ";https://scholar.google.fr/citations?user=QRnmYfkAAAAJ;4v9UxPYAAAAJ;1eFjFs8AAAAJ;;8fNwEScAAAAJ", "orcid": ";;0000-0003-4732-5155;;;0000-0002-4450-2251", "linkedin": ";;;;;", "or_profile": "~Jiashi_Gao1;~Changwu_Huang1;~Ming_Tang5;~Shin_Hwei_Tan1;~Xin_Yao1;~Xuetao_Wei2", "aff": "Southern University of Science and Technology;;Southern University of Science and Technology;Concordia University;;Southern University of Science and Technology", "aff_domain": "sustech.edu.cn;;sustech.edu.cn;concordia.ca;;sustech.edu.cn", "position": "PhD student;;Associate Professor;Associate Professor;;Associate Professor", "bibtex": "@misc{\ngao2024effl,\ntitle={{EFFL}: Egalitarian Fairness in Federated Learning for Mitigating Matthew Effect},\nauthor={Jiashi Gao and Changwu Huang and Ming Tang and Shin Hwei Tan and Xin Yao and Xuetao Wei},\nyear={2024},\nurl={https://openreview.net/forum?id=0KVkTDB6KZ}\n}", "github": "", "project": "", "reviewers": "YyVq;ta1u;hFqL;Raor", "site": "https://openreview.net/forum?id=0KVkTDB6KZ", "pdf_size": 725166, "rating": "3;5;6;8", "confidence": "3;4;2;4", "soundness": "2;2;2;3", "contribution": "2;2;3;3", "presentation": "2;2;2;2", "wc_summary": "39;74;102;134", "wc_strengths": "22;30;32;66", "wc_weaknesses": "159;122;330;193", "wc_questions": "48;194;3;8", "wc_review": "268;420;467;401", "wc_reply_reviewers": "0;13;70;0", "wc_reply_authors": "805;887;763;727", "reply_reviewers": "0;1;1;0", "reply_authors": "2;2;2;2", "rating_avg": [ 5.5, 1.8027756377319946 ], "confidence_avg": [ 3.25, 0.82915619758885 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.0, 0.0 ], "wc_summary_avg": [ 87.25, 35.02409884636577 ], "wc_strengths_avg": [ 37.5, 16.874537030686206 ], "wc_weaknesses_avg": [ 201.0, 78.5970737368765 ], "wc_questions_avg": [ 63.25, 77.47701271990293 ], "wc_review_avg": [ 389.0, 73.87489424696322 ], "wc_reply_reviewers_avg": [ 20.75, 28.925550988702014 ], "wc_reply_authors_avg": [ 795.5, 59.60494945891658 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 2.0, 0.0 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.25087260300212727, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11222063921364090985&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 0, "aff_unique_index": "0;0;1;0", "aff_unique_norm": "Southern University of Science and Technology;Concordia University", "aff_unique_dep": ";", "aff_unique_url": "https://www.sustech.edu.cn;https://www.concordia.ca", "aff_unique_abbr": "SUSTech;Concordia", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;1;0", "aff_country_unique": 
"China;Canada" }, { "id": "0Lqyut1y7M", "title": "On the Optimality of Activations in Implicit Neural Representations", "track": "main", "status": "Reject", "tldr": "", "abstract": "Implicit neural representations (INRs) have recently surged in popularity as a class of neural networks capable of encoding signals as compact, differentiable entities. To capture high-frequency content, INRs often employ techniques such as Fourier positional encodings or non-traditional activation functions like Gaussian, sinusoid, or wavelets. Despite the impressive results achieved with these activations, there has been limited exploration of their properties within a unified theoretical framework. To address this gap, we conduct a comprehensive analysis of these activations from the perspective of sampling theory. Our investigation reveals that, particularly in the context of shallow INRs, sinc activations\u2014previously unused in conjunction with INRs\u2014are theoretically optimal for signal encoding. Additionally, we establish a connection between dynamical systems and INRs and leverage sampling theory to bridge these two paradigms. Notably, we showcase how the implicit architectural regularization inherent to INRs allows for their application in modeling such systems with minimal need for explicit regularizations.", "keywords": "Implicit Neural Representations;Sampling theory", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/ab32a73c3f93974763b7e3d1f0236f2d1247945c.pdf", "author": "Sameera Ramasinghe;Hemanth Saratchandran;Violetta Shevchenko;Alexander Long;Simon Lucey", "authorids": "~Sameera_Ramasinghe1;~Hemanth_Saratchandran1;~Violetta_Shevchenko1;~Alexander_Long1;~Simon_Lucey2", "gender": "M;;F;M;M", "homepage": ";;;https://github.com/AlexanderJLong;https://www.adelaide.edu.au/directory/simon.lucey", "dblp": "181/4514;;231/1762;156/9630;01/3542", "google_scholar": "https://scholar.google.com.au/citations?user=-j0m9aMAAAAJ;;aWqA0BIAAAAJ;;vmAe35UAAAAJ", "orcid": ";;;;", "linkedin": ";;violetta-shevchenko-12b62714a/;;", "or_profile": "~Sameera_Ramasinghe1;~Hemanth_Saratchandran1;~Violetta_Shevchenko1;~Alexander_Long1;~Simon_Lucey2", "aff": "Amazon;;Amazon;Amazon;University of Adelaide", "aff_domain": "amazon.com;;amazon.com;amazon.com;adelaide.edu.au", "position": "Researcher;;Researcher;Researcher;Full Professor", "bibtex": "@misc{\nramasinghe2024on,\ntitle={On the Optimality of Activations in Implicit Neural Representations},\nauthor={Sameera Ramasinghe and Hemanth Saratchandran and Violetta Shevchenko and Alexander Long and Simon Lucey},\nyear={2024},\nurl={https://openreview.net/forum?id=0Lqyut1y7M}\n}", "github": "", "project": "", "reviewers": "REJk;8ETH;hcEo;9zZJ", "site": "https://openreview.net/forum?id=0Lqyut1y7M", "pdf_size": 40474055, "rating": "5;6;6;6", "confidence": "4;3;4;4", "soundness": "3;3;4;3", "contribution": "3;4;3;3", "presentation": "2;2;3;4", "wc_summary": "103;120;114;95", "wc_strengths": "76;41;77;98", "wc_weaknesses": "500;257;182;119", "wc_questions": "90;241;42;136", "wc_review": "769;659;415;448", "wc_reply_reviewers": "74;69;261;58", "wc_reply_authors": "1237;1244;967;936", "reply_reviewers": "1;1;1;1", "reply_authors": "4;2;2;2", "rating_avg": [ 5.75, 0.4330127018922193 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 3.25, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.82915619758885 ], 
"wc_summary_avg": [ 108.0, 9.669539802906858 ], "wc_strengths_avg": [ 73.0, 20.457272545478784 ], "wc_weaknesses_avg": [ 264.5, 144.475776516342 ], "wc_questions_avg": [ 127.25, 73.60494208950918 ], "wc_review_avg": [ 572.75, 146.97002245356023 ], "wc_reply_reviewers_avg": [ 115.5, 84.20362224987711 ], "wc_reply_authors_avg": [ 1096.0, 144.9361928574088 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 2.5, 0.8660254037844386 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.3333333333333333, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:wcXPF73uX7EJ:scholar.google.com/&scioq=On+the+Optimality+of+Activations+in+Implicit+Neural+Representations&hl=en&as_sdt=0,44", "gs_version_total": 0, "aff_unique_index": "0;0;0;1", "aff_unique_norm": "Amazon;University of Adelaide", "aff_unique_dep": "Amazon.com, Inc.;", "aff_unique_url": "https://www.amazon.com;https://www.adelaide.edu.au", "aff_unique_abbr": "Amazon;Adelaide", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;1", "aff_country_unique": "United States;Australia" }, { "id": "0NruoU6s5Z", "title": "CompoDiff: Versatile Composed Image Retrieval With Latent Diffusion", "track": "main", "status": "Reject", "tldr": "", "abstract": "This paper proposes a novel diffusion-based model, CompoDiff, for solving Composed Image Retrieval (CIR) with latent diffusion and presents a newly created dataset, named SynthTriplets18M, of 18 million reference images, conditions, and corresponding target image triplets to train the model. CompoDiff and SynthTriplets18M tackle the shortages of the previous CIR approaches, such as poor generalizability due to the small dataset scale and the limited types of conditions. CompoDiff not only achieves a new zero-shot state-of-the-art on four CIR benchmarks, including FashionIQ, CIRR, CIRCO, and GeneCIS, but also enables a more versatile and controllable CIR by accepting various conditions, such as negative text and image mask conditions, and the controllability to the importance between multiple queries or the trade-off between inference speed and the performance which are unavailable with existing CIR methods. 
The code and dataset samples are available at Supplementary Materials.", "keywords": "Composed Image Retrieval;Diffusion Models", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/170316c35b69a427d9cda3e6429b12e1c9cdd3a6.zip", "author": "Geonmo Gu;Sanghyuk Chun;Wonjae Kim;HeeJae Jun;Yoohoon Kang;Sangdoo Yun", "authorids": "~Geonmo_Gu1;~Sanghyuk_Chun1;~Wonjae_Kim1;~HeeJae_Jun1;~Yoohoon_Kang1;~Sangdoo_Yun1", "gender": "M;M;M;M;M;M", "homepage": ";https://sanghyukchun.github.io/home/;https://wonjae.kim;;;https://sangdooyun.github.io/", "dblp": "164/5694;213/1095.html;158/3433;238/0444;71/6597;124/3009.html", "google_scholar": "https://scholar.google.co.kr/citations?view_op=list_works;https://scholar.google.co.kr/citations?user=4_uj0xcAAAAJ;https://scholar.google.co.kr/citations?user=UpZ41EwAAAAJ;;;o0qtjzYAAAAJ", "orcid": "0009-0001-5071-0997;0000-0002-4533-2610;0000-0002-6616-7685;;;", "linkedin": "geonmo-gu-0008b013b/;https://kr.linkedin.com/in/sanghyukchun/en;;;;", "or_profile": "~Geonmo_Gu1;~Sanghyuk_Chun1;~Wonjae_Kim1;~HeeJae_Jun1;~Yoohoon_Kang1;~Sangdoo_Yun1", "aff": "NAVER;NAVER AI Lab;NAVER;NAVER;NAVER;NAVER", "aff_domain": "navercorp.com;navercorp.com;navercorp.com;navercorp.com;navercorp.com;navercorp.com", "position": "Researcher;Lead research scientist;Research Scientist;Researcher;Researcher;Research Scientist", "bibtex": "@misc{\ngu2024compodiff,\ntitle={CompoDiff: Versatile Composed Image Retrieval With Latent Diffusion},\nauthor={Geonmo Gu and Sanghyuk Chun and Wonjae Kim and HeeJae Jun and Yoohoon Kang and Sangdoo Yun},\nyear={2024},\nurl={https://openreview.net/forum?id=0NruoU6s5Z}\n}", "github": "", "project": "", "reviewers": "e76K;FhVu;AJF4;wkZo", "site": "https://openreview.net/forum?id=0NruoU6s5Z", "pdf_size": 6435297, "rating": "5;5;5;6", "confidence": "5;3;2;4", "soundness": "4;3;2;3", "contribution": "3;2;2;2", "presentation": "4;2;3;2", "wc_summary": "84;80;47;56", "wc_strengths": "82;81;109;50", "wc_weaknesses": "264;111;149;157", "wc_questions": "177;65;9;41", "wc_review": "607;337;314;304", "wc_reply_reviewers": "0;113;118;0", "wc_reply_authors": "1636;1550;1222;1145", "reply_reviewers": "0;1;1;0", "reply_authors": "4;4;4;4", "rating_avg": [ 5.25, 0.4330127018922193 ], "confidence_avg": [ 3.5, 1.118033988749895 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.82915619758885 ], "wc_summary_avg": [ 66.75, 15.642490210960657 ], "wc_strengths_avg": [ 80.5, 20.886598574205422 ], "wc_weaknesses_avg": [ 170.25, 56.847933119859334 ], "wc_questions_avg": [ 73.0, 63.245553203367585 ], "wc_review_avg": [ 390.5, 125.56771081770982 ], "wc_reply_reviewers_avg": [ 57.75, 57.777049941996864 ], "wc_reply_authors_avg": [ 1388.25, 208.77784245460532 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 4.0, 0.0 ], "replies_avg": [ 26, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.2581988897471611, "gs_citation": 66, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12308069164153977775&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 7, "aff_unique_index": "0;0;0;0;0;0", "aff_unique_norm": "NAVER Corporation", "aff_unique_dep": "", "aff_unique_url": "https://www.naver.com", "aff_unique_abbr": "NAVER", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "South Korea" }, { "title": "Making LLaMA SEE and Draw with 
SEED Tokenizer", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19618", "id": "0Nui91LBQS", "author_site": "Yuying Ge, Sijie Zhao, Ziyun Zeng, Yixiao Ge, Chen Li, Xintao Wang, Ying Shan", "tldr": "", "abstract": "The great success of Large Language Models (LLMs) has expanded the potential of multimodality, contributing to the gradual evolution of General Artificial Intelligence (AGI). A true AGI agent should not only possess the capability to perform predefined multi-tasks but also exhibit emergent abilities in an open-world context. However, despite the considerable advancements made by recent multimodal LLMs, they still fall short in effectively unifying comprehension and generation tasks, let alone open-world emergent abilities. We contend that the key to overcoming the present impasse lies in enabling text and images to be represented and processed interchangeably within a unified autoregressive Transformer. To this end, we introduce $\\textbf{SEED}$, an elaborate image tokenizer that empowers LLMs with the ability to $\\textbf{SEE}$ and $\\textbf{D}$raw at the same time. We identify two crucial design principles: (1) Image tokens should be independent of 2D physical patch positions and instead be produced with a $\\textit{1D causal dependency}$, exhibiting intrinsic interdependence that aligns with the left-to-right autoregressive prediction mechanism in LLMs. (2) Image tokens should capture $\\textit{high-level semantics}$ consistent with the degree of semantic abstraction in words, and be optimized for both discriminativeness and reconstruction during the tokenizer training phase. With SEED tokens, LLM is able to perform scalable multimodal autoregression under its original training recipe, i.e., next-word prediction. SEED-LLaMA is therefore produced by large-scale pretraining and instruction tuning on the interleaved textual and visual data, demonstrating impressive performance on a broad range of multimodal comprehension and generation tasks. More importantly, SEED-LLaMA has exhibited compositional emergent abilities such as multi-turn in-context multimodal generation, acting like your AI assistant. 
The code (training and inference) and models are released in https://github.com/AILab-CVC/SEED.", "keywords": "Multimodal Large Language Model;Discrete Visual Tokenizer", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Yuying Ge;Sijie Zhao;Ziyun Zeng;Yixiao Ge;Chen Li;Xintao Wang;Ying Shan", "authorids": "~Yuying_Ge2;~Sijie_Zhao2;~Ziyun_Zeng1;~Yixiao_Ge2;~Chen_Li34;~Xintao_Wang1;~Ying_Shan2", "gender": "F;M;M;F;Not Specified;;M", "homepage": "https://geyuying.github.io/;https://sijeh.github.io/;https://stdkonjac.icu/;https://geyixiao.com/;https://scholar.google.com/citations?user=5fU_DtEAAAAJ&hl=en;;", "dblp": "223/4673;300/5422;282/8373.html;228/6649;164/3294-46.html;;68/5910", "google_scholar": "hv1LiiEAAAAJ;tZ3dS3MAAAAJ;RuanZLEAAAAJ;TtU74NAAAAAJ;5fU_DtEAAAAJ;;4oXBp9UAAAAJ", "orcid": ";;;;;;0000-0001-7673-8325", "linkedin": ";;;;;;YingShanProfile/", "or_profile": "~Yuying_Ge2;~Sijie_Zhao2;~Ziyun_Zeng1;~Yixiao_Ge2;~Chen_Li34;~Xintao_Wang1;~Ying_Shan2", "aff": "Tencent AI Lab;Tencent AI Lab;Tsinghua University;Tencent;Tencent ARC Lab;;Tencent PCG ARC Lab", "aff_domain": "tencent.com;tencent.com;tsinghua.edu.cn;tencent.com;tencent.com;;arc.tencent.com", "position": "Researcher;Researcher;MS student;Researcher;Researcher;;Director", "bibtex": "@inproceedings{\nge2024making,\ntitle={Making {LL}a{MA} {SEE} and Draw with {SEED} Tokenizer},\nauthor={Yuying Ge and Sijie Zhao and Ziyun Zeng and Yixiao Ge and Chen Li and Xintao Wang and Ying Shan},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=0Nui91LBQS}\n}", "github": "", "project": "", "reviewers": "y9Sh;i2L6;TFPg", "pdf_size": 25208002, "rating": "5;6;8", "confidence": "3;5;4", "soundness": "3;2;3", "contribution": "3;2;3", "presentation": "2;3;3", "wc_summary": "82;59;89", "wc_strengths": "27;28;115", "wc_weaknesses": "240;150;361", "wc_questions": "3;2;125", "wc_review": "352;239;690", "wc_reply_reviewers": "0;23;696", "wc_reply_authors": "1626;706;1495", "reply_reviewers": "0;1;2", "reply_authors": "4;1;2", "rating_avg": [ 6.333333333333333, 1.247219128924647 ], "confidence_avg": [ 4.0, 0.816496580927726 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 76.66666666666667, 12.81492185782739 ], "wc_strengths_avg": [ 56.666666666666664, 41.24991582482994 ], "wc_weaknesses_avg": [ 250.33333333333334, 86.44972848746 ], "wc_questions_avg": [ 43.333333333333336, 57.74849685393455 ], "wc_review_avg": [ 427.0, 191.60549748550187 ], "wc_reply_reviewers_avg": [ 239.66666666666666, 322.8129833544838 ], "wc_reply_authors_avg": [ 1275.6666666666667, 406.34987661155037 ], "reply_reviewers_avg": [ 1.0, 0.816496580927726 ], "reply_authors_avg": [ 2.3333333333333335, 1.247219128924647 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": 0.3273268353539886, "gs_citation": 116, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14781111967367961466&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=0Nui91LBQS", "pdf": "https://openreview.net/pdf?id=0Nui91LBQS", "email": "tencent.com;tencent.com;tsinghua.edu.cn;tencent.com;tencent.com;;arc.tencent.com", "author_num": 7, "aff_unique_index": "0;0;1;0;0;0", "aff_unique_norm": 
"Tencent;Tsinghua University", "aff_unique_dep": "Tencent AI Lab;", "aff_unique_url": "https://ai.tencent.com;https://www.tsinghua.edu.cn", "aff_unique_abbr": "Tencent AI Lab;THU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "China" }, { "id": "0P12CqfvUU", "title": "3D Morphable Master Face Generation: Towards Controllable Wolf Attacks against 2D and 3D Face Recognition Systems", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Biometric authentication systems are facing increasing threats from Artificial Intelligence-Generated Content (AIGC). Previous research has revealed the vulnerability of face authentication systems against master face attacks. These attacks utilize generative models to create facial samples capable of matching multiple registered user templates in the database. In this paper, we present a systematic approach for generating master faces that can compromise both 2D and 3D face recognition systems. Notably, our approach is the first to enable morphable and controllable master face attacks on face authentication systems.\n\nOur method generates these 3D master faces using the Latent Variable Evolution (LVE) algorithm with the 3D Face Morphable Model (3DMM). Through comprehensive simulations of simultaneous master face attacks in both white-box, gray-box, and black-box scenarios, we demonstrate the significant threat posed by these 3D master faces to mainstream face authentication systems. Furthermore, we explore the realms of face morphing and facial reenactment in our generated samples, enhancing the efficacy of the master face attack. Compared to existing methods, our approach exhibits superior attack success rates and advanced flexibility, highlighting the importance of defending against master face attacks.", "keywords": "Master Attack;Wolf Attack;3D Morphable Face Model", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/13e766c2aa4be2f94bdd89e55e7c67c3acf0355a.zip", "author": "Siyun Liang;Huy H. Nguyen;Junichi Yamagishi;Isao Echizen", "authorids": "~Siyun_Liang1;~Huy_H._Nguyen1;~Junichi_Yamagishi1;~Isao_Echizen1", "gender": "F;;M;", "homepage": "https://siyun-liang.github.io/;;https://researchmap.jp/read0205283?lang=en;", "dblp": ";;87/3979;", "google_scholar": "ivuEYlUAAAAJ;;nRrdjtwAAAAJ;", "orcid": ";;;", "linkedin": "siyun-liang-328b53222/;;;", "or_profile": "~Siyun_Liang1;~Huy_H._Nguyen1;~Junichi_Yamagishi1;~Isao_Echizen1", "aff": "Technische Universit\u00e4t M\u00fcnchen;;National Institute of Informatics;", "aff_domain": "tum.de;;nii.ac.jp;", "position": "MS student;;Full Professor;", "bibtex": "@misc{\nliang2024d,\ntitle={3D Morphable Master Face Generation: Towards Controllable Wolf Attacks against 2D and 3D Face Recognition Systems},\nauthor={Siyun Liang and Huy H. 
Nguyen and Junichi Yamagishi and Isao Echizen},\nyear={2024},\nurl={https://openreview.net/forum?id=0P12CqfvUU}\n}", "github": "", "project": "", "reviewers": "Tr8G;ARdD;SgrS;FSLJ", "site": "https://openreview.net/forum?id=0P12CqfvUU", "pdf_size": 11460884, "rating": "3;3;3;5", "confidence": "5;3;4;4", "soundness": "3;2;2;3", "contribution": "2;2;2;2", "presentation": "2;1;3;3", "wc_summary": "37;136;85;33", "wc_strengths": "14;99;66;13", "wc_weaknesses": "248;132;64;33", "wc_questions": "5;83;188;3", "wc_review": "304;450;403;82", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "1290;1109;1462;350", "reply_reviewers": "0;0;0;0", "reply_authors": "2;2;2;1", "rating_avg": [ 3.5, 0.8660254037844386 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.25, 0.82915619758885 ], "wc_summary_avg": [ 72.75, 41.85913878712748 ], "wc_strengths_avg": [ 48.0, 36.42114770294862 ], "wc_weaknesses_avg": [ 119.25, 82.5087116612543 ], "wc_questions_avg": [ 69.75, 75.50951926744071 ], "wc_review_avg": [ 309.75, 141.65870075643076 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 1052.75, 424.49815959553933 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.75, 0.4330127018922193 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:hBCi4MDQwAUJ:scholar.google.com/&scioq=3D+Morphable+Master+Face+Generation:+Towards+Controllable+Wolf+Attacks+against+2D+and+3D+Face+Recognition+Systems&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;1", "aff_unique_norm": "Technische Universit\u00e4t M\u00fcnchen;National Institute of Informatics", "aff_unique_dep": ";", "aff_unique_url": "https://www.tum.de;https://www.nii.ac.jp/", "aff_unique_abbr": "TUM;NII", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1", "aff_country_unique": "Germany;Japan" }, { "id": "0PeEOq5iK8", "title": "DST-Det: Simple Dynamic Self-Training for Open-Vocabulary Object Detection", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Open-vocabulary object detection (OVOD) aims to detect the objects \\textit{beyond} the set of categories observed during training. This work presents a simple yet effective strategy that leverages the zero-shot classification ability of pre-trained vision-language models (VLM), such as CLIP, to classify proposals for all possible novel classes directly. Unlike previous works that ignore novel classes during training and rely solely on the region proposal network (RPN) for novel object detection, our method selectively filters proposals based on specific design criteria. The resulting sets of identified proposals serve as pseudo-labels for novel classes during the training phase. It enables our self-training strategy to improve the recall and accuracy of novel classes in a self-training manner without requiring additional annotations or datasets. We further propose a simple offline pseudo-label generation strategy to refine the object detector. Empirical evaluations on three datasets, including LVIS, V3Det, and COCO, demonstrate significant improvements over the baseline performance without incurring additional parameters or computational costs during inference. 
In particular, compared with previous F-VLM, our method achieves a 1.7-2.0\\% improvement on LVIS dataset and 2.3-3.8\\% improvement on the recent challenging V3Det dataset. Our method also boosts the strong baseline by 6\\% mAP on COCO. The code and models will be publicly available.", "keywords": "open-vocabulary;object detection;self-training", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Shilin Xu;Xiangtai Li;Size Wu;Wenwei Zhang;Yining Li;Guangliang Cheng;Yunhai Tong;Kai Chen;Chen Change Loy", "authorids": "~Shilin_Xu1;~Xiangtai_Li1;~Size_Wu1;~Wenwei_Zhang1;~Yining_Li1;~Guangliang_Cheng2;~Yunhai_Tong1;~Kai_Chen4;~Chen_Change_Loy2", "gender": "M;;M;M;M;M;M;M;M", "homepage": ";;https://wusize.github.io/;https://zhangwenwei.cn;https://liyn.site;https://sites.google.com/view/guangliangcheng;http://www.cis.pku.edu.cn/faculty/system/tongyunhai/tongyunhai.htm;https://chenkai.site/;https://www.mmlab-ntu.com/person/ccloy/index.html", "dblp": "33/4756;;301/9535;;166/3420;;14/1705;181/2839-26;01/5855", "google_scholar": "8bBcL9sAAAAJ;;y2S02IcAAAAJ;QDXADSEAAAAJ;https://scholar.google.com.hk/citations?user=y_cp1sUAAAAJ;FToOC-wAAAAJ;T4gqdPkAAAAJ;https://scholar.google.com.hk/citations?user=eGD0b7IAAAAJ;https://scholar.google.co.uk/citations?user=559LF80AAAAJ", "orcid": ";;;0000-0002-2748-4514;;;;0000-0002-6820-2325;0000-0001-5345-1591", "linkedin": ";;%E6%80%9D%E6%B3%BD-%E5%90%B4-721544198/;wenweizhang-b9769a124/;;;;;", "or_profile": "~Shilin_Xu1;~Xiangtai_Li1;~Size_Wu1;~Wenwei_Zhang1;~Yining_Li1;~Guangliang_Cheng2;~Yunhai_Tong1;~Kai_Chen4;~Chen_Change_Loy2", "aff": "Peking University;;Nanyang Technological University;Shanghai AI Laboratory;Shanghai AI Laboratory;University of Liverpool;Peking University;Shanghai AI Laboratory;Nanyang Technological University", "aff_domain": "pku.edu.cn;;ntu.edu.sg;pjlab.org.cn;pjlab.org.cn;liverpool.ac.uk;pku.edu.cn;pjlab.org.cn;ntu.edu.sg", "position": "PhD student;;PhD student;Researcher;Researcher;Associate Professor;Full Professor;Researcher;Full Professor", "bibtex": "@misc{\nxu2024dstdet,\ntitle={{DST}-Det: Simple Dynamic Self-Training for Open-Vocabulary Object Detection},\nauthor={Shilin Xu and Xiangtai Li and Size Wu and Wenwei Zhang and Yining Li and Guangliang Cheng and Yunhai Tong and Kai Chen and Chen Change Loy},\nyear={2024},\nurl={https://openreview.net/forum?id=0PeEOq5iK8}\n}", "github": "", "project": "", "reviewers": "ht3G;Fu38;Sap3;ULPC;jftV", "site": "https://openreview.net/forum?id=0PeEOq5iK8", "pdf_size": 11566249, "rating": "3;3;3;5;5", "confidence": "4;5;4;3;5", "soundness": "2;3;3;2;3", "contribution": "1;1;2;2;3", "presentation": "3;3;2;3;3", "wc_summary": "49;114;45;76;49", "wc_strengths": "38;19;24;37;84", "wc_weaknesses": "24;147;110;157;147", "wc_questions": "66;46;23;12;217", "wc_review": "177;326;202;282;497", "wc_reply_reviewers": "0;0;0;0;0", "wc_reply_authors": "0;0;0;0;0", "reply_reviewers": "0;0;0;0;0", "reply_authors": "0;0;0;0;0", "rating_avg": [ 3.8, 0.9797958971132712 ], "confidence_avg": [ 4.2, 0.7483314773547882 ], "soundness_avg": [ 2.6, 0.4898979485566356 ], "contribution_avg": [ 1.8, 0.7483314773547883 ], "presentation_avg": [ 2.8, 0.39999999999999997 ], "wc_summary_avg": [ 66.6, 26.157981573508305 ], "wc_strengths_avg": [ 40.4, 23.000869548780106 ], "wc_weaknesses_avg": [ 117.0, 49.189429758841484 ], "wc_questions_avg": [ 72.8, 74.47791618996868 ], "wc_review_avg": [ 296.8, 113.57006647880418 ], "wc_reply_reviewers_avg": 
[ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 9, 0 ], "corr_rating_confidence": -0.21821789023599233, "gs_citation": 15, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6953300397849811721&as_sdt=5,48&sciodt=0,48&hl=en", "gs_version_total": 3, "aff_unique_index": "0;1;2;2;3;0;2;1", "aff_unique_norm": "Peking University;Nanyang Technological University;Shanghai AI Laboratory;University of Liverpool", "aff_unique_dep": ";;;", "aff_unique_url": "http://www.pku.edu.cn;https://www.ntu.edu.sg;https://www.shanghai-ai-lab.com;https://www.liverpool.ac.uk", "aff_unique_abbr": "Peking U;NTU;SAIL;Liv Uni", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;0;0;2;0;0;1", "aff_country_unique": "China;Singapore;United Kingdom" }, { "id": "0Pu0H7y3gg", "title": "Understanding the Initial Condensation of Convolutional Neural Networks", "track": "main", "status": "Reject", "tldr": "", "abstract": "Previous research has shown that fully-connected neural networks with small initialization and gradient-based training methods exhibit a phenomenon known as condensation during training. This phenomenon refers to the input weights of hidden neurons condensing into isolated orientations during training, revealing an implicit bias towards simple solutions in the parameter space. However, the impact of neural network structure on condensation remains unknown. In this study, we study convolutional neural networks (CNNs) as the starting point to explore the distinctions in the condensation behavior compared to fully-connected neural networks. Theoretically, we firstly demonstrate that under gradient descent (GD) and the small initialization scheme, the convolutional kernels of a two-layer CNN condense towards a specific direction determined by the training samples within a given time period. Subsequently, we conduct a series of systematic experiments to substantiate our theory and confirm condensation in more general settings. 
These findings contribute to a preliminary understanding of the non-linear training behavior exhibited by CNNs.", "keywords": "training dynamics;convolutional neural networks;initialization;gradient-based training methods", "primary_area": "learning theory", "supplementary_material": "/attachment/610c4b13cbb73c3247427afd9d40ea264f618317.zip", "author": "Zhangchen Zhou;Hanxu Zhou;Yuqing Li;Zhi-Qin John Xu", "authorids": "~Zhangchen_Zhou1;~Hanxu_Zhou1;~Yuqing_Li3;~Zhi-Qin_John_Xu1", "gender": "M;;M;M", "homepage": ";;https://math.sjtu.edu.cn/Default/faculty/pages/MDAwMDAwMDAwMLKFbqE;https://ins.sjtu.edu.cn/people/xuzhiqin/", "dblp": ";;;223/4493.html", "google_scholar": "qNf_HecAAAAJ;https://scholar.google.com.hk/citations?user=ypD3aL8AAAAJ;https://scholar.google.com.hk/citations?hl=en;EjLvG5cAAAAJ", "orcid": ";;;0000-0002-0122-0879", "linkedin": "https://www.linkedin.cn/incareer/in/%E7%AB%A0%E8%BE%B0-%E5%91%A8-002a0a275;;;", "or_profile": "~Zhangchen_Zhou1;~Hanxu_Zhou1;~Yuqing_Li3;~Zhiqin_Xu1", "aff": "Shanghai Jiaotong University;Shanghai Jiaotong University;Shanghai Jiaotong University;Shanghai Jiaotong University", "aff_domain": "sjtu.edu.cn;sjtu.edu.cn;sjtu.edu.cn;sjtu.edu.cn", "position": "PhD student;PhD student;Postdoc;Associate Professor", "bibtex": "@misc{\nzhou2024understanding,\ntitle={Understanding the Initial Condensation of Convolutional Neural Networks},\nauthor={Zhangchen Zhou and Hanxu Zhou and Yuqing Li and Zhi-Qin John Xu},\nyear={2024},\nurl={https://openreview.net/forum?id=0Pu0H7y3gg}\n}", "github": "", "project": "", "reviewers": "mFgA;FvGf;P4L3", "site": "https://openreview.net/forum?id=0Pu0H7y3gg", "pdf_size": 0, "rating": "3;3;6", "confidence": "2;3;3", "soundness": "2;3;3", "contribution": "2;1;3", "presentation": "1;1;3", "wc_summary": "67;74;18", "wc_strengths": "20;42;68", "wc_weaknesses": "100;431;36", "wc_questions": "63;241;73", "wc_review": "250;788;195", "wc_reply_reviewers": "133;128;0", "wc_reply_authors": "835;2133;184", "reply_reviewers": "1;1;0", "reply_authors": "2;5;1", "rating_avg": [ 4.0, 1.4142135623730951 ], "confidence_avg": [ 2.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.816496580927726 ], "presentation_avg": [ 1.6666666666666667, 0.9428090415820634 ], "wc_summary_avg": [ 53.0, 24.91318258807306 ], "wc_strengths_avg": [ 43.333333333333336, 19.61858529274955 ], "wc_weaknesses_avg": [ 189.0, 173.10305215872614 ], "wc_questions_avg": [ 125.66666666666667, 81.65510122188053 ], "wc_review_avg": [ 411.0, 267.52320771601603 ], "wc_reply_reviewers_avg": [ 87.0, 61.55214591439251 ], "wc_reply_authors_avg": [ 1050.6666666666667, 810.1581464271172 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 2.6666666666666665, 1.699673171197595 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.5, "gs_citation": 7, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14159339468738951420&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "Shanghai Jiao Tong University", "aff_unique_dep": "", "aff_unique_url": "https://www.sjtu.edu.cn", "aff_unique_abbr": "SJTU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "China" }, { "id": "0Q1mBvUgmt", "title": "VIPER: Vibrant Period Representation for Robust and Efficient Time Series Forecasting", "track": "main", "status": "Reject", 
"tldr": "", "abstract": "In a data-driven world teeming with vast volumes of time series data, forecasting models play a pivotal role. The real-world time series data often exhibits intricate periodic patterns and trends, posing challenges for accurate modeling. Existing methods, reliant on fixed parameters and sampling techniques, may struggle to capture these complexities effectively. This paper designs a Vibrant Period Representation Enrichment (VIPER) framework, which effectively and dynamically harnesses the inherent multi-periodic nature of time series data. The VIPER framework adeptly separates the input sequence into trend and seasonal components. A Temporal Aggregation Block is specifically deployed for processing the seasonal component, applying innovative multi-period transformations compounded with global self-attention mechanism. This configuration enables a comprehensive capture of both short-term and long-term period information, culminating in a vibrant period representation true to the essence of the temporal dynamics. Remarkably, experimental results from eight different time series forecasting datasets substantiate the superior performance, simplicity, and computational efficiency of VIPER compared with the state-of-the-arts.", "keywords": "long-term forecasting;deep learning", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/d49b4335ba136b915c9c1481eb598f4c0179bca3.zip", "author": "Guoqi Yu;Muxuan Li;Xiaowei Hu;Angelica I Aviles-Rivero;Shujun Wang", "authorids": "~Guoqi_Yu1;~Muxuan_Li1;~Xiaowei_Hu3;~Angelica_I_Aviles-Rivero1;~Shujun_Wang1", "gender": "M;M;M;F;F", "homepage": "https://github.com/Levi-Ackman;https://cv.transmux.top;https://xw-hu.github.io/;https://angelicaiaviles.wordpress.com/;https://emma-sjwang.github.io/", "dblp": ";;151/5859-1;138/9507;", "google_scholar": "https://scholar.google.com.hk/citations?hl=zh-CN;;tUb4J0kAAAAJ;https://scholar.google.com/citations?hl=en;https://scholar.google.com.hk/citations?user=WFELH6IAAAAJ", "orcid": ";;0000-0002-5708-7018;;0000-0003-1495-3278", "linkedin": ";;;;", "or_profile": "~Guoqi_Yu1;~Muxuan_Li1;~Xiaowei_Hu3;~Angelica_I_Aviles-Rivero1;~Shujun_Wang1", "aff": "University of Electronic Science and Technology of China;University of Electronic Science and Technology of China;Shanghai Artificial Intelligence Laboratory;University of Cambridge;Hong Kong Polytechnic University", "aff_domain": "uestc.edu.cn;uestc.edu.cn;pjlab.org.cn;cam.ac.uk;polyu.edu.hk", "position": "Undergrad student;Undergrad student;Researcher;Senior Research Associate;Assistant Professor", "bibtex": "@misc{\nyu2024viper,\ntitle={{VIPER}: Vibrant Period Representation for Robust and Efficient Time Series Forecasting},\nauthor={Guoqi Yu and Muxuan Li and Xiaowei Hu and Angelica I Aviles-Rivero and Shujun Wang},\nyear={2024},\nurl={https://openreview.net/forum?id=0Q1mBvUgmt}\n}", "github": "", "project": "", "reviewers": "PNtL;juBb;NQNh", "site": "https://openreview.net/forum?id=0Q1mBvUgmt", "pdf_size": 1973289, "rating": "3;3;3", "confidence": "5;4;4", "soundness": "2;2;2", "contribution": "2;2;2", "presentation": "2;2;4", "wc_summary": "22;68;129", "wc_strengths": "18;30;45", "wc_weaknesses": "136;66;155", "wc_questions": "4;123;25", "wc_review": "180;287;354", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 3.0, 0.0 ], "confidence_avg": [ 4.333333333333333, 0.4714045207910317 ], 
"soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.6666666666666665, 0.9428090415820634 ], "wc_summary_avg": [ 73.0, 43.825411197918804 ], "wc_strengths_avg": [ 31.0, 11.045361017187261 ], "wc_weaknesses_avg": [ 119.0, 38.27096375408734 ], "wc_questions_avg": [ 50.666666666666664, 51.86092513208336 ], "wc_review_avg": [ 273.6666666666667, 71.6581390275305 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:IESzvRhCyg8J:scholar.google.com/&scioq=VIPER:+Vibrant+Period+Representation+for+Robust+and+Efficient+Time+Series+Forecasting&hl=en&as_sdt=0,21", "gs_version_total": 0, "aff_unique_index": "0;0;1;2;3", "aff_unique_norm": "University of Electronic Science and Technology of China;Shanghai Artificial Intelligence Laboratory;University of Cambridge;Hong Kong Polytechnic University", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.uestc.edu.cn;http://www.shailab.org/;https://www.cam.ac.uk;https://www.polyu.edu.hk", "aff_unique_abbr": "UESTC;Shanghai AI Lab;Cambridge;PolyU", "aff_campus_unique_index": "1;2", "aff_campus_unique": ";Cambridge;Hong Kong SAR", "aff_country_unique_index": "0;0;0;1;0", "aff_country_unique": "China;United Kingdom" }, { "title": "Inner Classifier-Free Guidance and Its Taylor Expansion for Diffusion Models", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19617", "id": "0QAzIMq32X", "author_site": "Shikun Sun, Longhui Wei, Zhicai Wang, Zixuan Wang, Junliang Xing, Jia Jia, Qi Tian", "tldr": "", "abstract": "Classifier-free guidance (CFG) is a pivotal technique for balancing the diversity and fidelity of samples in conditional diffusion models. This approach involves utilizing a single model to jointly optimize the conditional score predictor and unconditional score predictor, eliminating the need for additional classifiers. It delivers impressive results and can be employed for continuous and discrete condition representations. However, when the condition is continuous, it prompts the question of whether the trade-off can be further enhanced. Our proposed inner classifier-free guidance (ICFG) provides an alternative perspective on the CFG method when the condition has a specific structure, demonstrating that CFG represents a first-order case of ICFG. 
Additionally, we offer a second-order implementation, highlighting that even without altering the training policy, our second-order approach can introduce new valuable information and achieve an improved balance between fidelity and diversity for Stable Diffusion.", "keywords": "diffusion models;classifier-free guidance", "primary_area": "generative models", "supplementary_material": "/attachment/4f440ab4467b49465a78bf5306a0243866f9c038.zip", "author": "Shikun Sun;Longhui Wei;Zhicai Wang;Zixuan Wang;Junliang Xing;Jia Jia;Qi Tian", "authorids": "~Shikun_Sun1;~Longhui_Wei1;~Zhicai_Wang1;~Zixuan_Wang3;~Junliang_Xing1;~Jia_Jia1;~Qi_Tian3", "gender": "M;M;M;M;M;F;M", "homepage": "https://skipper17.github.io;https://joinwei-pku.github.io/longhuiwei.github.io/;;http://hcsi.cs.tsinghua.edu.cn;http://people.ucas.ac.cn/~jlxing?language=en;https://hcsi.cs.tsinghua.edu.cn/;https://www.qitian1987.com/index.html", "dblp": "293/2733.html;206/6179;250/1975;05/10698;43/7659.html;71/2992-1.html;78/1467-1.html", "google_scholar": "C1YFRxAAAAAJ;thhnAhIAAAAJ;https://scholar.google.com/citations?hl=zh-CN;4JKwZRsAAAAJ;jSwNd3MAAAAJ;RYhh3FsAAAAJ;https://scholar.google.com/citations?hl=en", "orcid": ";;;0000-0001-7291-6198;0000-0001-6801-0510;;0000-0002-7252-5047", "linkedin": ";;;https://www.linkedin.cn/injobs/in/\u5b50\u8f69-\u738b-b214ba228;https://www.linkedin.cn/incareer/in/ACoAAAvlU14B40ZWH1pxg5JJDtQ6LlgMYkp0e5s;;", "or_profile": "~Shikun_Sun1;~Longhui_Wei1;~Zhicai_Wang1;~Zixuan_Wang3;~Junliang_Xing1;~Jia_Jia1;~Qi_Tian3", "aff": "Tsinghua University;Huawei Technologies Ltd.;University of Science and Technology of China;Tsinghua University;Tsinghua University;Tsinghua University;Huawei Technologies Ltd.", "aff_domain": "tsinghua.edu.cn;huawei.com;ustc.edu.cn;tsinghua.edu.cn;tsinghua.edu.cn;tsinghua.edu.cn;huawei.com", "position": "PhD student;Researcher;PhD student;PhD student;Full Professor;Full Professor;Principal Researcher", "bibtex": "@inproceedings{\nsun2024inner,\ntitle={Inner Classifier-Free Guidance and Its Taylor Expansion for Diffusion Models},\nauthor={Shikun Sun and Longhui Wei and Zhicai Wang and Zixuan Wang and Junliang Xing and Jia Jia and Qi Tian},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=0QAzIMq32X}\n}", "github": "", "project": "", "reviewers": "UdAr;cPdv;jYKn;LfUU", "pdf_size": 1821720, "rating": "5;5;6;8", "confidence": "4;3;4;3", "soundness": "1;3;2;4", "contribution": "2;2;2;3", "presentation": "2;2;2;4", "wc_summary": "59;59;66;34", "wc_strengths": "27;50;22;63", "wc_weaknesses": "267;165;102;226", "wc_questions": "8;40;71;11", "wc_review": "361;314;261;334", "wc_reply_reviewers": "213;338;25;354", "wc_reply_authors": "1798;2100;730;1419", "reply_reviewers": "3;2;1;2", "reply_authors": "6;6;3;3", "rating_avg": [ 6.0, 1.224744871391589 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.5, 1.118033988749895 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.5, 0.8660254037844386 ], "wc_summary_avg": [ 54.5, 12.175795661885921 ], "wc_strengths_avg": [ 40.5, 16.740669042783207 ], "wc_weaknesses_avg": [ 190.0, 62.437969217456136 ], "wc_questions_avg": [ 32.5, 25.5 ], "wc_review_avg": [ 317.5, 36.63673020344474 ], "wc_reply_reviewers_avg": [ 232.5, 131.65200340291065 ], "wc_reply_authors_avg": [ 1511.75, 511.7892022112229 ], "reply_reviewers_avg": [ 2.0, 0.7071067811865476 ], "reply_authors_avg": [ 4.5, 1.5 ], "replies_avg": [ 33, 0 ], "authors#_avg": [ 7, 0 ], 
"corr_rating_confidence": -0.40824829046386296, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=3080187669946390848&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=0QAzIMq32X", "pdf": "https://openreview.net/pdf?id=0QAzIMq32X", "email": "tsinghua.edu.cn;huawei.com;ustc.edu.cn;tsinghua.edu.cn;tsinghua.edu.cn;tsinghua.edu.cn;huawei.com", "author_num": 7, "aff_unique_index": "0;1;2;0;0;0;1", "aff_unique_norm": "Tsinghua University;Huawei;University of Science and Technology of China", "aff_unique_dep": ";Huawei Technologies;", "aff_unique_url": "https://www.tsinghua.edu.cn;https://www.huawei.com;http://www.ustc.edu.cn", "aff_unique_abbr": "THU;Huawei;USTC", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0;0", "aff_country_unique": "China" }, { "id": "0Qyxw0cCuu", "title": "CONTROL: A Contrastive Learning Framework for Open World Semi-Supervised Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "In recent years, open-world semi-supervised Learning has received tremendous attention. This is largely due to the fact that unlabeled real-world data often encompasses unseen classes -- those that are not represented in labeled datasets. Such classes can adversely affect the performance of traditional semi-supervised learning methods. The open-world semi-supervised learning algorithms are designed to enable models to distinguish between both seen and unseen classes. However, existing algorithms still suffer from the problem of insufficient classification of unseen classes and may face the risk of representation collapse. In order to better address the aforementioned issues, we propose a contrastive learning framework called CONTROL that integrates three optimization objectives: nearest neighbor contrastive learning, supervised contrastive learning, and unsupervised contrastive learning. The significance of the framework is explained by theoretically proving the optimization of contrastive learning at the feature level benefits unseen classification, and the uniformity mechanism in contrastive learning further helps to prevent representation collapse. Serving as a unified and efficient framework, CONTROL is compatible with a broad range of existing open-world semi-supervised learning algorithms. Through empirical studies, we highlight the superiority of CONTROL over prevailing state-of-the-art open-world semi-supervised learning algorithms. 
Remarkably, our method achieves significant improvement in both unseen class classification and all class classification over previous methods on both CIFAR and ImageNet datasets.", "keywords": "Contrastive Learning; Semi-Supervised Learning", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Jingyi Cui;Yi-Ge Zhang;Yisen Wang", "authorids": "~Jingyi_Cui1;~Yi-Ge_Zhang1;~Yisen_Wang1", "gender": "F;M;M", "homepage": "https://zero-lab-pku.github.io/personwise/cuijingyi/;https://www.lamda.nju.edu.cn/zhangyg/;https://yisenwang.github.io/", "dblp": "216/3282;346/0977;172/1346-1", "google_scholar": ";;uMWPDboAAAAJ", "orcid": ";;", "linkedin": ";;", "or_profile": "~Jingyi_Cui1;~Yi-Ge_Zhang1;~Yisen_Wang1", "aff": "Peking University;Nanjing University;Peking University", "aff_domain": "pku.edu.cn;nju.edu.cn;pku.edu.cn", "position": "PhD student;MS student;Assistant Professor", "bibtex": "@misc{\ncui2024control,\ntitle={{CONTROL}: A Contrastive Learning Framework for Open World Semi-Supervised Learning},\nauthor={Jingyi Cui and Yi-Ge Zhang and Yisen Wang},\nyear={2024},\nurl={https://openreview.net/forum?id=0Qyxw0cCuu}\n}", "github": "", "project": "", "reviewers": "mngU;fiFv;1Kmz;1XMG", "site": "https://openreview.net/forum?id=0Qyxw0cCuu", "pdf_size": 958055, "rating": "5;5;5;5", "confidence": "4;4;4;2", "soundness": "1;1;3;2", "contribution": "1;1;3;3", "presentation": "1;2;2;2", "wc_summary": "30;67;121;53", "wc_strengths": "20;20;124;33", "wc_weaknesses": "544;172;343;109", "wc_questions": "34;16;117;97", "wc_review": "628;275;705;292", "wc_reply_reviewers": "120;70;0;0", "wc_reply_authors": "832;553;286;430", "reply_reviewers": "1;1;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 5.0, 0.0 ], "confidence_avg": [ 3.5, 0.8660254037844386 ], "soundness_avg": [ 1.75, 0.82915619758885 ], "contribution_avg": [ 2.0, 1.0 ], "presentation_avg": [ 1.75, 0.4330127018922193 ], "wc_summary_avg": [ 67.75, 33.46173187388842 ], "wc_strengths_avg": [ 49.25, 43.48203652084387 ], "wc_weaknesses_avg": [ 292.0, 168.8149874863011 ], "wc_questions_avg": [ 66.0, 42.089191011469914 ], "wc_review_avg": [ 475.0, 193.51873294335098 ], "wc_reply_reviewers_avg": [ 47.5, 50.68283733178323 ], "wc_reply_authors_avg": [ 525.25, 200.73536683903015 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:7liTmUjPLd8J:scholar.google.com/&scioq=CONTROL:+A+Contrastive+Learning+Framework+for+Open+World+Semi-Supervised+Learning&hl=en&as_sdt=0,10", "gs_version_total": 0, "aff_unique_index": "0;1;0", "aff_unique_norm": "Peking University;Nanjing University", "aff_unique_dep": ";", "aff_unique_url": "http://www.pku.edu.cn;https://www.nju.edu.cn", "aff_unique_abbr": "Peking U;Nanjing U", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "China" }, { "id": "0S0CgZEYxR", "title": "Examining the Achilles' Heel of CLIP Models: The Worst-Performing Categories", "track": "main", "status": "Reject", "tldr": "", "abstract": "Contrastive Language-Image Pre-training (CLIP) provides a foundation model by integrating natural language into visual concepts. 
Although previous studies have demonstrated that satisfactory overall accuracy can be achieved across numerous downstream tasks through well-designed textual prompts, this evaluation mechanism inevitably overlooks certain categories because the impact of some underperforming categories on overall performance remains limited, even if they are highly important. For example, on ImageNet, there are a total of 10 categories with class-wise accuracy as low as 0\\%, which is significantly inferior to the overall performance of 64.1\\%. This phenomenon reveals the potential risks of using CLIP models, especially in risk-sensitive applications. To address this issue, we investigate the alignment between the two modalities in the CLIP model and propose the Class-wise Matching Margin (\\cmm) to measure the inference confusion. \\cmm\\ can effectively identify the worst-performing categories and estimate the potential performance of the candidate prompts. We further query large language models to enrich descriptions of worst-performing categories and build a weighted ensemble to highlight the efficient prompts. Experimental results clearly verify the effectiveness of our proposal, where the accuracy on the worst-10 categories on ImageNet is boosted to 5.2\\%, without manual prompt engineering, laborious optimization, or access to labeled validation data.", "keywords": "vision-language models;worst-class performance;CLIP;prompt ensemble;zero-shot recognition", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/3c17115070f3450c754a665a6f0a558b9b714aee.zip", "author": "Jie-Jing Shao;Jiang-Xin Shi;Xiao-Wen Yang;Lan-Zhe Guo;Yu-Feng Li", "authorids": "~Jie-Jing_Shao1;~Jiang-Xin_Shi1;~Xiao-Wen_Yang4;~Lan-Zhe_Guo2;~Yu-Feng_Li1", "gender": "M;;M;M;M", "homepage": "http://www.lamda.nju.edu.cn/shaojj/;http://www.lamda.nju.edu.cn/shijx;http://www.lamda.nju.edu.cn/guolz;https://www.lamda.nju.edu.cn/yangxw;https://cs.nju.edu.cn/liyf/index.htm", "dblp": "299/4982;299/5485.html;216/4845;165/2864.html;57/413", "google_scholar": "k1tEDpQAAAAJ;KEgtGncAAAAJ;dpunvqgAAAAJ;;https://scholar.google.com/citations?hl=en", "orcid": "0000-0001-8107-114X;0000-0002-0318-0911;;0009-0007-4206-6242;0000-0002-2220-5248", "linkedin": ";;;;", "or_profile": "~Jie-Jing_Shao1;~Jiang-Xin_Shi1;~Lan-Zhe_Guo2;~Xiao-wen_Yang3;~Yu-feng_Li2", "aff": "Nanjing University;Nanjing University;Nanjing University;Nanjing University;Nanjing University", "aff_domain": "nju.edu.cn;nju.edu.cn;nju.edu.cn;nju.edu.cn;nju.edu.cn", "position": "PhD student;PhD student;Assistant Professor;PhD student;Assistant Professor", "bibtex": "@misc{\nshao2024examining,\ntitle={Examining the Achilles' Heel of {CLIP} Models: The Worst-Performing Categories},\nauthor={Jie-Jing Shao and Jiang-Xin Shi and Xiao-Wen Yang and Lan-Zhe Guo and Yu-Feng Li},\nyear={2024},\nurl={https://openreview.net/forum?id=0S0CgZEYxR}\n}", "github": "", "project": "", "reviewers": "7ik6;PArF;RDxr", "site": "https://openreview.net/forum?id=0S0CgZEYxR", "pdf_size": 8617562, "rating": "3;5;5", "confidence": "5;4;4", "soundness": "1;3;2", "contribution": "1;3;2", "presentation": "2;3;3", "wc_summary": "85;45;103", "wc_strengths": "10;26;29", "wc_weaknesses": "184;120;63", "wc_questions": "3;24;19", "wc_review": "282;215;214", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 4.333333333333333, 0.9428090415820634 ], "confidence_avg": 
[ 4.333333333333333, 0.4714045207910317 ], "soundness_avg": [ 2.0, 0.816496580927726 ], "contribution_avg": [ 2.0, 0.816496580927726 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 77.66666666666667, 24.239545283597124 ], "wc_strengths_avg": [ 21.666666666666668, 8.339997335464536 ], "wc_weaknesses_avg": [ 122.33333333333333, 49.42558941367203 ], "wc_questions_avg": [ 15.333333333333334, 8.9566858950296 ], "wc_review_avg": [ 237.0, 31.822423959633664 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.9999999999999997, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:dBXEmwtk1joJ:scholar.google.com/&scioq=Examining+the+Achilles%27+Heel+of+CLIP+Models:+The+Worst-Performing+Categories&hl=en&as_sdt=0,44", "gs_version_total": 0, "aff_unique_index": "0;0;0;0;0", "aff_unique_norm": "Nanjing University", "aff_unique_dep": "", "aff_unique_url": "https://www.nju.edu.cn", "aff_unique_abbr": "Nanjing U", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "China" }, { "id": "0SOhDO7xI0", "title": "DeepDRK: Deep Dependency Regularized Knockoff for Feature Selection", "track": "main", "status": "Reject", "tldr": "", "abstract": "Model-X knockoff, among various feature selection methods, received much attention recently due to its guarantee on false discovery rate (FDR) control. Subsequent to its introduction in parametric design, knockoff is advanced to handle arbitrary data distributions using deep learning-based generative modeling. However, we observed that current implementations of the deep Model-X knockoff framework exhibit limitations. Notably, the \"swap property\" that knockoffs necessitate frequently encounter challenges on sample level, leading to a diminished selection power. To overcome, we develop \"Deep Dependency Regularized Knockoff (DeepDRK)\", a distribution-free deep learning method that strikes a balance between FDR and power. In DeepDRK, a generative model grounded in a transformer architecture is introduced to better achieve the \"swap property\". Novel efficient regularization techniques are also proposed to reach higher power. 
Our model outperforms other benchmarks in synthetic, semi-synthetic, and real-world data, especially when sample size is small and data distribution is complex.", "keywords": "Feature Selection;Deep Learning;Model-X Knockoff;FDR Control", "primary_area": "generative models", "supplementary_material": "", "author": "Hongyu Shen;Yici Yan;Zhizhen Zhao", "authorids": "~Hongyu_Shen1;~Yici_Yan1;~Zhizhen_Zhao1", "gender": "M;M;", "homepage": ";;", "dblp": "35/7565;;122/3155", "google_scholar": "CVCKr-EAAAAJ;;", "orcid": ";;", "linkedin": "hongyu-shen-61943267/;yici-yan-418b36117;", "or_profile": "~Hongyu_Shen1;~Yici_Yan1;~Zhizhen_Zhao1", "aff": "University of Illinois, Urbana Champaign;University of Illinois, Urbana Champaign;University of Washington", "aff_domain": "illinois.edu;illinois.edu;uw.edu", "position": "PhD student;PhD student;Associate Professor", "bibtex": "@misc{\nshen2024deepdrk,\ntitle={Deep{DRK}: Deep Dependency Regularized Knockoff for Feature Selection},\nauthor={Hongyu Shen and Yici Yan and Zhizhen Zhao},\nyear={2024},\nurl={https://openreview.net/forum?id=0SOhDO7xI0}\n}", "github": "", "project": "", "reviewers": "CLhf;Zneh;cU77;e4Vy", "site": "https://openreview.net/forum?id=0SOhDO7xI0", "pdf_size": 847574, "rating": "5;6;6;6", "confidence": "2;2;3;2", "soundness": "3;3;3;3", "contribution": "3;2;3;3", "presentation": "3;2;3;3", "wc_summary": "70;78;34;76", "wc_strengths": "49;28;41;69", "wc_weaknesses": "194;148;150;9", "wc_questions": "34;19;35;27", "wc_review": "347;273;260;181", "wc_reply_reviewers": "0;0;0;23", "wc_reply_authors": "1202;1084;830;30", "reply_reviewers": "0;0;0;1", "reply_authors": "3;3;2;1", "rating_avg": [ 5.75, 0.4330127018922193 ], "confidence_avg": [ 2.25, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 64.5, 17.853571071357123 ], "wc_strengths_avg": [ 46.75, 14.872373717735847 ], "wc_weaknesses_avg": [ 125.25, 69.589420891397 ], "wc_questions_avg": [ 28.75, 6.417748826496718 ], "wc_review_avg": [ 265.25, 58.88282856656939 ], "wc_reply_reviewers_avg": [ 5.75, 9.959292143521045 ], "wc_reply_authors_avg": [ 786.5, 456.98222066071673 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 2.25, 0.82915619758885 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.3333333333333333, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5293816254708543531&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 6, "aff_unique_index": "0;0;1", "aff_unique_norm": "University of Illinois Urbana-Champaign;University of Washington", "aff_unique_dep": ";", "aff_unique_url": "https://illinois.edu;https://www.washington.edu", "aff_unique_abbr": "UIUC;UW", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Urbana-Champaign;", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "0SSiZ5vYO8", "title": "Multi-Prompt Denoised Self-Training for Open-Vocabulary Model Adaptation", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Traditional model adaptation assumes the same vocabulary across source and target domains, which often struggles with limited transfer flexibility and efficiency while handling target domains with different vocabularies. 
Inspired by recent vision-language models (VLMs) that enable open-vocabulary visual recognition by reasoning on both images and texts, we study open-vocabulary model adaptation (OVMA), a new unsupervised model adaptation framework that positions a pre-trained VLM as the source model and transfers it towards arbitrary unlabelled target domains. To this end, we design a Multi-prompt denOised Self-Training (MOST) technique that exploits the synergy between vision and language to mitigate the domain discrepancies in image and text distributions simultaneously. Specifically, MOST makes use of the complementary property of multiple prompts within and across vision and language modalities, which enables joint exploitation of vision and language information and effective learning of image-text correspondences in the unlabelled target domains. Additionally, MOST captures temporal information via multi-temporal prompt learning which helps memorize previously learnt target information. Extensive experiments show that MOST outperforms the state-of-the-art consistently across 11 image recognition tasks. Codes will be released", "keywords": "vision language models;model adaptation;transductive transfer learning", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "", "author": "Jiaxing Huang;Jingyi Zhang;Han Qiu;Sheng Jin;Lewei Lu;Shijian Lu", "authorids": "~Jiaxing_Huang2;~Jingyi_Zhang7;~Han_Qiu2;~Sheng_Jin3;~Lewei_Lu1;~Shijian_Lu1", "gender": "M;M;M;M;M;F", "homepage": "https://jxhuang0508.github.io/;https://qhqk.github.io/hanqiu.github.io/;;;https://personal.ntu.edu.sg/shijian.lu/;", "dblp": "62/6016-1.html;;70/6780-2;247/6438;42/2718;15/91-5", "google_scholar": "czirNcwAAAAJ;YThp3g8AAAAJ;https://scholar.google.com/citations?view_op=list_works;https://scholar.google.com.hk/citations?user=zdgKJXIAAAAJ;https://scholar.google.com.sg/scholar?hl=en;https://scholar.google.com/citations?hl=en", "orcid": ";;0000-0001-7254-1664;;;", "linkedin": ";;;lewei-lu-94015977/;;jingyi-zhang-6510871b0/", "or_profile": "~Jiaxing_Huang2;~Han_Qiu2;~Sheng_Jin3;~Lewei_Lu1;~Shijian_Lu1;~JINGYI_ZHANG4", "aff": "Nanyang Technological University;Nanyang Technological University;Nanyang Technological University;SenseTime;Nanyang Technological University;Nanyang Technological University", "aff_domain": "ntu.edu.sg;ntu.edu.sg;ntu.edu.sg;sensetime.com;ntu.edu.sg;ntu.edu.sg", "position": "Postdoc;PhD student;Postdoc;Researcher;Associate Professor;PhD student", "bibtex": "@misc{\nhuang2024multiprompt,\ntitle={Multi-Prompt Denoised Self-Training for Open-Vocabulary Model Adaptation},\nauthor={Jiaxing Huang and Jingyi Zhang and Han Qiu and Sheng Jin and Lewei Lu and Shijian Lu},\nyear={2024},\nurl={https://openreview.net/forum?id=0SSiZ5vYO8}\n}", "github": "", "project": "", "reviewers": "Zzqn;5Vkc;vh13;yo5V", "site": "https://openreview.net/forum?id=0SSiZ5vYO8", "pdf_size": 6765376, "rating": "5;5;5;6", "confidence": "4;5;5;3", "soundness": "3;3;2;3", "contribution": "2;3;2;3", "presentation": "3;3;2;3", "wc_summary": "61;81;265;65", "wc_strengths": "33;92;23;79", "wc_weaknesses": "131;317;16;267", "wc_questions": "53;98;2;61", "wc_review": "278;588;306;472", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 5.25, 0.4330127018922193 ], "confidence_avg": [ 4.25, 0.82915619758885 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.75, 
0.4330127018922193 ], "wc_summary_avg": [ 118.0, 85.19976525789258 ], "wc_strengths_avg": [ 56.75, 29.328953271468794 ], "wc_weaknesses_avg": [ 182.75, 117.90329723972947 ], "wc_questions_avg": [ 53.5, 34.23813663153998 ], "wc_review_avg": [ 411.0, 126.25767303415662 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.8703882797784891, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:-BhvtsjAY5QJ:scholar.google.com/&scioq=Multi-Prompt+Denoised+Self-Training+for+Open-Vocabulary+Model+Adaptation&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;0;0;1;0;0", "aff_unique_norm": "Nanyang Technological University;SenseTime", "aff_unique_dep": ";", "aff_unique_url": "https://www.ntu.edu.sg;https://www.sensetime.com", "aff_unique_abbr": "NTU;SenseTime", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;1;0;0", "aff_country_unique": "Singapore;China" }, { "id": "0SgPbbyrWh", "title": "Optimal spherical codes for locality-sensitive hashing", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "In the realm of Locality-Sensitive Hashing (LSH), striking the right balance between computational efficiency and accuracy has been a persistent challenge. Most existing unsupervised methods rely on dense representations, which can lead to inefficiencies. To tackle this, we advocate for the adoption of sparse representations and introduce the use of quasi-Optimal Spherical Codes (OSCs) to minimise space distortion. OSCs strive to maximise the minimum angle between any pair of points on the hypersphere, ensuring that the relative angular information between data points is preserved in the representation, which is particularly valuable in tasks involving cosine similarity. We employ Adam-based optimisation to obtain these codes and use them to partition the space into a $k^\\text{th}$-order Voronoi diagram. 
This approach consistently outperforms existing methods across four datasets on $K$-nearest neighbors search with cosine similarity, while capping the query time for a given embedding size.", "keywords": "Optimal spherical codes;locality sensitive hashing;similarity search;sparse coding", "primary_area": "metric learning, kernel learning, and sparse coding", "supplementary_material": "/attachment/cac03604aac528266d8d2b827d896c6871ceaf33.pdf", "author": "Rana Alkhoury Maroun;Henry Gouk;Yihe Lu;Barbara Webb", "authorids": "~Rana_Alkhoury_Maroun1;~Henry_Gouk1;~Yihe_Lu1;~Barbara_Webb1", "gender": ";M;M;", "homepage": ";https://www.henrygouk.com;;", "dblp": ";172/0943;181/4875-1;", "google_scholar": ";https://scholar.google.co.nz/citations?user=i1bzlyAAAAAJ;22zfD-gAAAAJ;https://scholar.google.com/scholar?hl=en", "orcid": " 0000-0003-4454-5320;;0000-0002-1615-4915;", "linkedin": ";;yihe-lu-5ba52856/?originalSubdomain=uk;", "or_profile": "~Rana_Alkhoury_Maroun1;~Henry_Gouk1;~Yihe_Lu1;~Barbara_Webb1", "aff": "University of Edinburgh, University of Edinburgh;University of Edinburgh;University of Edinburgh;University of Edinburgh", "aff_domain": "ed.ac.uk;ed.ac.uk;ed.ac.uk;ed.ac.uk", "position": "PhD student;RAEng Research Fellow;Postdoc;Full Professor", "bibtex": "@misc{\nmaroun2024optimal,\ntitle={Optimal spherical codes for locality-sensitive hashing},\nauthor={Rana Alkhoury Maroun and Henry Gouk and Yihe Lu and Barbara Webb},\nyear={2024},\nurl={https://openreview.net/forum?id=0SgPbbyrWh}\n}", "github": "", "project": "", "reviewers": "RRUE;KUjb;88TD;d26L", "site": "https://openreview.net/forum?id=0SgPbbyrWh", "pdf_size": 3883, "rating": "1;3;3;3", "confidence": "5;4;4;3", "soundness": "1;2;3;2", "contribution": "1;3;2;2", "presentation": "2;1;1;2", "wc_summary": "39;55;93;80", "wc_strengths": "16;17;91;23", "wc_weaknesses": "497;13;327;74", "wc_questions": "14;26;93;37", "wc_review": "566;111;604;214", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 2.5, 0.8660254037844386 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.0, 0.7071067811865476 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 1.5, 0.5 ], "wc_summary_avg": [ 66.75, 21.05201890555868 ], "wc_strengths_avg": [ 36.75, 31.43544973433655 ], "wc_weaknesses_avg": [ 227.75, 195.00176281254485 ], "wc_questions_avg": [ 42.5, 30.26962173533062 ], "wc_review_avg": [ 373.75, 214.78637643016376 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.816496580927726, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:NE_wzqmTiMwJ:scholar.google.com/&scioq=Optimal+spherical+codes+for+locality-sensitive+hashing&hl=en&as_sdt=0,14", "gs_version_total": 0, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "University of Edinburgh", "aff_unique_dep": "", "aff_unique_url": "https://www.ed.ac.uk", "aff_unique_abbr": "Edinburgh", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United Kingdom" }, { "id": "0TZs6WOs16", "title": "Hyperbolic Embeddings in Sequential Self-Attention for Improved Next-Item Recommendations", "track": "main", "status": "Reject", "tldr": "", "abstract": "In recent years, self-attentive sequential learning models have surpassed 
conventional collaborative filtering techniques in next-item recommendation tasks. However, Euclidean geometry utilized in these models may not be optimal for capturing a complex structure of the behavioral data. Building on recent advances in the application of hyperbolic geometry to collaborative filtering tasks, we propose a novel approach that leverages hyperbolic geometry in the sequential learning setting. Our approach involves transitioning the learned parameters to a Poincar\\'e ball, which enables a linear predictor in a non-linear space. Our experimental results demonstrate that under certain conditions hyperbolic models may simultaneously improve recommendation quality and gain representational capacity. We identify several determining factors that affect the results, which include the ability of a loss function to preserve hyperbolic structure and the general compatibility of data with hyperbolic geometry. For the latter, we propose an empirical approach based on Gromov delta-hyperbolicity estimation that allows categorizing datasets as either compatible or not.", "keywords": "recommender systems;sequential self-attention;hyperbolic geometry;Gromov product", "primary_area": "learning on graphs and other geometries & topologies", "supplementary_material": "", "author": "Evgeny Frolov;Lina Bashaeva;Leyla Mirvakhabova;Ivan Oseledets", "authorids": "~Evgeny_Frolov1;~Lina_Bashaeva1;~Leyla_Mirvakhabova2;~Ivan_Oseledets1", "gender": "M;F;;M", "homepage": ";;;http://oseledets.github.io", "dblp": ";;;56/7175", "google_scholar": "https://scholar.google.ru/citations?user=l6cMdUEAAAAJ;;;https://scholar.google.ru/citations?user=5kMqBQEAAAAJ", "orcid": "0000-0003-3679-5311;;;", "linkedin": "evgenyfrolov/;lina-bashaeva/;;", "or_profile": "~Evgeny_Frolov1;~Lina_Bashaeva1;~Leyla_Mirvakhabova2;~Ivan_Oseledets1", "aff": "Skolkovo Institute of Science and Technology;;;Institute of Numerical Mathematics", "aff_domain": "skoltech.ru;;;inm.ras.ru", "position": "Researcher;;;Researcher", "bibtex": "@misc{\nfrolov2024hyperbolic,\ntitle={Hyperbolic Embeddings in Sequential Self-Attention for Improved Next-Item Recommendations},\nauthor={Evgeny Frolov and Lina Bashaeva and Leyla Mirvakhabova and Ivan Oseledets},\nyear={2024},\nurl={https://openreview.net/forum?id=0TZs6WOs16}\n}", "github": "", "project": "", "reviewers": "WdM2;9PVb;vqza;hnY1", "site": "https://openreview.net/forum?id=0TZs6WOs16", "pdf_size": 1089586, "rating": "3;3;3;5", "confidence": "5;4;5;3", "soundness": "3;2;2;3", "contribution": "2;1;2;3", "presentation": "3;2;2;3", "wc_summary": "36;56;48;107", "wc_strengths": "26;68;65;48", "wc_weaknesses": "166;254;308;63", "wc_questions": "5;4;7;6", "wc_review": "233;382;428;224", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "1682;1808;2035;844", "reply_reviewers": "0;0;0;0", "reply_authors": "3;3;4;2", "rating_avg": [ 3.5, 0.8660254037844386 ], "confidence_avg": [ 4.25, 0.82915619758885 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 61.75, 27.07743525520835 ], "wc_strengths_avg": [ 51.75, 16.708904811506947 ], "wc_weaknesses_avg": [ 197.75, 92.85035002626539 ], "wc_questions_avg": [ 5.5, 1.118033988749895 ], "wc_review_avg": [ 316.75, 89.79246906060663 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 1592.25, 450.14129726120444 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 3.0, 0.7071067811865476 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 4, 0 ], 
"corr_rating_confidence": -0.8703882797784891, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:pyxtiaLGQ6AJ:scholar.google.com/&scioq=Hyperbolic+Embeddings+in+Sequential+Self-Attention+for+Improved+Next-Item+Recommendations&hl=en&as_sdt=0,11", "gs_version_total": 0, "aff_unique_index": "0;1", "aff_unique_norm": "Skolkovo Institute of Science and Technology;Institute of Numerical Mathematics", "aff_unique_dep": ";", "aff_unique_url": "https://www.skoltech.ru;", "aff_unique_abbr": "Skoltech;", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0", "aff_country_unique": "Russian Federation;" }, { "id": "0V311Uh8q1", "title": "Algorithmic Stability Unleashed: Generalization Bounds with Unbounded Losses", "track": "main", "status": "Reject", "tldr": "", "abstract": "One of the central problems of statistical learning theory is quantifying the generalization ability of learning algorithms within a probabilistic framework. Algorithmic stability is a powerful tool for deriving generalization bounds, however, it typically builds on a critical assumption that losses are bounded. In this paper, we relax this condition to unbounded loss functions with subweibull diameter. This gives new generalization bound for algorithmic stability and also includes existing results of subgaussian and subexponential diameters as specific cases. Our main probabilistic result is a general concentration inequality for subweibull random variables, which may be of independent interest.", "keywords": "algorithmic stability; generalization bound", "primary_area": "learning theory", "supplementary_material": "/attachment/49261c5dd8086a8c2eb6339570401c6dfe49287b.pdf", "author": "Shaojie Li;Bowei Zhu;Yong Liu", "authorids": "~Shaojie_Li2;~Bowei_Zhu1;~Yong_Liu7", "gender": "M;;M", "homepage": ";;https://iie-liuyong.github.io", "dblp": ";304/1543;29/4867-18", "google_scholar": ";;vVhmzbAAAAAJ", "orcid": ";;0000-0002-6739-621X", "linkedin": ";;", "or_profile": "~Shaojie_Li2;~Bowei_Zhu1;~Yong_Liu7", "aff": "Renmin University of China;Renmin University of China;Renmin University of China", "aff_domain": "ruc.edu.cn;ruc.edu.cn;ruc.edu.cn", "position": "PhD student;PhD student;Associate Professor", "bibtex": "@misc{\nli2024algorithmic,\ntitle={Algorithmic Stability Unleashed: Generalization Bounds with Unbounded Losses},\nauthor={Shaojie Li and Bowei Zhu and Yong Liu},\nyear={2024},\nurl={https://openreview.net/forum?id=0V311Uh8q1}\n}", "github": "", "project": "", "reviewers": "K21p;wVug;wNWA;LoHq", "site": "https://openreview.net/forum?id=0V311Uh8q1", "pdf_size": 247036, "rating": "3;5;5;6", "confidence": "3;4;3;5", "soundness": "2;2;3;3", "contribution": "2;2;2;2", "presentation": "1;3;2;4", "wc_summary": "84;85;161;373", "wc_strengths": "35;38;35;13", "wc_weaknesses": "181;178;44;9", "wc_questions": "67;153;302;14", "wc_review": "367;454;542;409", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "1030;1431;985;678", "reply_reviewers": "0;0;0;0", "reply_authors": "2;2;2;1", "rating_avg": [ 4.75, 1.0897247358851685 ], "confidence_avg": [ 3.75, 0.82915619758885 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.5, 1.118033988749895 ], "wc_summary_avg": [ 175.75, 118.08762636279891 ], "wc_strengths_avg": [ 30.25, 10.034316120194738 ], "wc_weaknesses_avg": [ 103.0, 77.50161288644256 ], "wc_questions_avg": [ 134.0, 108.94264546081116 ], "wc_review_avg": [ 443.0, 64.91147818375421 ], "wc_reply_reviewers_avg": [ 0, 0 ], 
"wc_reply_authors_avg": [ 1031.0, 267.7340097933021 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.75, 0.4330127018922193 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.7608859102526822, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=3002706169684833497&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 6, "aff_unique_index": "0;0;0", "aff_unique_norm": "Renmin University of China", "aff_unique_dep": "", "aff_unique_url": "http://www.ruc.edu.cn", "aff_unique_abbr": "RUC", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "China" }, { "title": "Q-Bench: A Benchmark for General-Purpose Foundation Models on Low-level Vision", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19616", "id": "0V5TVt9bk0", "author_site": "Haoning Wu, Zicheng Zhang, Erli Zhang, Chaofeng Chen, Liang Liao, Annan Wang, Chunyi Li, Wenxiu Sun, Qiong Yan, Guangtao Zhai, Weisi Lin", "tldr": "", "abstract": "The rapid evolution of Multi-modality Large Language Models (MLLMs) has catalyzed a shift in computer vision from specialized models to general-purpose foundation models. Nevertheless, there is still an inadequacy in assessing the abilities of MLLMs on **low-level visual perception and understanding**. To address this gap, we present **Q-Bench**, a holistic benchmark crafted to systematically evaluate potential abilities of MLLMs on three realms: low-level visual perception, low-level visual description, and overall visual quality assessment. **_a)_** To evaluate the low-level **_perception_** ability, we construct the **LLVisionQA** dataset, consisting of 2,990 diverse-sourced images, each equipped with a human-asked question focusing on its low-level attributes. We then measure the correctness of MLLMs on answering these questions. **_b)_** To examine the **_description_** ability of MLLMs on low-level information, we propose the **LLDescribe** dataset consisting of long expert-labelled *golden* low-level text descriptions on 499 images, and a GPT-involved comparison pipeline between outputs of MLLMs and the *golden* descriptions. **_c)_** Besides these two tasks, we further measure their visual quality **_assessment_** ability to align with human opinion scores. Specifically, we design a softmax-based strategy that enables MLLMs to predict *quantifiable* quality scores, and evaluate them on various existing image quality assessment (IQA) datasets. Our evaluation across the three abilities confirms that MLLMs possess preliminary low-level visual skills. However, these skills are still unstable and relatively imprecise, indicating the need for specific enhancements on MLLMs towards these abilities. 
We hope that our benchmark can encourage the research community to delve deeper to discover and enhance these untapped potentials of MLLMs.", "keywords": "Benchmark;Vision-Language;Large Language Models;Low-level Vision;Image Quality Assessment", "primary_area": "datasets and benchmarks", "supplementary_material": "/attachment/f30a94400274185c561b708ad935be64375bbe64.pdf", "author": "Haoning Wu;Zicheng Zhang;Erli Zhang;Chaofeng Chen;Liang Liao;Annan Wang;Chunyi Li;Wenxiu Sun;Qiong Yan;Guangtao Zhai;Weisi Lin", "authorids": "~Haoning_Wu1;~Zicheng_Zhang7;~Erli_Zhang1;~Chaofeng_Chen1;~Liang_Liao3;~Annan_Wang1;~Chunyi_Li1;~Wenxiu_Sun1;~Qiong_Yan1;~Guangtao_Zhai1;~Weisi_Lin1", "gender": "M;M;M;M;M;M;F;;M;M;M", "homepage": "https://teowu.github.io;;https://chaofengc.github.io/;https://liaoliang92.github.io/homepage/;;https://lcysyzxdxc.github.io;http://wenxiusun.com/;;https://faculty.sjtu.edu.cn/zhaiguangtao/en/index.htm;http://www.ntu.edu.sg/home/wslin/;", "dblp": "264/5802-1;32/749;198/2537;;;192/6758;16/9879;122/4814;19/3230;14/3737.html;", "google_scholar": "https://scholar.google.com.hk/citations?user=wth-VbMAAAAJ;gfjYZKMAAAAJ;lxiqnI0AAAAJ;kqTUHSIAAAAJ;;https://scholar.google.com/citations?hl=en;X9lE6O4AAAAJ;uT9CtPYAAAAJ;E6zbSYgAAAAJ;https://scholar.google.com.tw/citations?user=D_S41X4AAAAJ;QICTEckAAAAJ", "orcid": "0000-0001-8642-8101;;0000-0001-6137-5162;0000-0002-2238-2420;0009-0004-2998-9817;;;;;;", "linkedin": ";zhang-erli/;;;annan-wang-1026241a4;;;;;;", "or_profile": "~Haoning_Wu1;~Erli_Zhang1;~Chaofeng_Chen1;~Liang_Liao3;~Annan_Wang1;~Chunyi_Li1;~Wenxiu_Sun1;~Qiong_Yan1;~Guangtao_Zhai1;~Weisi_Lin1;~zicheng_zhang6", "aff": "Nanyang Technological University;Nanyang Technological University;Nanyang Technological University;Nanyang Technological University;Nanyang Technological University;Shanghai Artificial Intelligence Laboratory;SenseTime Group Limited;SenseTime Research;Shanghai Jiaotong University;Nanyang Technological University;Shanghai Jiaotong University", "aff_domain": "ntu.edu.sg;ntu.edu.sg;ntu.edu.sg;ntu.edu.sg;ntu.edu.sg;pjlab.org.cn;sensetime.com;sensetime.com;sjtu.edu.cn;ntu.edu.sg;sjtu.edu.cn", "position": "PhD student;Undergrad student;Postdoc;Postdoc;Researcher;Intern;Principal Researcher;Research Director;Full Professor;Full Professor;PhD student", "bibtex": "@inproceedings{\nwu2024qbench,\ntitle={Q-Bench: A Benchmark for General-Purpose Foundation Models on Low-level Vision},\nauthor={Haoning Wu and Zicheng Zhang and Erli Zhang and Chaofeng Chen and Liang Liao and Annan Wang and Chunyi Li and Wenxiu Sun and Qiong Yan and Guangtao Zhai and Weisi Lin},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=0V5TVt9bk0}\n}", "github": "", "project": "", "reviewers": "gz7s;rhgp;1bay", "pdf_size": 5992170, "rating": "6;8;8", "confidence": "5;4;5", "soundness": "3;3;3", "contribution": "3;3;3", "presentation": "3;3;3", "wc_summary": "43;91;100", "wc_strengths": "67;45;44", "wc_weaknesses": "75;27;114", "wc_questions": "4;23;2", "wc_review": "189;186;260", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "1389;717;3118", "reply_reviewers": "0;0;0", "reply_authors": "4;1;5", "rating_avg": [ 7.333333333333333, 0.9428090415820634 ], "confidence_avg": [ 4.666666666666667, 0.4714045207910317 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 78.0, 25.019992006393608 ], "wc_strengths_avg": [ 52.0, 10.614455552060438 ], 
"wc_weaknesses_avg": [ 72.0, 35.58089374931439 ], "wc_questions_avg": [ 9.666666666666666, 9.46337971105226 ], "wc_review_avg": [ 211.66666666666666, 34.19876540981495 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 1741.3333333333333, 1011.3701377614209 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 3.3333333333333335, 1.699673171197595 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 11, 0 ], "corr_rating_confidence": -0.4999999999999999, "gs_citation": 151, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11683847823892452807&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=0V5TVt9bk0", "pdf": "https://openreview.net/pdf?id=0V5TVt9bk0", "email": "ntu.edu.sg;ntu.edu.sg;ntu.edu.sg;ntu.edu.sg;ntu.edu.sg;pjlab.org.cn;sensetime.com;sensetime.com;sjtu.edu.cn;ntu.edu.sg;sjtu.edu.cn", "author_num": 11, "aff_unique_index": "0;0;0;0;0;1;2;3;4;0;4", "aff_unique_norm": "Nanyang Technological University;Shanghai Artificial Intelligence Laboratory;SenseTime Group Limited;SenseTime;Shanghai Jiao Tong University", "aff_unique_dep": ";;;SenseTime Research;", "aff_unique_url": "https://www.ntu.edu.sg;http://www.shailab.org/;https://www.sensetime.com;https://www.sensetime.com;https://www.sjtu.edu.cn", "aff_unique_abbr": "NTU;Shanghai AI Lab;SenseTime;SenseTime;SJTU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;1;1;1;1;0;1", "aff_country_unique": "Singapore;China" }, { "title": "MOFDiff: Coarse-grained Diffusion for Metal-Organic Framework Design", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19615", "id": "0VBsoluxR2", "author_site": "Xiang Fu, Tian Xie, Andrew Rosen, Tommi Jaakkola, Jake Smith", "tldr": "", "abstract": "Metal-organic frameworks (MOFs) are of immense interest in applications such as gas storage and carbon capture due to their exceptional porosity and tunable chemistry. Their modular nature has enabled the use of template-based methods to generate hypothetical MOFs by combining molecular building blocks in accordance with known network topologies. However, the ability of these methods to identify top-performing MOFs is often hindered by the limited diversity of the resulting chemical space. In this work, we propose MOFDiff: a coarse-grained (CG) diffusion model that generates CG MOF structures through a denoising diffusion process over the coordinates and identities of the building blocks. The all-atom MOF structure is then determined through a novel assembly algorithm. As the diffusion model generates 3D MOF structures by predicting scores in E(3), we employ equivariant graph neural networks that respect the permutational and roto-translational symmetries. We comprehensively evaluate our model's capability to generate valid and novel MOF structures and its effectiveness in designing outstanding MOF materials for carbon capture applications with molecular simulations.", "keywords": "Materials design;diffusion model;metal-organic framework;carbon capture;generative model;AI for Science", "primary_area": "applications to physical sciences (physics, chemistry, biology, etc.)", "supplementary_material": "/attachment/a45d7028d2af95b6f15c66409ef120981a054831.zip", "author": "Xiang Fu;Tian Xie;Andrew Scott Rosen;Tommi S. 
Jaakkola;Jake Allen Smith", "authorids": "~Xiang_Fu4;~Tian_Xie2;~Andrew_Scott_Rosen1;~Tommi_S._Jaakkola1;~Jake_Allen_Smith1", "gender": "M;M;M;;M", "homepage": "https://xiangfu.co/;http://www.txie.me;https://rosen.cbe.princeton.edu/;;", "dblp": "97/374-5.html;;;;", "google_scholar": "https://scholar.google.com/citations?view_op=list_works;xFbOAf8AAAAJ;lHBjgLsAAAAJ;;lSQbg6kAAAAJ", "orcid": ";;0000-0002-0141-7006;;", "linkedin": ";txie-93/;andrew-s-rosen/;;jakeallensmith", "or_profile": "~Xiang_Fu4;~Tian_Xie2;~Andrew_Scott_Rosen1;~Tommi_S._Jaakkola1;~Jake_Allen_Smith1", "aff": "Massachusetts Institute of Technology;Microsoft Research AI for Science;University of California, Berkeley;;Microsoft", "aff_domain": "mit.edu;microsoft.com;berkeley.edu;;microsoft.com", "position": "PhD student;Senior Researcher;Postdoc;;Researcher", "bibtex": "@inproceedings{\nfu2024mofdiff,\ntitle={{MOFD}iff: Coarse-grained Diffusion for Metal-Organic Framework Design},\nauthor={Xiang Fu and Tian Xie and Andrew Scott Rosen and Tommi S. Jaakkola and Jake Allen Smith},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=0VBsoluxR2}\n}", "github": "", "project": "", "reviewers": "1BzN;yqBG;nQJ6;e39L", "pdf_size": 18740242, "rating": "8;8;8;8", "confidence": "4;3;3;4", "soundness": "3;3;2;3", "contribution": "3;3;2;2", "presentation": "3;3;3;4", "wc_summary": "65;184;159;182", "wc_strengths": "65;61;84;75", "wc_weaknesses": "75;91;251;105", "wc_questions": "149;73;68;211", "wc_review": "354;409;562;573", "wc_reply_reviewers": "0;12;229;43", "wc_reply_authors": "791;626;1125;1319", "reply_reviewers": "0;1;1;1", "reply_authors": "2;2;3;4", "rating_avg": [ 8.0, 0.0 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 147.5, 48.63383595810637 ], "wc_strengths_avg": [ 71.25, 8.954747344286158 ], "wc_weaknesses_avg": [ 130.5, 70.37577708274347 ], "wc_questions_avg": [ 125.25, 59.00158896165424 ], "wc_review_avg": [ 474.5, 95.090746132313 ], "wc_reply_reviewers_avg": [ 71.0, 92.56079083499665 ], "wc_reply_authors_avg": [ 965.25, 272.081214897317 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 2.75, 0.82915619758885 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 20, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12303585458809639061&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=0VBsoluxR2", "pdf": "https://openreview.net/pdf?id=0VBsoluxR2", "email": "mit.edu;microsoft.com;berkeley.edu;;microsoft.com", "author_num": 5, "aff_unique_index": "0;1;2;1", "aff_unique_norm": "Massachusetts Institute of Technology;Microsoft;University of California, Berkeley", "aff_unique_dep": ";AI for Science;", "aff_unique_url": "https://web.mit.edu;https://www.microsoft.com/en-us/research/group/ai-for-science;https://www.berkeley.edu", "aff_unique_abbr": "MIT;Microsoft Research;UC Berkeley", "aff_campus_unique_index": "1", "aff_campus_unique": ";Berkeley", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "id": "0VKEJKKLvr", "title": "A GRAPH-BASED REPRESENTATION LEARNING APPROACH FOR BREAST CANCER RISK PREDICTION USING GENOTYPE DATA", "track": "main", "status": "Reject", "tldr": "", "abstract": "Breast cancer risk prediction using genotype data is a 
critical task in personalized medicine. However, the high dimensionality and potential redundancy of genetic features pose challenges for accurate risk prediction. We present a graph-based representation learning pipeline for breast cancer risk prediction. Our method addresses the issue of feature redundancy by developing an ensemble-based feature selection approach. We evaluated the performance of the graph-based approach in a breast cancer risk prediction task using a dataset of 644,585 genetic variants from Biobank of Eastern Finland, consisting of 168 cases and 1558 controls and compared it with the classical machine learning models. Using 200 top-ranked genetic variants selected by the ensemble approach, the graph convolutional network\n(GCN) achieved area under the ROC curve (AUC) of 0.986 \u00b1 0.001 in discriminating cases and controls, which is better than an XGBoost model with AUC of 0.955 \u00b1 0.0034", "keywords": "Graph representation;Deep learning;Single nucleotide polymorphism;Breast cancer", "primary_area": "applications to physical sciences (physics, chemistry, biology, etc.)", "supplementary_material": "", "author": "Naga Raju Gudhe;veli-matti Kosma;Hamid Behravan;Arto Mannermaa", "authorids": "~Naga_Raju_Gudhe1;~veli-matti_Kosma1;~Hamid_Behravan1;~Arto_Mannermaa1", "gender": "M;M;M;Not Specified", "homepage": ";https://www.uef.fi;;https://www.uef.fi/fi/", "dblp": ";;;", "google_scholar": "ijCl-MMAAAAJ;;JARPOGcAAAAJ;", "orcid": ";;;", "linkedin": ";;;", "or_profile": "~Naga_Raju_Gudhe1;~veli-matti_Kosma1;~Hamid_Behravan1;~Arto_Mannermaa1", "aff": "University of Eastern Finland ;uef;;", "aff_domain": "uef.fi;uef.fi;;", "position": "Researcher;Full Professor;;", "bibtex": "@misc{\ngudhe2024a,\ntitle={A {GRAPH}-{BASED} {REPRESENTATION} {LEARNING} {APPROACH} {FOR} {BREAST} {CANCER} {RISK} {PREDICTION} {USING} {GENOTYPE} {DATA}},\nauthor={Naga Raju Gudhe and veli-matti Kosma and Hamid Behravan and Arto Mannermaa},\nyear={2024},\nurl={https://openreview.net/forum?id=0VKEJKKLvr}\n}", "github": "", "project": "", "reviewers": "fYgW;6KR2;etdw;VT6g", "site": "https://openreview.net/forum?id=0VKEJKKLvr", "pdf_size": 1157317, "rating": "3;3;3;3", "confidence": "4;5;5;4", "soundness": "1;2;1;2", "contribution": "2;2;1;1", "presentation": "2;3;2;2", "wc_summary": "54;173;92;73", "wc_strengths": "44;7;37;29", "wc_weaknesses": "280;351;123;144", "wc_questions": "7;61;97;161", "wc_review": "385;592;349;407", "wc_reply_reviewers": "0;19;0;0", "wc_reply_authors": "1784;955;751;916", "reply_reviewers": "0;1;0;0", "reply_authors": "5;5;2;5", "rating_avg": [ 3.0, 0.0 ], "confidence_avg": [ 4.5, 0.5 ], "soundness_avg": [ 1.5, 0.5 ], "contribution_avg": [ 1.5, 0.5 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 98.0, 45.33762234612662 ], "wc_strengths_avg": [ 29.25, 13.899190623917638 ], "wc_weaknesses_avg": [ 224.5, 94.69028461251978 ], "wc_questions_avg": [ 81.5, 55.97097462078001 ], "wc_review_avg": [ 433.25, 93.96375631061159 ], "wc_reply_reviewers_avg": [ 4.75, 8.227241335952167 ], "wc_reply_authors_avg": [ 1101.5, 401.41281743362407 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 4.25, 1.299038105676658 ], "replies_avg": [ 24, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=4674983461646892121&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "University of Eastern Finland", 
"aff_unique_dep": "", "aff_unique_url": "https://www.uef.fi", "aff_unique_abbr": "UEF", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "Finland" }, { "id": "0VZP2Dr9KX", "title": "Baseline Defenses for Adversarial Attacks Against Aligned Language Models", "track": "main", "status": "Reject", "tldr": "", "abstract": "As large language models (LLMs) quickly become ubiquitous, it becomes critical to understand their security vulnerabilities.\nRecent work shows that text optimizers can produce jailbreaking prompts that bypass moderation and alignment. \nDrawing from the rich body of work on adversarial machine learning, we approach these attacks with three questions: \nWhat threat models are practically useful in this domain? How do baseline defense techniques perform in this new domain? How does LLM security differ from computer vision?\nWe evaluate several baseline defense strategies against leading adversarial attacks on LLMs, discussing the various settings in which each is feasible and effective. \nIn particular, we look at three types of defenses: detection (perplexity based), input preprocessing (paraphrase and retokenization), and adversarial training. \nWe discuss white-box and gray-box settings and discuss the robustness-performance trade-off for each of the defenses considered. \nWe find that the weakness of existing discrete optimizers for text, combined with the relatively high costs of optimization, makes standard adaptive attacks more challenging for LLMs. Future research will be needed to uncover whether more powerful optimizers can be developed, or whether the strength of filtering and preprocessing defenses is greater in the LLMs domain than it has been in computer vision.", "keywords": "baseline defenses;attacks", "primary_area": "generative models", "supplementary_material": "/attachment/842cb8f7c9593337cbb293b35d290955a1feadff.zip", "author": "Neel Jain;Avi Schwarzschild;Yuxin Wen;Gowthami Somepalli;John Kirchenbauer;Ping-yeh Chiang;Micah Goldblum;Aniruddha Saha;Jonas Geiping;Tom Goldstein", "authorids": "~Neel_Jain1;~Avi_Schwarzschild1;~Yuxin_Wen2;~Gowthami_Somepalli1;~John_Kirchenbauer1;~Ping-yeh_Chiang1;~Micah_Goldblum1;~Aniruddha_Saha1;~Jonas_Geiping1;~Tom_Goldstein1", "gender": ";M;;F;M;;;M;M;M", "homepage": ";https://cs.umd.edu/~avi1;https://yuxinwenrick.github.io/;https://somepago.github.io/;https://jwkirchenbauer.notion.site/;;;https://ani0075saha.github.io/;https://jonasgeiping.github.io/;https://www.cs.umd.edu/~tomg/", "dblp": ";249/9334.html;;286/5012;321/0678;236/4288;241/7231;221/8102;190/7229;25/8184", "google_scholar": "https://scholar.google.com/citations?hl=en;WNvQ7AcAAAAJ;oUYfjg0AAAAJ;T2ezBDsAAAAJ;48GJrbsAAAAJ;WUoMq1IAAAAJ;pGDKzuUAAAAJ;xfjALj0AAAAJ;https://scholar.google.de/citations?user=206vNCEAAAAJ;KmSuVtgAAAAJ", "orcid": ";;;;;;;;;", "linkedin": "neel-jain-0a6a239/;;;;johnkirchenbauer/;;;;;", "or_profile": "~Neel_Jain1;~Avi_Schwarzschild1;~Yuxin_Wen2;~Gowthami_Somepalli1;~John_Kirchenbauer1;~Ping-yeh_Chiang1;~Micah_Goldblum1;~Aniruddha_Saha1;~Jonas_Geiping1;~Tom_Goldstein1", "aff": "University of Maryland, College Park;Carnegie Mellon University;University of Maryland, College Park;University of Maryland, College Park;University of Maryland, College Park;University of Maryland, College Park;New York University;University of Maryland, College Park;Max Planck Institute for Intelligent Systems, Max-Planck Institute;University of Maryland, College Park", "aff_domain": 
"umd.edu;cmu.edu;umd.edu;umd.edu;umd.edu;umd.edu;nyu.edu;umd.edu;tuebingen.mpg.de;umd.edu", "position": "PhD student;Postdoc;PhD student;PhD student;PhD student;PhD student;Postdoc;Postdoc;Principal Researcher;Full Professor", "bibtex": "@misc{\njain2024baseline,\ntitle={Baseline Defenses for Adversarial Attacks Against Aligned Language Models},\nauthor={Neel Jain and Avi Schwarzschild and Yuxin Wen and Gowthami Somepalli and John Kirchenbauer and Ping-yeh Chiang and Micah Goldblum and Aniruddha Saha and Jonas Geiping and Tom Goldstein},\nyear={2024},\nurl={https://openreview.net/forum?id=0VZP2Dr9KX}\n}", "github": "", "project": "", "reviewers": "9hm2;UELn;hCXb;Ywox", "site": "https://openreview.net/forum?id=0VZP2Dr9KX", "pdf_size": 544029, "rating": "3;5;5;8", "confidence": "4;4;4;3", "soundness": "2;3;3;4", "contribution": "2;2;3;3", "presentation": "2;3;3;4", "wc_summary": "32;64;59;93", "wc_strengths": "11;56;40;50", "wc_weaknesses": "1088;124;439;81", "wc_questions": "83;14;39;4", "wc_review": "1214;258;577;228", "wc_reply_reviewers": "928;47;0;0", "wc_reply_authors": "1569;379;290;427", "reply_reviewers": "2;1;0;0", "reply_authors": "3;1;1;1", "rating_avg": [ 5.25, 1.7853571071357126 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 62.0, 21.644860821913362 ], "wc_strengths_avg": [ 39.25, 17.282577932704367 ], "wc_weaknesses_avg": [ 433.0, 402.6307241132996 ], "wc_questions_avg": [ 35.0, 30.504098085339287 ], "wc_review_avg": [ 569.25, 396.57620642191836 ], "wc_reply_reviewers_avg": [ 243.75, 395.5176197086547 ], "wc_reply_authors_avg": [ 666.25, 523.5156993825495 ], "reply_reviewers_avg": [ 0.75, 0.82915619758885 ], "reply_authors_avg": [ 1.5, 0.8660254037844386 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 10, 0 ], "corr_rating_confidence": -0.8892972917998875, "gs_citation": 111, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14062897331071035133&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 3, "aff_unique_index": "0;1;0;0;0;0;2;0;3;0", "aff_unique_norm": "University of Maryland;Carnegie Mellon University;New York University;Max Planck Institute for Intelligent Systems", "aff_unique_dep": ";;;Intelligent Systems", "aff_unique_url": "https://www/umd.edu;https://www.cmu.edu;https://www.nyu.edu;https://www.mpi-is.mpg.de", "aff_unique_abbr": "UMD;CMU;NYU;MPI-IS", "aff_campus_unique_index": "0;0;0;0;0;0;0", "aff_campus_unique": "College Park;", "aff_country_unique_index": "0;0;0;0;0;0;0;0;1;0", "aff_country_unique": "United States;Germany" }, { "id": "0XVLzHp6Fd", "title": "Towards Well-distributed Generative Networks Using Adversarial Autoencoders", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "In addition to perceptual quality, the usefulness of a generative model depends on how closely the generated distribution matches the training distribution. Previous efforts in adversarial generative models have focused on reducing \"mode collapse\", but this term, roughly meaning being unable to generate certain parts of the data distribution, is not clearly defined. In addition, being able to generate every image in the data distribution does not imply reproducing the correct distribution, which additionally requires that each image occur at the same frequency in the generated images as in the training data. 
Due to the lack of a precise definition and measurement, it has been difficult to evaluate the success of these efforts in producing the correct distribution. In this work we propose an autoencoder-based adversarial training framework, which ensures that the density of the encoder's aggregate output distribution closely matches the prior latent distribution, which in turn ensures that the distribution of images generated from randomly sampled latent code will closely match the training data. To evaluate our method, we introduce the 3DShapeHD dataset, which has a moderate complexity that goes beyond simplistic toy datasets, but also an exactly known generating process and distribution of features, which enables precise measurements. Using the reduced chi-square statistic, we show significant improvement in the accuracy of the distribution of generated samples. The results also demonstrate that the enhanced diversity of our model improves the ability to generate uncommon features in real-world datasets.", "keywords": "Generative Networks;Adversarial Autoencoders", "primary_area": "generative models", "supplementary_material": "/attachment/eacc6662cae5bb13d789ff08640d7368b3ac5710.zip", "author": "Sitao Xiang;Pengda Xiang;Yajie Zhao", "authorids": "~Sitao_Xiang1;~Pengda_Xiang1;~Yajie_Zhao1", "gender": "M;M;F", "homepage": ";;https://www.yajie-zhao.com/", "dblp": "199/1894;262/3792;54/7467", "google_scholar": "vPMqq2AAAAAJ;;", "orcid": "0000-0001-9296-6889;;", "linkedin": ";pengda-xiang-20a81410a/;", "or_profile": "~Sitao_Xiang1;~Pengda_Xiang1;~Yajie_Zhao1", "aff": "University of Southern California;University of Southern California;USC Institute for Creative Technologies, University of Southern California", "aff_domain": "usc.edu;usc.edu;ict.usc.edu", "position": "PhD student;PhD student;Director", "bibtex": "@misc{\nxiang2024towards,\ntitle={Towards Well-distributed Generative Networks Using Adversarial Autoencoders},\nauthor={Sitao Xiang and Pengda Xiang and Yajie Zhao},\nyear={2024},\nurl={https://openreview.net/forum?id=0XVLzHp6Fd}\n}", "github": "", "project": "", "reviewers": "EFy9;p6Dj;e5hk;Jjz9", "site": "https://openreview.net/forum?id=0XVLzHp6Fd", "pdf_size": 539437, "rating": "3;3;3;3", "confidence": "4;4;4;4", "soundness": "2;2;2;2", "contribution": "1;2;2;1", "presentation": "2;1;2;2", "wc_summary": "102;28;79;74", "wc_strengths": "81;17;72;13", "wc_weaknesses": "324;81;527;44", "wc_questions": "124;7;14;460", "wc_review": "631;133;692;591", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 3.0, 0.0 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 1.5, 0.5 ], "presentation_avg": [ 1.75, 0.4330127018922193 ], "wc_summary_avg": [ 70.75, 26.845623479442605 ], "wc_strengths_avg": [ 45.75, 30.946526460977815 ], "wc_weaknesses_avg": [ 244.0, 195.61313861803865 ], "wc_questions_avg": [ 151.25, 184.19741447696816 ], "wc_review_avg": [ 511.75, 221.60931275557894 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:8PQCC3f1At0J:scholar.google.com/&scioq=Towards+Well-distributed+Generative+Networks+Using+Adversarial+Autoencoders&hl=en&as_sdt=0,44", "gs_version_total": 0, "aff_unique_index": "0;0;0", "aff_unique_norm": 
"University of Southern California", "aff_unique_dep": "", "aff_unique_url": "https://www.usc.edu", "aff_unique_abbr": "USC", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Los Angeles", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "0Y26tFG3WF", "title": "Inducing Precision in Lagrangian Neural Networks : Proof of concept application on Chaotic systems", "track": "main", "status": "Reject", "tldr": "", "abstract": "Solutions of dynamic systems that exhibit chaotic behavior are particularly sensitive to errors in initial/intermediate state estimates when long term dynamics is of interest. Lagrangian Neural Networks (LNN) are a class of physics induced learning methods that seamlessly integrate physical conservation laws into functional solutions, by forming a parametric Lagrangian for the system of interest. However it has been seen that the function approximation error associated with the parametric Lagrangian modelling could prove to be catastrophic for the prediction of long term dynamics of chaotic systems. This makes improving the precision of the parametric Lagrangian particularly crucial. Considering the same in this work a modified Lagrangian Neural Network approach is proposed, where a customized neural network architecture is designed to directly emphasize the relative importance of each significant bit in the Lagrangian estimates produced. We evaluate our method on two dynamic systems that are well known in the literature in exhibiting deterministic chaos, namely the double pendulum and Henon-Helies systems. Further, we compare the obtained solutions with those estimated by Finite Element solvers (under optimal conditions) to validate the relative accuracy. We observe that the trajectory deviations as a result of chaotic behavior can be significantly reduced by the process of explicitly enforcing the precision requirement for the parametric Lagrangian, as modelled using the proposed approach.", "keywords": "Physics Informed Learning;Deep Learning;Neural Networks;Chaotic systems.", "primary_area": "neurosymbolic & hybrid AI systems (physics-informed, logic & formal reasoning, etc.)", "supplementary_material": "", "author": "Hrithwik Shalu;Bharath Govindarajan", "authorids": "~Hrithwik_Shalu1;~Bharath_Govindarajan1", "gender": "M;", "homepage": ";https://mgbharath.com", "dblp": "271/7953;", "google_scholar": ";", "orcid": "0000-0002-8944-434X;0009-0000-0430-9775", "linkedin": ";", "or_profile": "~Hrithwik_Shalu1;~Bharath_Govindarajan1", "aff": ";Indian Institute of Technology Madras", "aff_domain": ";iitm.ac.in", "position": ";Assistant Professor", "bibtex": "@misc{\nshalu2024inducing,\ntitle={Inducing Precision in Lagrangian Neural Networks : Proof of concept application on Chaotic systems},\nauthor={Hrithwik Shalu and Bharath Govindarajan},\nyear={2024},\nurl={https://openreview.net/forum?id=0Y26tFG3WF}\n}", "github": "", "project": "", "reviewers": "2inG;HA5A;88d6", "site": "https://openreview.net/forum?id=0Y26tFG3WF", "pdf_size": 1890347, "rating": "3;3;5", "confidence": "4;3;3", "soundness": "2;3;3", "contribution": "1;1;2", "presentation": "2;2;3", "wc_summary": "107;61;53", "wc_strengths": "151;20;40", "wc_weaknesses": "363;105;101", "wc_questions": "76;2;182", "wc_review": "697;188;376", "wc_reply_reviewers": "214;112;1509", "wc_reply_authors": "495;624;2332", "reply_reviewers": "2;1;11", "reply_authors": "3;2;12", "rating_avg": [ 3.6666666666666665, 0.9428090415820634 ], "confidence_avg": [ 3.3333333333333335, 
0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 1.3333333333333333, 0.4714045207910317 ], "presentation_avg": [ 2.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 73.66666666666667, 23.79542439676633 ], "wc_strengths_avg": [ 70.33333333333333, 57.62136949276911 ], "wc_weaknesses_avg": [ 189.66666666666666, 122.5760534887989 ], "wc_questions_avg": [ 86.66666666666667, 73.87075800943761 ], "wc_review_avg": [ 420.3333333333333, 210.14968210513402 ], "wc_reply_reviewers_avg": [ 611.6666666666666, 635.8754245570083 ], "wc_reply_authors_avg": [ 1150.3333333333333, 837.2225245151707 ], "reply_reviewers_avg": [ 4.666666666666667, 4.496912521077347 ], "reply_authors_avg": [ 5.666666666666667, 4.496912521077347 ], "replies_avg": [ 36, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.5, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:o33sgZ2O4TAJ:scholar.google.com/&scioq=Inducing+Precision+in+Lagrangian+Neural+Networks+:+Proof+of+concept+application+on+Chaotic+systems&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0", "aff_unique_norm": "Indian Institute of Technology Madras", "aff_unique_dep": "", "aff_unique_url": "https://www.iitm.ac.in", "aff_unique_abbr": "IIT Madras", "aff_campus_unique_index": "0", "aff_campus_unique": "Madras", "aff_country_unique_index": "0", "aff_country_unique": "India" }, { "id": "0Z6lN4GYrO", "title": "S4G: Breaking the Bottleneck on Graphs with Structured State Spaces", "track": "main", "status": "Reject", "tldr": "", "abstract": "The majority of GNNs are based on message-passing mechanisms, however, message-passing neural networks (MPNN) have inherent limitations in capturing long-range interactions. The exponentially growing node information is compressed into fixed-size representations through multiple rounds of message passing, bringing the over-squashing problem, which severely hinders the flow of information on the graph and creates a bottleneck in graph learning. The natural idea of introducing global attention to point-to-point communication, as adopted in graph Transformers (GT), lacks inductive biases on graph structures and relies on complex positional encodings to enhance their performance in practical tasks. In this paper, we observe that the sensitivity between nodes in MPNN decreases exponentially with the shortest path distance. Contrarily, GT has a constant sensitivity, which leads to its loss of inductive bias. To address these issues, we introduce structured state spaces to capture the hierarchical structure of rooted-trees, achieving linear sensitivity with theoretical guarantees. We further propose a novel graph convolution based on the state-space model, resulting in a new paradigm that retains both the strong inductive biases from MPNN and the long-range modeling capabilities from GT. 
Extensive experimental results on long-range and general graph benchmarks demonstrate the superiority of our approach.", "keywords": "GNN;over-squashing;state-space models", "primary_area": "learning on graphs and other geometries & topologies", "supplementary_material": "", "author": "Yunchong Song;Siyuan Huang;Jiacheng Cai;Xinbing Wang;Chenghu Zhou;Zhouhan Lin", "authorids": "~Yunchong_Song1;~Siyuan_Huang8;~Jiacheng_Cai1;~Xinbing_Wang1;~Chenghu_Zhou3;~Zhouhan_Lin1", "gender": "M;M;;M;M;M", "homepage": "https://github.com/realCrush;https://github.com/SiyuanHuangSJTU;https://github.com/imjccai;http://www.cs.sjtu.edu.cn/~wang-xb/;http://www.igsnrr.cas.cn/gkjj/ysfc/ysfc_zhouchenghu/;https://hantek.github.io", "dblp": "339/6816;62/885-3;;96/1149.html;85/1324.html;121/7919.html", "google_scholar": "C-TqDNsAAAAJ;https://scholar.google.com/citations?view_op=list_works;;https://scholar.google.com.tw/citations?user=CT5yZbwAAAAJ;;https://scholar.google.ca/citations?user=LNZ4efwAAAAJ", "orcid": ";;0009-0004-1304-5651;0000-0002-0357-8356;;0009-0009-7204-0689", "linkedin": ";siyuan-huang-885863235/;;;;https://ca.linkedin.com/in/zhouhan-lin-34b98975", "or_profile": "~Yunchong_Song1;~Siyuan_Huang8;~Jiacheng_Cai1;~Xinbing_Wang1;~Chenghu_Zhou3;~Zhouhan_Lin1", "aff": "Shanghai Jiaotong University;Shanghai Jiaotong University;Shanghai Jiaotong University;Shanghai Jiaotong University;IGSNRR, Chinese Academy of Sciences, Beijing, China;Shanghai Jiaotong University", "aff_domain": "sjtu.edu.cn;sjtu.edu.cn;sjtu.edu.cn;cs.sjtu.edu.cn;lreis.ac.cn;sjtu.edu.cn", "position": "PhD student;MS student;Undergrad student;Full Professor;Full Professor;Assistant Professor", "bibtex": "@misc{\nsong2024sg,\ntitle={S4G: Breaking the Bottleneck on Graphs with Structured State Spaces},\nauthor={Yunchong Song and Siyuan Huang and Jiacheng Cai and Xinbing Wang and Chenghu Zhou and Zhouhan Lin},\nyear={2024},\nurl={https://openreview.net/forum?id=0Z6lN4GYrO}\n}", "github": "", "project": "", "reviewers": "rkT5;SDke;qfiX", "site": "https://openreview.net/forum?id=0Z6lN4GYrO", "pdf_size": 297226, "rating": "3;3;8", "confidence": "4;4;3", "soundness": "2;2;3", "contribution": "1;2;3", "presentation": "2;3;3", "wc_summary": "121;87;79", "wc_strengths": "29;45;36", "wc_weaknesses": "473;175;31", "wc_questions": "5;45;5", "wc_review": "628;352;151", "wc_reply_reviewers": "121;33;0", "wc_reply_authors": "1925;1410;204", "reply_reviewers": "1;1;0", "reply_authors": "5;4;2", "rating_avg": [ 4.666666666666667, 2.357022603955158 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.816496580927726 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 95.66666666666667, 18.208667044996883 ], "wc_strengths_avg": [ 36.666666666666664, 6.548960901462833 ], "wc_weaknesses_avg": [ 226.33333333333334, 184.06037656764212 ], "wc_questions_avg": [ 18.333333333333332, 18.856180831641268 ], "wc_review_avg": [ 377.0, 195.5351630781533 ], "wc_reply_reviewers_avg": [ 51.333333333333336, 51.07075701634177 ], "wc_reply_authors_avg": [ 1179.6666666666667, 721.2259624340272 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 3.6666666666666665, 1.247219128924647 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.9999999999999998, "gs_citation": 1, "gs_cited_by_link": 
"https://scholar.google.com/scholar?cites=3235799037450276266&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 0, "aff_unique_index": "0;0;0;0;1;0", "aff_unique_norm": "Shanghai Jiao Tong University;Chinese Academy of Sciences", "aff_unique_dep": ";IGSNRR", "aff_unique_url": "https://www.sjtu.edu.cn;http://www.cas.cn", "aff_unique_abbr": "SJTU;CAS", "aff_campus_unique_index": "1", "aff_campus_unique": ";Beijing", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "China" }, { "id": "0ZUKLCxwBo", "title": "A simple and interpretable model of grokking modular arithmetic tasks", "track": "main", "status": "Reject", "tldr": "", "abstract": "We present a simple neural network that can generalize on various modular arithmetic tasks such as modular addition or multiplication, and exhibits a sudden jump in generalization known as \\emph{grokking}. Concretely, we present (i) fully-connected two-layer networks that exhibit grokking on various modular arithmetic tasks under vanilla gradient descent with the MSE loss function in the absence of any regularization; (ii) evidence that grokking modular arithmetic corresponds to learning specific representations whose structure is determined by the task; (iii) \\emph{analytic} expressions for the weights -- and thus for the embedding -- that solve a large class of modular arithmetic tasks; and (iv) evidence that these representations are also found by gradient descent as well as AdamW, establishing complete (\"mechanistic\") interpretability of the representations learnt by the network.", "keywords": "grokking;mechanistic interpretability;emergent capabilities;emergence;physics of AI;phase transition;circuits;pattern formation;solvable model;superposition", "primary_area": "visualization or interpretation of learned representations", "supplementary_material": "/attachment/1973960be8120f5bc7f29ceecc4b0319e7610e40.pdf", "author": "Andrey Gromov", "authorids": "~Andrey_Gromov1", "gender": "M", "homepage": "", "dblp": "", "google_scholar": "D056qfMAAAAJ", "orcid": "", "linkedin": "andrey-gromov-2329a241", "or_profile": "~Andrey_Gromov1", "aff": "University of Maryland, College Park", "aff_domain": "umd.edu", "position": "Assistant Professor", "bibtex": "@misc{\ngromov2024a,\ntitle={A simple and interpretable model of grokking modular arithmetic tasks},\nauthor={Andrey Gromov},\nyear={2024},\nurl={https://openreview.net/forum?id=0ZUKLCxwBo}\n}", "github": "", "project": "", "reviewers": "QK7D;UC6H;PaA4;9nDi;5GzG", "site": "https://openreview.net/forum?id=0ZUKLCxwBo", "pdf_size": 3005370, "rating": "5;5;6;6;8", "confidence": "3;4;3;3;4", "soundness": "2;3;2;4;4", "contribution": "2;2;2;4;4", "presentation": "2;3;3;3;4", "wc_summary": "59;46;65;35;34", "wc_strengths": "26;26;36;32;32", "wc_weaknesses": "202;83;43;241;50", "wc_questions": "1;52;41;47;44", "wc_review": "288;207;185;355;160", "wc_reply_reviewers": "0;10;0;447;7", "wc_reply_authors": "586;637;309;968;408", "reply_reviewers": "0;1;0;2;1", "reply_authors": "1;1;1;2;1", "rating_avg": [ 6.0, 1.0954451150103321 ], "confidence_avg": [ 3.4, 0.4898979485566356 ], "soundness_avg": [ 3.0, 0.8944271909999159 ], "contribution_avg": [ 2.8, 0.9797958971132712 ], "presentation_avg": [ 3.0, 0.6324555320336759 ], "wc_summary_avg": [ 47.8, 12.480384609458156 ], "wc_strengths_avg": [ 30.4, 3.8781438859330635 ], "wc_weaknesses_avg": [ 123.8, 81.84228735806448 ], "wc_questions_avg": [ 37.0, 18.36300628982085 ], "wc_review_avg": [ 239.0, 72.16370278748174 ], "wc_reply_reviewers_avg": [ 92.8, 
177.1433317965991 ], "wc_reply_authors_avg": [ 581.6, 226.64562647445902 ], "reply_reviewers_avg": [ 0.8, 0.7483314773547883 ], "reply_authors_avg": [ 1.2, 0.4 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 1, 0 ], "corr_rating_confidence": 0.372677996249965, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:1q11UVO1wBYJ:scholar.google.com/&scioq=A+simple+and+interpretable+model+of+grokking+modular+arithmetic+tasks&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0", "aff_unique_norm": "University of Maryland", "aff_unique_dep": "", "aff_unique_url": "https://www/umd.edu", "aff_unique_abbr": "UMD", "aff_campus_unique_index": "0", "aff_campus_unique": "College Park", "aff_country_unique_index": "0", "aff_country_unique": "United States" }, { "id": "0aEUd9UtiA", "title": "DiffCPS: Diffusion Model based Constrained Policy Search for Offline Reinforcement Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "Constrained policy search (CPS) is a fundamental problem in offline reinforcement learning, which is generally solved by advantage weighted regression (AWR). However, previous methods may still encounter out-of-distribution actions due to the limited expressivity of Gaussian-based policies. On the other hand, directly applying the state-of-the-art models with distribution expression capabilities (i.e., diffusion models) in the AWR framework is insufficient since AWR requires exact policy probability densities, which is intractable in diffusion models. In this paper, we propose a novel approach called $\\textbf{Diffusion Model based Constrained Policy Search (DiffCPS)}$, which tackles the diffusion-based constrained policy search without resorting to AWR. The theoretical analysis reveals our key insights by leveraging the action distribution of the diffusion model to eliminate the policy distribution constraint in the CPS and then utilizing the Evidence Lower Bound (ELBO) of diffusion-based policy to approximate the KL constraint. Consequently, DiffCPS admits the high expressivity of diffusion models while circumventing the cumbersome density calculation brought by AWR. Extensive experimental results based on the D4RL benchmark demonstrate the efficacy of our approach. We empirically show that DiffCPS achieves better or at least competitive performance compared to traditional AWR-based baselines as well as recent diffusion-based offline RL methods. 
Code will be made publicly available upon acceptance.", "keywords": "Offline Reinforcement Learning;Diffusion Model;Constrained Policy Search;Advantage Weighted Regression", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/2582bad1d6b9e644523f98a64d91c81c19286f6b.zip", "author": "Longxiang He;Linrui Zhang;Junbo Tan;Xueqian Wang", "authorids": "~Longxiang_He2;~Linrui_Zhang1;~Junbo_Tan1;~Xueqian_Wang1", "gender": "M;M;M;M", "homepage": "https://say-hello2y.github.io/;;;", "dblp": "358/7083;;192/2867;43/3563-1", "google_scholar": "KTGh2zYAAAAJ;;https://scholar.google.com/citations?hl=en;h9dN_ykAAAAJ", "orcid": ";;;0000-0003-3542-0593", "linkedin": ";%E9%BA%9F%E7%9D%BF-%E5%BC%A0-bb5312222/;;", "or_profile": "~Longxiang_He2;~Linrui_Zhang1;~Junbo_Tan1;~Xueqian_Wang1", "aff": "Tsinghua University;;Tsinghua University;Tsinghua University", "aff_domain": "mail.tsinghua.edu.cn;;tsinghua.edu.cn;tsinghua.edu.cn", "position": "MS student;;Associate Professor;Full Professor", "bibtex": "@misc{\nhe2024diffcps,\ntitle={Diff{CPS}: Diffusion Model based Constrained Policy Search for Offline Reinforcement Learning},\nauthor={Longxiang He and Linrui Zhang and Junbo Tan and Xueqian Wang},\nyear={2024},\nurl={https://openreview.net/forum?id=0aEUd9UtiA}\n}", "github": "", "project": "", "reviewers": "4x5N;UbgT;hHF8", "site": "https://openreview.net/forum?id=0aEUd9UtiA", "pdf_size": 2207264, "rating": "3;5;8", "confidence": "5;4;4", "soundness": "2;2;4", "contribution": "2;2;3", "presentation": "2;3;4", "wc_summary": "49;58;92", "wc_strengths": "22;74;65", "wc_weaknesses": "165;123;259", "wc_questions": "97;114;71", "wc_review": "333;369;487", "wc_reply_reviewers": "188;88;24", "wc_reply_authors": "1175;1332;594", "reply_reviewers": "1;1;1", "reply_authors": "3;3;1", "rating_avg": [ 5.333333333333333, 2.0548046676563256 ], "confidence_avg": [ 4.333333333333333, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.9428090415820634 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 3.0, 0.816496580927726 ], "wc_summary_avg": [ 66.33333333333333, 18.517259216441534 ], "wc_strengths_avg": [ 53.666666666666664, 22.691163233490013 ], "wc_weaknesses_avg": [ 182.33333333333334, 56.858498827254394 ], "wc_questions_avg": [ 94.0, 17.682382946499793 ], "wc_review_avg": [ 396.3333333333333, 65.7740239169098 ], "wc_reply_reviewers_avg": [ 100.0, 67.4882705858334 ], "wc_reply_authors_avg": [ 1033.6666666666667, 317.4296072447489 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 2.3333333333333335, 0.9428090415820634 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.8029550685469661, "gs_citation": 7, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=17102329719247376787&as_sdt=5,31&sciodt=0,31&hl=en", "gs_version_total": 3, "aff_unique_index": "0;0;0", "aff_unique_norm": "Tsinghua University", "aff_unique_dep": "", "aff_unique_url": "https://www.tsinghua.edu.cn", "aff_unique_abbr": "THU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "China" }, { "title": "Revisiting Plasticity in Visual Reinforcement Learning: Data, Modules and Training Stages", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19614", "id": "0aR1s9YxoL", "author_site": "Guozheng Ma, Lu Li, Sen Zhang, Zixuan Liu, Zhen Wang, Yixin Chen, Li Shen, Xueqian Wang, Dacheng Tao", "tldr": "", "abstract": "Plasticity, the ability of a 
neural network to evolve with new data, is crucial for high-performance and sample-efficient visual reinforcement learning (VRL). Although methods like resetting and regularization can potentially mitigate plasticity loss, the influences of various components within the VRL framework on the agent's plasticity are still poorly understood. In this work, we conduct a systematic empirical exploration focusing on three primary underexplored facets and derive the following insightful conclusions: (1) data augmentation is essential in maintaining plasticity; (2) the critic's plasticity loss serves as the principal bottleneck impeding efficient training; and (3) without timely intervention to recover critic's plasticity in the early stages, its loss becomes catastrophic. These insights suggest a novel strategy to address the high replay ratio (RR) dilemma, where exacerbated plasticity loss hinders the potential improvements of sample efficiency brought by increased reuse frequency. Rather than setting a static RR for the entire training process, we propose Adaptive RR, which dynamically adjusts the RR based on the critic\u2019s plasticity level. Extensive evaluations indicate that Adaptive RR not only avoids catastrophic plasticity loss in the early stages but also benefits from more frequent reuse in later phases, resulting in superior sample efficiency.", "keywords": "Plasticity;Visual Reinforcement Learning;Deep Reinforcement Learning;Sample Efficiency", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Guozheng Ma;Lu Li;Sen Zhang;Zixuan Liu;Zhen Wang;Yixin Chen;Li Shen;Xueqian Wang;Dacheng Tao", "authorids": "~Guozheng_Ma2;~Lu_Li5;~Sen_Zhang3;~Zixuan_Liu2;~Zhen_Wang9;~Yixin_Chen1;~Li_Shen1;~Xueqian_Wang1;~Dacheng_Tao1", "gender": "M;M;M;;;M;M;M;", "homepage": "https://guozheng-ma.github.io/;https://github.com/lilucse;https://github.com/SenZHANG-GitHub;https://panda-shawn.github.io;;https://www.cse.wustl.edu/~yixin.chen/;https://sites.google.com/site/mathshenli/home;;", "dblp": ";;57/6221-6;254/3346-2;;59/983;91/3680-8;43/3563-1;", "google_scholar": "jDvVglUAAAAJ;QPsrZx8AAAAJ;-bJJNV0AAAAJ;D4XufdkAAAAJ;;NByrsK0AAAAJ;yVhgENIAAAAJ;h9dN_ykAAAAJ;", "orcid": ";;;0000-0003-0667-9053;;;;0000-0003-3542-0593;", "linkedin": ";;;;;;;;", "or_profile": "~Guozheng_Ma2;~Lu_Li5;~Sen_Zhang3;~Zixuan_Liu2;~Zhen_Wang9;~Yixin_Chen1;~Li_Shen1;~Xueqian_Wang1;~Dacheng_Tao1", "aff": "Tsinghua University;Tsinghua University;University of Sydney, University of Sydney;Tsinghua University;;Washington University, Saint Louis;JD Explore Academy;Tsinghua University;", "aff_domain": "tsinghua.edu.cn;mails.tsinghua.edu.cn;sydney.edu.au;mails.tsinghua.edu.cn;;wustl.edu;jd.com;tsinghua.edu.cn;", "position": "MS student;MS student;Postdoc;MS student;;Full Professor;Researcher;Full Professor;", "bibtex": "@inproceedings{\nma2024revisiting,\ntitle={Revisiting Plasticity in Visual Reinforcement Learning: Data, Modules and Training Stages},\nauthor={Guozheng Ma and Lu Li and Sen Zhang and Zixuan Liu and Zhen Wang and Yixin Chen and Li Shen and Xueqian Wang and Dacheng Tao},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=0aR1s9YxoL}\n}", "github": "", "project": "", "reviewers": "c6tM;m8KG;Kom1;7W3D", "pdf_size": 6954013, "rating": "6;6;6;6", "confidence": "4;4;4;5", "soundness": "3;3;3;3", "contribution": "2;3;3;3", "presentation": "3;4;3;3", "wc_summary": "89;89;127;87", "wc_strengths": "107;256;42;202", 
"wc_weaknesses": "217;348;398;387", "wc_questions": "3;84;1;1", "wc_review": "416;777;568;677", "wc_reply_reviewers": "729;288;297;107", "wc_reply_authors": "4341;2617;2195;1018", "reply_reviewers": "4;2;1;1", "reply_authors": "11;5;5;3", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 98.0, 16.76305461424021 ], "wc_strengths_avg": [ 151.75, 82.82624885868006 ], "wc_weaknesses_avg": [ 337.5, 72.00868003234055 ], "wc_questions_avg": [ 22.25, 35.66072769868837 ], "wc_review_avg": [ 609.5, 133.95614954155707 ], "wc_reply_reviewers_avg": [ 355.25, 228.7098325389619 ], "wc_reply_authors_avg": [ 2542.75, 1192.1628192071753 ], "reply_reviewers_avg": [ 2.0, 1.224744871391589 ], "reply_authors_avg": [ 6.0, 3.0 ], "replies_avg": [ 38, 0 ], "authors#_avg": [ 9, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 15, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=17017605233893666116&as_sdt=80000005&sciodt=0,23&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=0aR1s9YxoL", "pdf": "https://openreview.net/pdf?id=0aR1s9YxoL", "email": "tsinghua.edu.cn;mails.tsinghua.edu.cn;sydney.edu.au;mails.tsinghua.edu.cn;;wustl.edu;jd.com;tsinghua.edu.cn;", "author_num": 9, "aff_unique_index": "0;0;1;0;2;3;0", "aff_unique_norm": "Tsinghua University;University of Sydney;Washington University in St. Louis;JD", "aff_unique_dep": ";;;JD Explore Academy", "aff_unique_url": "https://www.tsinghua.edu.cn;https://www.sydney.edu.au;https://wustl.edu;", "aff_unique_abbr": "THU;USYD;WUSTL;", "aff_campus_unique_index": "1", "aff_campus_unique": ";Saint Louis", "aff_country_unique_index": "0;0;1;0;2;0", "aff_country_unique": "China;Australia;United States;" }, { "title": "Contrastive Difference Predictive Coding", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19613", "id": "0akLDTFR9x", "author_site": "Chongyi Zheng, Ruslan Salakhutdinov, Benjamin Eysenbach", "tldr": "", "abstract": "Predicting and reasoning about the future lie at the heart of many time-series questions. For example, goal-conditioned reinforcement learning can be viewed as learning representations to predict which states are likely to be visited in the future. While prior methods have used contrastive predictive coding to model time series data, learning representations that encode long-term dependencies usually requires large amounts of data. In this paper, we introduce a temporal difference version of contrastive predictive coding that stitches together pieces of different time series data to decrease the amount of data required to learn predictions of future events. We apply this representation learning method to derive an off-policy algorithm for goal-conditioned RL. Experiments demonstrate that, compared with prior RL methods, ours achieves $2 \\times$ median improvement in success rates and can better cope with stochastic environments. 
In tabular settings, we show that our method is about $20\\times$ more sample efficient than the successor representation and $1500 \\times$ more sample efficient than the standard (Monte Carlo) version of contrastive predictive coding.", "keywords": "contrastive learning;reinforcement learning;goal-reaching;goal-conditioned RL;temporal difference", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Chongyi Zheng;Ruslan Salakhutdinov;Benjamin Eysenbach", "authorids": "~Chongyi_Zheng1;~Ruslan_Salakhutdinov1;~Benjamin_Eysenbach1", "gender": "M;M;M", "homepage": "https://chongyi-zheng.github.io;https://ben-eysenbach.github.io/;https://www.cs.cmu.edu/~rsalakhu/", "dblp": "250/9267;192/1863;", "google_scholar": "bezWXYcAAAAJ;DRnOvU8AAAAJ;", "orcid": ";0009-0000-7136-6307;", "linkedin": ";benjamin-eysenbach-a7235775/;", "or_profile": "~Chongyi_Zheng1;~Benjamin_Eysenbach1;~Russ_Salakhutdinov1", "aff": "Princeton University;Princeton University;School of Computer Science, Carnegie Mellon University", "aff_domain": "princeton.edu;princeton.edu;cs.cmu.edu", "position": "PhD student;Assistant Professor;Full Professor", "bibtex": "@inproceedings{\nzheng2024contrastive,\ntitle={Contrastive Difference Predictive Coding},\nauthor={Chongyi Zheng and Ruslan Salakhutdinov and Benjamin Eysenbach},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=0akLDTFR9x}\n}", "github": "", "project": "", "reviewers": "Jmo8;2Mg8;a2XQ;yDjK", "pdf_size": 2384774, "rating": "6;6;8;8", "confidence": "4;4;3;3", "soundness": "3;3;3;3", "contribution": "2;3;3;3", "presentation": "3;3;2;3", "wc_summary": "104;47;150;99", "wc_strengths": "83;27;38;179", "wc_weaknesses": "50;916;36;154", "wc_questions": "90;2;109;38", "wc_review": "327;992;333;470", "wc_reply_reviewers": "23;50;22;0", "wc_reply_authors": "528;1593;499;623", "reply_reviewers": "1;1;1;0", "reply_authors": "1;3;1;1", "rating_avg": [ 7.0, 1.0 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 100.0, 36.489724581037876 ], "wc_strengths_avg": [ 81.75, 59.93903152370749 ], "wc_weaknesses_avg": [ 289.0, 364.8575064323057 ], "wc_questions_avg": [ 59.75, 42.2751404492049 ], "wc_review_avg": [ 530.5, 272.5165132611233 ], "wc_reply_reviewers_avg": [ 23.75, 17.725334975678173 ], "wc_reply_authors_avg": [ 810.75, 453.955050087561 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 1.5, 0.8660254037844386 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -1.0, "gs_citation": 15, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=4196335089185927383&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=0akLDTFR9x", "pdf": "https://openreview.net/pdf?id=0akLDTFR9x", "email": "princeton.edu;princeton.edu;cs.cmu.edu", "author_num": 3, "aff_unique_index": "0;0;1", "aff_unique_norm": "Princeton University;Carnegie Mellon University", "aff_unique_dep": ";School of Computer Science", "aff_unique_url": "https://www.princeton.edu;https://www.cmu.edu", "aff_unique_abbr": "Princeton;CMU", "aff_campus_unique_index": "1", "aff_campus_unique": ";Pittsburgh", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "0b328CMwn1", "title": "Visual Prompting Reimagined: The Power of Activation Prompts", "track": 
"main", "status": "Reject", "tldr": "", "abstract": "Visual prompting (VP) has emerged as a popular method to repurpose large pretrained models for downstream vision tasks. Unlike many parameter-efficient finetuning (PEFT) techniques that modify model parameters, VP introduces a universal perturbation directly into the input data to facilitate task-specific finetuning while keeping the pretrained model intact. However, there exists a noticeable performance gap between VP and conventional finetuning methods, highlighting an unexplored realm in theory and practice to understand and advance VP to close its performance gap. Towards this end, we introduce a novel concept, termed activation prompt (AP), which extends the scope of input-level VP by enabling universal perturbations to be applied to activation maps within the intermediate layers of the model. With the aid of AP, we show that VP, by its input perturbation design, has intrinsic limitations in both performance and efficiency. By contrast, AP shares a natural connection to normalization tuning, e.g., batch normalization for convolutional neural networks (CNNs) and layer normalization for vision transformers (ViTs). This illuminates the reason behind the observed better accuracy of normalization tuning than VP in the literature. Furthermore, we show that the choice of prompting exhibits a distinct preference for layer depth, with conclusions varying significantly between CNNs and ViTs. We theoretically elucidate the rationale behind such preference by analyzing global features across layers. By conducting extensive experiments across 29 datasets and various model architectures, we provide a thorough performance analysis of AP, comparing it with VP and PEFT baselines. Our experimental results demonstrate that AP significantly surpasses the input-level VP in terms of both accuracy and efficiency, considering factors like time, parameters, memory usage, and throughout. 
These results further support our new insights into the incapabilities of VP and the capabilities of AP.", "keywords": "parameter-efficient fine-tuning;transfer learning", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "/attachment/6eed97249d815d388daa515edac5e1984c1012d1.zip", "author": "Yihua Zhang;Hongkang Li;Yuguang Yao;Aochuan Chen;Shuai Zhang;Pin-Yu Chen;Meng Wang;Sijia Liu", "authorids": "~Yihua_Zhang1;~Hongkang_Li1;~Yuguang_Yao1;~Aochuan_Chen1;~Shuai_Zhang6;~Pin-Yu_Chen1;~Meng_Wang4;~Sijia_Liu1", "gender": "M;;M;M;M;M;F;M", "homepage": "https://yihua-zhang.com;https://lohek330.github.io/lihongkang.github.io/;https://www.cse.msu.edu/~yaoyugua/;https://scholar.google.com/citations?hl=en&view_op=list_works&gmla=AJsN-F6N4cEX-_kViGgRpnUVo_iBHlVXwMpnhlyB-Cdrndwj6B0jaDy088r7K9gHPGqSwsQ9tNxpijGpb1IoIB2B5KVS3Scvtdz9Mt_WR9GSou_saurFpSA&user=7pY-Ie8AAAAJ;https://inchs708.github.io/shuaizhang.github.io/index.html;http://www.pinyuchen.com;https://www.ecse.rpi.edu/~wang/index.html;https://lsjxjtu.github.io/", "dblp": ";318/8643;238/9467;331/2356;71/208-15;39/8969;93/6765-3;128/6972-1", "google_scholar": "https://scholar.google.com/citations?hl=zh-CN;https://scholar.google.com.hk/citations?user=DVlDPjMAAAAJ;-chIdAkAAAAJ;https://scholar.google.com/citations?hl=en;https://scholar.google.com/citations?view_op=list_works;jxwlCUUAAAAJ;;C7dO_UgAAAAJ", "orcid": ";;;0009-0002-2300-1498;0000-0001-8280-6988;0000-0003-1039-8369;;", "linkedin": "zhangyihua/;hongkang-li-b7a341173/;tonyyaomsu/;;;pin-yu-chen-940062a2;;", "or_profile": "~Yihua_Zhang1;~Hongkang_Li1;~Yuguang_Yao1;~Aochuan_Chen1;~Shuai_Zhang6;~Pin-Yu_Chen1;~Meng_Wang4;~Sijia_Liu1", "aff": "Michigan State University;Rensselaer Polytechnic Institute;Michigan State University;Hong Kong University of Science and Technology;New Jersey Institute of Technology;International Business Machines;Rensselaer Polytechnic Institute;Michigan State University", "aff_domain": "msu.edu;rpi.edu;msu.edu;ust.hk;njit.edu;ibm.com;rpi.edu;msu.edu", "position": "PhD student;PhD student;PhD student;PhD student;Assistant Professor;Principal Researcher;Associate Professor;Assistant Professor", "bibtex": "@misc{\nzhang2024visual,\ntitle={Visual Prompting Reimagined: The Power of Activation Prompts},\nauthor={Yihua Zhang and Hongkang Li and Yuguang Yao and Aochuan Chen and Shuai Zhang and Pin-Yu Chen and Meng Wang and Sijia Liu},\nyear={2024},\nurl={https://openreview.net/forum?id=0b328CMwn1}\n}", "github": "", "project": "", "reviewers": "Z13f;jt12;Yfja;TRtL", "site": "https://openreview.net/forum?id=0b328CMwn1", "pdf_size": 3550602, "rating": "5;5;5;6", "confidence": "4;4;4;2", "soundness": "3;3;2;4", "contribution": "3;3;2;3", "presentation": "2;3;3;4", "wc_summary": "96;56;39;100", "wc_strengths": "39;28;34;70", "wc_weaknesses": "105;270;331;106", "wc_questions": "65;216;27;149", "wc_review": "305;570;431;425", "wc_reply_reviewers": "249;0;0;91", "wc_reply_authors": "1952;1143;1534;1186", "reply_reviewers": "1;0;0;1", "reply_authors": "4;3;3;3", "rating_avg": [ 5.25, 0.4330127018922193 ], "confidence_avg": [ 3.5, 0.8660254037844386 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 72.75, 25.9939896899264 ], "wc_strengths_avg": [ 42.75, 16.20763708873073 ], "wc_weaknesses_avg": [ 203.0, 99.85739832380973 ], "wc_questions_avg": [ 114.25, 73.48256595955262 ], "wc_review_avg": [ 432.75, 93.83596059080975 ], 
"wc_reply_reviewers_avg": [ 85.0, 101.71283104898811 ], "wc_reply_authors_avg": [ 1453.75, 325.1725503482728 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 3.25, 0.4330127018922193 ], "replies_avg": [ 24, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": -1.0, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=210525781623516819&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 2, "aff_unique_index": "0;1;0;2;3;4;1;0", "aff_unique_norm": "Michigan State University;Rensselaer Polytechnic Institute;Hong Kong University of Science and Technology;New Jersey Institute of Technology;International Business Machines Corporation", "aff_unique_dep": ";;;;", "aff_unique_url": "https://www.msu.edu;https://www.rpi.edu;https://www.ust.hk;https://www.njit.edu;https://www.ibm.com", "aff_unique_abbr": "MSU;RPI;HKUST;NJIT;IBM", "aff_campus_unique_index": "1", "aff_campus_unique": ";Hong Kong SAR", "aff_country_unique_index": "0;0;0;1;0;0;0;0", "aff_country_unique": "United States;China" }, { "title": "NEFTune: Noisy Embeddings Improve Instruction Finetuning", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19612", "id": "0bMmZ3fkCk", "author_site": "Neel Jain, Ping-yeh Chiang, Yuxin Wen, John Kirchenbauer, Hong-Min Chu, Gowthami Somepalli, Brian Bartoldson, Bhavya Kailkhura, Avi Schwarzschild, Aniruddha Saha, Micah Goldblum, Jonas Geiping, Tom Goldstein", "tldr": "", "abstract": "We show that language model finetuning can be improved, sometimes dramatically, with a simple augmentation. \nNEFTune adds noise to the embedding vectors during training.\nStandard finetuning of LLaMA-2-7B using Alpaca achieves $29.79$\\% on AlpacaEval, which rises to $64.69$\\% using noisy embeddings. NEFTune also improves over strong baselines on modern instruction datasets.\nModels trained with Evol-Instruct see a $10$\\% improvement, with ShareGPT an $8$\\% improvement, and with OpenPlatypus an $8$\\% improvement. \nEven powerful models further refined with RLHF such as LLaMA-2-Chat benefit from additional training with NEFTune. Particularly, we see these improvements on the conversational abilities of the instruction model and not on traditional tasks like those on the OpenLLM Leaderboard, where performance is the same.", "keywords": "Instruction Finetuning", "primary_area": "generative models", "supplementary_material": "/attachment/d78c3905a8b9202b58358079384a6a098d702065.zip", "author": "Neel Jain;Ping-yeh Chiang;Yuxin Wen;John Kirchenbauer;Hong-Min Chu;Gowthami Somepalli;Brian R. 
Bartoldson;Bhavya Kailkhura;Avi Schwarzschild;Aniruddha Saha;Micah Goldblum;Jonas Geiping;Tom Goldstein", "authorids": "~Neel_Jain1;~Ping-yeh_Chiang1;~Yuxin_Wen2;~John_Kirchenbauer1;~Hong-Min_Chu1;~Gowthami_Somepalli1;~Brian_R._Bartoldson1;~Bhavya_Kailkhura1;~Avi_Schwarzschild1;~Aniruddha_Saha1;~Micah_Goldblum1;~Jonas_Geiping1;~Tom_Goldstein1", "gender": ";;;M;;F;M;M;M;;M;M;M", "homepage": ";;https://yuxinwenrick.github.io/;https://jwkirchenbauer.notion.site/;;https://somepago.github.io/;https://people.llnl.gov/kailkhura1;https://cs.umd.edu/~avi1;https://ani0075saha.github.io/;;https://jonasgeiping.github.io/;https://www.cs.umd.edu/~tomg/;https://brianbartoldson.wordpress.com/", "dblp": ";236/4288;;321/0678;185/0720;286/5012;132/8938;249/9334.html;221/8102;241/7231;190/7229;25/8184;220/5475", "google_scholar": "https://scholar.google.com/citations?hl=en;WUoMq1IAAAAJ;oUYfjg0AAAAJ;48GJrbsAAAAJ;;T2ezBDsAAAAJ;SQpJmOgAAAAJ;WNvQ7AcAAAAJ;xfjALj0AAAAJ;pGDKzuUAAAAJ;https://scholar.google.de/citations?user=206vNCEAAAAJ;KmSuVtgAAAAJ;YdiZoJgAAAAJ", "orcid": ";;;;;;;;;;;;", "linkedin": "neel-jain-0a6a239/;;;johnkirchenbauer/;;;;;;;;;", "or_profile": "~Neel_Jain1;~Ping-yeh_Chiang1;~Yuxin_Wen2;~John_Kirchenbauer1;~Hong-Min_Chu1;~Gowthami_Somepalli1;~Bhavya_Kailkhura1;~Avi_Schwarzschild1;~Aniruddha_Saha1;~Micah_Goldblum1;~Jonas_Geiping1;~Tom_Goldstein1;~Brian_R_Bartoldson1", "aff": "University of Maryland, College Park;University of Maryland, College Park;University of Maryland, College Park;University of Maryland, College Park;Department of Computer Science, University of Maryland, College Park;University of Maryland, College Park;Lawrence Livermore National Laboratory;Carnegie Mellon University;University of Maryland, College Park;New York University;Max Planck Institute for Intelligent Systems, Max-Planck Institute;University of Maryland, College Park;Lawrence Livermore National Labs", "aff_domain": "umd.edu;umd.edu;umd.edu;umd.edu;cs.umd.edu;umd.edu;llnl.gov;cmu.edu;umd.edu;nyu.edu;tuebingen.mpg.de;umd.edu;llnl.gov", "position": "PhD student;PhD student;PhD student;PhD student;PhD student;PhD student;Research Staff;Postdoc;Postdoc;Postdoc;Principal Researcher;Full Professor;Researcher", "bibtex": "@inproceedings{\njain2024neftune,\ntitle={{NEFT}une: Noisy Embeddings Improve Instruction Finetuning},\nauthor={Neel Jain and Ping-yeh Chiang and Yuxin Wen and John Kirchenbauer and Hong-Min Chu and Gowthami Somepalli and Brian R. 
Bartoldson and Bhavya Kailkhura and Avi Schwarzschild and Aniruddha Saha and Micah Goldblum and Jonas Geiping and Tom Goldstein},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=0bMmZ3fkCk}\n}", "github": "", "project": "", "reviewers": "nFQe;kT9q;Agi9;h2qY", "pdf_size": 705584, "rating": "5;6;6;6", "confidence": "4;4;3;4", "soundness": "2;3;3;3", "contribution": "2;3;3;3", "presentation": "3;3;3;3", "wc_summary": "51;49;65;145", "wc_strengths": "47;119;148;255", "wc_weaknesses": "342;199;156;344", "wc_questions": "33;86;97;48", "wc_review": "473;453;466;792", "wc_reply_reviewers": "73;26;121;1159", "wc_reply_authors": "1050;375;632;1251", "reply_reviewers": "1;1;1;2", "reply_authors": "4;2;2;3", "rating_avg": [ 5.75, 0.4330127018922193 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 77.5, 39.455671328720285 ], "wc_strengths_avg": [ 142.25, 74.76421269564737 ], "wc_weaknesses_avg": [ 260.25, 84.13790762789387 ], "wc_questions_avg": [ 66.0, 26.334388164527386 ], "wc_review_avg": [ 546.0, 142.2093527163386 ], "wc_reply_reviewers_avg": [ 344.75, 471.3058322363516 ], "wc_reply_authors_avg": [ 827.0, 343.4508698489494 ], "reply_reviewers_avg": [ 1.25, 0.4330127018922193 ], "reply_authors_avg": [ 2.75, 0.82915619758885 ], "replies_avg": [ 25, 0 ], "authors#_avg": [ 13, 0 ], "corr_rating_confidence": -0.3333333333333333, "gs_citation": 53, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=7229125578067553201&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=0bMmZ3fkCk", "pdf": "https://openreview.net/pdf?id=0bMmZ3fkCk", "email": "umd.edu;umd.edu;umd.edu;umd.edu;cs.umd.edu;umd.edu;llnl.gov;cmu.edu;umd.edu;nyu.edu;tuebingen.mpg.de;umd.edu;llnl.gov", "author_num": 13, "aff_unique_index": "0;0;0;0;1;0;2;3;0;4;5;0;2", "aff_unique_norm": "University of Maryland;University of Maryland, College Park;Lawrence Livermore National Laboratory;Carnegie Mellon University;New York University;Max Planck Institute for Intelligent Systems", "aff_unique_dep": ";Department of Computer Science;;;;Intelligent Systems", "aff_unique_url": "https://www/umd.edu;https://www/umd.edu;https://www.llnl.gov;https://www.cmu.edu;https://www.nyu.edu;https://www.mpi-is.mpg.de", "aff_unique_abbr": "UMD;UMD;LLNL;CMU;NYU;MPI-IS", "aff_campus_unique_index": "0;0;0;0;0;0;0;0", "aff_campus_unique": "College Park;", "aff_country_unique_index": "0;0;0;0;0;0;0;0;0;0;1;0;0", "aff_country_unique": "United States;Germany" }, { "id": "0bjIoHD45G", "title": "Closing the gap on tabular data with Fourier and Implicit Categorical Features", "track": "main", "status": "Reject", "tldr": "", "abstract": "While Deep Learning has demonstrated impressive results in applications on various data types, it continues to lag behind tree-based methods when applied to tabular data, often referred to as the last \u201cunconquered castle\u201d for neural networks. We hypothesize that a significant advantage of tree-based methods lies in their intrinsic capability to model and exploit non-linear interactions induced by features with categorical characteristics. In contrast, neural-based methods exhibit biases toward a uniform numerical processing of features and smooth solutions, making it challenging for them to effectively leverage such patterns. 
We aim to address this performance gap by using simple, statistical-based feature processing techniques to identify and explicitly encode features that are strongly correlated with the target once discretized, as well as mitigate the bias of deep models for overly-smooth solutions, a bias that does not align with the inherent properties of the data, using Learned Fourier Features. Our proposed feature processing and method achieves a performance that closely matches or surpasses XGBoost on a comprehensive tabular data benchmark.", "keywords": "tabular data;neural networks;feature processing;deep learning;tree-based methods;xgboost", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Marius Dragoi;Florin Gogianu;Elena Burceanu", "authorids": "~Marius_Dragoi1;~Florin_Gogianu1;~Elena_Burceanu1", "gender": ";M;F", "homepage": ";;http://ilarele.github.io/", "dblp": ";230/0696;139/7814", "google_scholar": ";Zfk931sAAAAJ;bL34yDkAAAAJ", "orcid": ";;", "linkedin": ";;elena-burceanu-97016539/", "or_profile": "~Marius_Dragoi1;~Florin_Gogianu1;~Elena_Burceanu1", "aff": ";Bitdefender;Bitdefender", "aff_domain": ";bitdefender.com;bitdefender.com", "position": ";Researcher;Principal Researcher", "bibtex": "@misc{\ndragoi2024closing,\ntitle={Closing the gap on tabular data with Fourier and Implicit Categorical Features},\nauthor={Marius Dragoi and Florin Gogianu and Elena Burceanu},\nyear={2024},\nurl={https://openreview.net/forum?id=0bjIoHD45G}\n}", "github": "", "project": "", "reviewers": "tmhZ;xxW1;d92g;AFsk;HCF3", "site": "https://openreview.net/forum?id=0bjIoHD45G", "pdf_size": 386366, "rating": "3;3;5;5;5", "confidence": "5;4;5;4;4", "soundness": "2;1;4;3;3", "contribution": "2;1;3;2;2", "presentation": "1;2;3;3;3", "wc_summary": "97;126;84;18;72", "wc_strengths": "51;40;41;13;48", "wc_weaknesses": "536;610;26;37;514", "wc_questions": "1;107;11;83;129", "wc_review": "685;883;162;151;763", "wc_reply_reviewers": "0;0;0;0;0", "wc_reply_authors": "316;710;112;355;705", "reply_reviewers": "0;0;0;0;0", "reply_authors": "1;1;1;1;1", "rating_avg": [ 4.2, 0.9797958971132712 ], "confidence_avg": [ 4.4, 0.48989794855663565 ], "soundness_avg": [ 2.6, 1.019803902718557 ], "contribution_avg": [ 2.0, 0.6324555320336759 ], "presentation_avg": [ 2.4, 0.8 ], "wc_summary_avg": [ 79.4, 35.57302348690648 ], "wc_strengths_avg": [ 38.6, 13.45511055324333 ], "wc_weaknesses_avg": [ 344.6, 257.63974848613714 ], "wc_questions_avg": [ 66.2, 51.35912771844943 ], "wc_review_avg": [ 528.8, 310.47730996000337 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 439.6, 233.79871684848914 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.16666666666666666, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6422472616623222499&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "Bitdefender", "aff_unique_dep": "", "aff_unique_url": "https://www.bitdefender.com", "aff_unique_abbr": "Bitdefender", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "Romania" }, { "id": "0cJ8ERfnrM", "title": "Antibody DomainBed: Out-of-Distribution Generalization in Therapeutic Protein Design", "track": "main", "status": "Reject", "tldr": "", "abstract": "Recently, there has been an increased interest in accelerating drug design with machine 
learning (ML). Active ML-guided design of biological sequences with favorable properties involves multiple design cycles in which (1) candidate sequences are proposed, (2) a subset of the candidates is selected using ML surrogate models trained to predict target properties of interest, and (3) sequences are experimentally validated. The returned experimental results from one cycle provide valuable feedback for the next one, but the modifications they inspire in the candidate proposals or experimental protocol can lead to distribution shifts that impair the performance of surrogate models in the upcoming cycle. For the surrogate models to achieve consistent performance across cycles, we must explicitly account for the distribution shifts in their training. We apply domain generalization (DG) methods to develop robust classifiers for predicting properties of therapeutic antibodies. We adapt a recent benchmark of DG algorithms, ``DomainBed,'' to deploy DG algorithms across 5 domains, or design cycles. Our results suggest that foundational models and ensembling (in both output and weight space) lead to better predictive performance on out-of-distribution domains. We publicly release our codebase and the associated dataset of antibody-antigen binding that emulates distribution shifts across design cycles.", "keywords": "domain generalization;invariance;benchmarks;drug discovery", "primary_area": "applications to physical sciences (physics, chemistry, biology, etc.)", "supplementary_material": "", "author": "Natasa Tagasovska;Ji Won Park;Matthieu Kirchmeyer;Nathan C. Frey;Andrew Martin Watkins;Aya Abdelsalam Ismail;Arian Rokkum Jamasb;Edith Lee;Tyler Bryson;Stephen Ra;Kyunghyun Cho", "authorids": "~Natasa_Tagasovska2;~Ji_Won_Park1;~Matthieu_Kirchmeyer1;~Nathan_C._Frey1;~Andrew_Martin_Watkins1;~Aya_Abdelsalam_Ismail1;~Arian_Rokkum_Jamasb1;leee76@gene.com;brysont1@gene.com;~Stephen_Ra1;~Kyunghyun_Cho1", "gender": "F;F;;;M;F;;;;M;M", "homepage": "https://datascience.ch/team_member/natasa-tagasovska-computer-scientist/;;https://mkirchmeyer.github.io;https://ncfrey.github.io/;;https://ayaismail.com/;https://www.jamasb.io;;;https://www.stephenra.com;http://kyunghyuncho.me", "dblp": ";83/10554;241/9725;306/1335;;218/6661;296/2021;;;255/5897;41/9736", "google_scholar": "S2ZUSL0AAAAJ;URG3MMYAAAAJ;oJkKtrkAAAAJ;IMUja60AAAAJ;zglcuwEAAAAJ;VDhTJHUAAAAJ;https://scholar.google.co.uk/citations?user=hYm9a-UAAAAJ;;;bxl__-MAAAAJ;https://scholar.google.fi/citations?user=0RAmmIAAAAAJ", "orcid": ";0000-0002-0692-1092;;0000-0001-5291-6131;;;0000-0002-6727-7579;;;;", "linkedin": "natasha-tagasovska/;;;ncfrey;;;jamasb/;;;;", "or_profile": "~Natasa_Tagasovska2;~Ji_Won_Park1;~Matthieu_Kirchmeyer1;~Nathan_C._Frey1;~Andrew_Martin_Watkins1;~Aya_Abdelsalam_Ismail1;~Arian_Rokkum_Jamasb1;leee76@gene.com;brysont1@gene.com;~Stephen_Ra1;~Kyunghyun_Cho1", "aff": "Prescient Design - Genentech, Roche;Genentech;Genentech;Prescient Design, Genentech;Prescient Design, Genentech;Genentech;Prescient Design / Roche / Genentech;;;Prescient Design, Genentech;Genentech", "aff_domain": "roche.com;gene.com;gene.com;gene.com;gene.com;gene.com;roche.com;;;gene.com;gene.com", "position": "Senior Machine Learning Scientis;Researcher;Researcher;Researcher;Researcher;Researcher;Researcher;;;Director of Frontier Research;Senior Director of Frontier Research", "bibtex": "@misc{\ntagasovska2024antibody,\ntitle={Antibody DomainBed: Out-of-Distribution Generalization in Therapeutic Protein Design},\nauthor={Natasa Tagasovska and Ji Won Park and Matthieu 
Kirchmeyer and Nathan C. Frey and Andrew Martin Watkins and Aya Abdelsalam Ismail and Arian Rokkum Jamasb and Edith Lee and Tyler Bryson and Stephen Ra and Kyunghyun Cho},\nyear={2024},\nurl={https://openreview.net/forum?id=0cJ8ERfnrM}\n}", "github": "", "project": "", "reviewers": "keC4;nWam;PsDP;6GLG", "site": "https://openreview.net/forum?id=0cJ8ERfnrM", "pdf_size": 8990069, "rating": "5;5;6;6", "confidence": "3;3;4;3", "soundness": "2;2;3;3", "contribution": "3;2;3;3", "presentation": "2;2;4;3", "wc_summary": "67;127;110;69", "wc_strengths": "75;49;129;69", "wc_weaknesses": "205;172;233;322", "wc_questions": "59;48;128;211", "wc_review": "406;396;600;671", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "726;659;388;1149", "reply_reviewers": "0;0;0;0", "reply_authors": "2;2;1;2", "rating_avg": [ 5.5, 0.5 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.82915619758885 ], "wc_summary_avg": [ 93.25, 25.96512083545925 ], "wc_strengths_avg": [ 80.5, 29.609964538985857 ], "wc_weaknesses_avg": [ 233.0, 55.73598478541489 ], "wc_questions_avg": [ 111.5, 65.11720202834272 ], "wc_review_avg": [ 518.25, 119.95910761588718 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 730.5, 272.75492662828293 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.75, 0.4330127018922193 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 11, 0 ], "corr_rating_confidence": 0.5773502691896257, "gs_citation": 5, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=15368648657494412834&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 4, "aff_unique_index": "0;0;0;0;0;0;1;0;0", "aff_unique_norm": "Genentech;Roche", "aff_unique_dep": "Prescient Design;", "aff_unique_url": "https://www.gene.com;https://www.roche.com", "aff_unique_abbr": "Genentech;Roche", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0;1;0;0", "aff_country_unique": "United States;Switzerland" }, { "id": "0cZDnlw0WL", "title": "Causal Discovery with Unobserved Variables: A Proxy Variable Approach", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Discovering causal relations from observational data is important. The existence of unobserved variables, such as latent confounders or mediators, can mislead the causal identification. To address this issue, proximal causal discovery methods were proposed to adjust for the bias with the proxy of the unobserved variable. However, these methods only focused on discrete variables, which limits their real-world application. Besides, the extension to the continuous case is not easy as the naive discretization method can introduce biases due to the discretization error. To tackle this challenge, we propose a new method based on a comprehensive analysis regarding discretization error. We begin by identifying the source of discretization error and how it introduces the bias. We then introduce smoothness conditions under which the discretization error can be reduced to an infinitesimal level, provided the proxy is discretized with sufficiently fine bins. We also find that such conditions can hold for a broad family of causal models, e.g., Additive Noise Model. Based on this, we design a proxy-based hypothesis test that is provable to be consistent for identifying causal relationships within continuous variables. 
We demonstrate the utility of our method on synthetic and real-world data.", "keywords": "causal discovery;unobserved variables;proxy variables;discretization", "primary_area": "causal reasoning", "supplementary_material": "", "author": "Mingzhou Liu;Xinwei Sun;Yu QIAO;Yizhou Wang", "authorids": "~Mingzhou_Liu1;~Xinwei_Sun1;~Yu_QIAO3;~Yizhou_Wang1", "gender": "M;M;M;M", "homepage": ";https://sunxinwei0625.github.io/sunxw.github.io/;http://www.pami.sjtu.edu.cn/yuqiao;https://cfcs.pku.edu.cn/wangyizhou/", "dblp": "159/6544-1;145/6592-1;q/YuQiao3;71/3387-1", "google_scholar": ";;hO33bVgAAAAJ;831z_VcAAAAJ", "orcid": "0000-0002-0297-0938;;0000-0001-8258-3868;", "linkedin": ";;;", "or_profile": "~Mingzhou_Liu1;~Xinwei_Sun1;~Yu_QIAO3;~Yizhou_Wang1", "aff": "Peking University;Fudan University;Shanghai Jiaotong University;Peking University", "aff_domain": "pku.edu.cn;fudan.edu.cn;sjtu.edu.cn;pku.edu.cn", "position": "PhD student;Assistant Professor;Associate Professor;Full Professor", "bibtex": "@misc{\nliu2024causal,\ntitle={Causal Discovery with Unobserved Variables: A Proxy Variable Approach},\nauthor={Mingzhou Liu and Xinwei Sun and Yu QIAO and Yizhou Wang},\nyear={2024},\nurl={https://openreview.net/forum?id=0cZDnlw0WL}\n}", "github": "", "project": "", "reviewers": "4NAf;eeri;iFkV;iE3i", "site": "https://openreview.net/forum?id=0cZDnlw0WL", "pdf_size": 976510, "rating": "3;3;6;6", "confidence": "5;4;3;3", "soundness": "2;3;3;3", "contribution": "2;2;3;2", "presentation": "2;1;3;3", "wc_summary": "49;82;56;50", "wc_strengths": "19;17;37;23", "wc_weaknesses": "135;92;81;62", "wc_questions": "4;180;29;15", "wc_review": "207;371;203;150", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.5, 1.5 ], "confidence_avg": [ 3.75, 0.82915619758885 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.25, 0.82915619758885 ], "wc_summary_avg": [ 59.25, 13.40475661845451 ], "wc_strengths_avg": [ 24.0, 7.810249675906654 ], "wc_weaknesses_avg": [ 92.5, 26.781523481684157 ], "wc_questions_avg": [ 57.0, 71.56465608105722 ], "wc_review_avg": [ 232.75, 82.92880983108343 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.9045340337332909, "gs_citation": 5, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=17204668074576853571&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 0, "aff_unique_index": "0;1;2;0", "aff_unique_norm": "Peking University;Fudan University;Shanghai Jiao Tong University", "aff_unique_dep": ";;", "aff_unique_url": "http://www.pku.edu.cn;https://www.fudan.edu.cn;https://www.sjtu.edu.cn", "aff_unique_abbr": "Peking U;Fudan;SJTU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "China" }, { "title": "LiDAR-PTQ: Post-Training Quantization for Point Cloud 3D Object Detection", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19611", "id": "0d1gQI114C", "author_site": "Sifan Zhou, Liang Li, Xinyu Zhang, Bo Zhang, Shipeng Bai, Miao Sun, Ziyu Zhao, Xiaobo Lu, Xiangxiang Chu", "tldr": "", "abstract": "Due to highly constrained computing power and memory, deploying 3D lidar-based detectors on edge devices equipped in autonomous vehicles and robots poses a crucial 
challenge. Being a convenient and straightforward model compression approach, Post-Training Quantization (PTQ) has been widely adopted in 2D vision tasks. However, applying it directly to 3D lidar-based tasks inevitably leads to performance degradation. As a remedy, we propose an effective PTQ method called LiDAR-PTQ, which is particularly curated for 3D lidar detection (both SPConv-based and SPConv-free). Our LiDAR-PTQ features three main components, (1) a sparsity-based calibration method to determine the initialization of quantization parameters, (2) an adaptive rounding-to-nearest operation to minimize the layerwise reconstruction error, (3) a Task-guided Global Positive Loss (TGPL) to reduce the disparity between the final predictions before and after quantization. Extensive experiments demonstrate that our LiDAR-PTQ can achieve state-of-the-art quantization performance when applied to CenterPoint (both Pillar-based and Voxel-based). To our knowledge, for the very first time in lidar-based 3D detection tasks, the PTQ INT8 model's accuracy is almost the same as the FP32 model while enjoying 3X inference speedup. Moreover, our LiDAR-PTQ is cost-effective being 6X faster than the quantization-aware training method. The code will be released.", "keywords": "Quantization;3D Object Detection;Autonomous Driving", "primary_area": "applications to robotics, autonomy, planning", "supplementary_material": "", "author": "Sifan Zhou;Liang Li;Xinyu Zhang;Bo Zhang;Shipeng Bai;Miao Sun;Ziyu Zhao;Xiaobo Lu;Xiangxiang Chu", "authorids": "~Sifan_Zhou2;~Liang_Li10;~Xinyu_Zhang2;~Bo_Zhang7;~Shipeng_Bai1;~Miao_Sun2;~Ziyu_Zhao5;~Xiaobo_Lu1;~Xiangxiang_Chu1", "gender": "M;M;M;M;M;F;M;M;M", "homepage": "https://github.com/StiphyJay;https://myaccount.google.com/?hl=zh-CN;;;https://april.zju.edu.cn/team/shipeng-bai/;https://watercube001.github.io;;;https://cxxgtxy.github.io/", "dblp": "256/3342;;;36/2259-46;;;;93/8545;207/8002", "google_scholar": "kSdqoi0AAAAJ;z_fYeJoAAAAJ;zGLVABAAAAAJ;uUNQnu0AAAAJ;;4nYbZ0YAAAAJ;tfnKbVUAAAAJ;;jn21pUsAAAAJ", "orcid": "0000-0003-3602-7566;;;0000-0003-0564-617X;;;;;0000-0003-2548-0605", "linkedin": ";;;bo-zhang-20a86588/;;;;;", "or_profile": "~Sifan_Zhou2;~Liang_Li10;~Xinyu_Zhang2;~Bo_Zhang7;~Shipeng_Bai1;~Miao_Sun2;~Ziyu_Zhao5;~Xiaobo_Lu1;~Xiangxiang_Chu1", "aff": "Southeast University;Meituan;Meituan;Meituan Inc.;;Nanyang Technological University;Southeast University;Southeast University;MeiTuan", "aff_domain": "seu.edu.cn;meituan.com;meituan.com;meituan.com;;ntu.edu.sg;seu.edu.cn;seu.edu.cn;meituan.com", "position": "PhD student;Researcher;Researcher;Senior Software Engineer;;Postdoc;PhD student;Full Professor;Senior Engineer", "bibtex": "@inproceedings{\nzhou2024lidarptq,\ntitle={Li{DAR}-{PTQ}: Post-Training Quantization for Point Cloud 3D Object Detection},\nauthor={Sifan Zhou and Liang Li and Xinyu Zhang and Bo Zhang and Shipeng Bai and Miao Sun and Ziyu Zhao and Xiaobo Lu and Xiangxiang Chu},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=0d1gQI114C}\n}", "github": "", "project": "", "reviewers": "fLuR;3wrT;Dy1B;szHU", "pdf_size": 1397032, "rating": "6;6;6;6", "confidence": "4;3;3;4", "soundness": "2;3;3;3", "contribution": "2;3;3;2", "presentation": "3;3;3;3", "wc_summary": "41;191;60;117", "wc_strengths": "33;62;42;106", "wc_weaknesses": "213;196;43;51", "wc_questions": "17;49;80;29", "wc_review": "304;498;225;303", "wc_reply_reviewers": "79;0;0;53", "wc_reply_authors": "691;550;1024;834", 
"reply_reviewers": "1;0;0;1", "reply_authors": "2;2;3;2", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 102.25, 58.37540149754861 ], "wc_strengths_avg": [ 60.75, 28.154706533721853 ], "wc_weaknesses_avg": [ 125.75, 79.02966215289042 ], "wc_questions_avg": [ 43.75, 23.84716964337697 ], "wc_review_avg": [ 332.5, 100.78318312099495 ], "wc_reply_reviewers_avg": [ 33.0, 34.25638626592128 ], "wc_reply_authors_avg": [ 774.75, 175.47275429536063 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 2.25, 0.4330127018922193 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 9, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 12, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=3365312712747642645&as_sdt=5,47&sciodt=0,47&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=0d1gQI114C", "pdf": "https://openreview.net/pdf?id=0d1gQI114C", "email": "seu.edu.cn;meituan.com;meituan.com;meituan.com;;ntu.edu.sg;seu.edu.cn;seu.edu.cn;meituan.com", "author_num": 9, "aff_unique_index": "0;1;1;2;3;0;0;1", "aff_unique_norm": "Southeast University;Meituan;Meituan Inc.;Nanyang Technological University", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.seu.edu.cn/;https://www.meituan.com;https://www.meituan.com;https://www.ntu.edu.sg", "aff_unique_abbr": "SEU;Meituan;Meituan;NTU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;1;0;0;0", "aff_country_unique": "China;Singapore" }, { "id": "0e98EdIksA", "title": "A Theoretical and Empirical Analysis on Reconstruction Attacks and Defenses", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Reconstruction attacks and defenses are essential in understanding the data leakage problem in machine learning. However, prior work has centered around empirical observations of gradient inversion attacks, lacks theoretical groundings, and was unable to disentangle the usefulness of defending methods versus the computational limitation of attacking methods. In this work, we propose a strong reconstruction attack in the setting of federated learning. The attack reconstructs intermediate features and nicely integrates with and outperforms most of the previous methods. On this stronger attack, we thoroughly investigate both theoretically and empirically the effect of the most common defense methods. 
Our findings suggest that among various defense mechanisms, such as gradient clipping, dropout, additive noise, local aggregation, etc., gradient pruning emerges as the most effective strategy to defend against state-of-the-art attacks.", "keywords": "federated learning;learning theory;reconstruction attack;deep leakage from gradients", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/55503793094dd9a696750b77b430c4bcfbf8b2c6.pdf", "author": "Sheng Liu;Zihan Wang;Qi Lei", "authorids": "~Sheng_Liu2;~Zihan_Wang20;~Qi_Lei1", "gender": ";M;F", "homepage": "https://shengliu66.github.io/;;https://cecilialeiqi.github.io/", "dblp": ";;", "google_scholar": "rzhzR-cAAAAJ;ZBF2zKMAAAAJ;kGOgaowAAAAJ", "orcid": ";;", "linkedin": ";zihan-wang-3b0050249/;", "or_profile": "~Sheng_Liu2;~Zihan_Wang20;~Qi_Lei1", "aff": "Stanford University;New York University;New York University", "aff_domain": "stanford.edu;nyu.edu;nyu.edu", "position": "Postdoc;MS student;Assistant Professor", "bibtex": "@misc{\nliu2024a,\ntitle={A Theoretical and Empirical Analysis on Reconstruction Attacks and Defenses},\nauthor={Sheng Liu and Zihan Wang and Qi Lei},\nyear={2024},\nurl={https://openreview.net/forum?id=0e98EdIksA}\n}", "github": "", "project": "", "reviewers": "2Bck;puZu;1hsA", "site": "https://openreview.net/forum?id=0e98EdIksA", "pdf_size": 4911, "rating": "3;3;3", "confidence": "4;3;4", "soundness": "2;1;2", "contribution": "2;2;2", "presentation": "2;1;3", "wc_summary": "41;50;56", "wc_strengths": "16;19;64", "wc_weaknesses": "346;414;327", "wc_questions": "35;49;216", "wc_review": "438;532;663", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 3.0, 0.0 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 1.6666666666666667, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.0, 0.816496580927726 ], "wc_summary_avg": [ 49.0, 6.164414002968976 ], "wc_strengths_avg": [ 33.0, 21.95449840010015 ], "wc_weaknesses_avg": [ 362.3333333333333, 37.3482113211448 ], "wc_questions_avg": [ 100.0, 82.22327326655554 ], "wc_review_avg": [ 544.3333333333334, 92.26893060806306 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 3, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:WbWmshGe0vYJ:scholar.google.com/&scioq=A+Theoretical+and+Empirical+Analysis+on+Reconstruction+Attacks+and+Defenses&hl=en&as_sdt=0,14", "gs_version_total": 0, "aff_unique_index": "0;1;1", "aff_unique_norm": "Stanford University;New York University", "aff_unique_dep": ";", "aff_unique_url": "https://www.stanford.edu;https://www.nyu.edu", "aff_unique_abbr": "Stanford;NYU", "aff_campus_unique_index": "0", "aff_campus_unique": "Stanford;", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "0ez68a5UqI", "title": "Reinforcement Learning for Node Selection in Branch-and-Bound", "track": "main", "status": "Reject", "tldr": "", "abstract": "A big challenge in branch and bound lies in identifying the optimal node within the search tree from which to proceed. 
\nCurrent state-of-the-art selectors utilize either hand-crafted ensembles that automatically switch between naive sub-node selectors, or learned node selectors that rely on individual node data.\nWe propose a novel bi-simulation technique that uses reinforcement learning (RL) while considering the entire tree state, rather than just isolated nodes.\nTo achieve this, we train a graph neural network that produces a probability distribution based on the path from the model's root to its ``to-be-selected'' leaves. Modelling node-selection as a probability distribution allows us to train the model using state-of-the-art RL techniques that capture both intrinsic node-quality and node-evaluation costs.\nOur method induces a high quality node selection policy on a set of varied and complex problem sets, despite only being trained on specially designed, synthetic TSP instances.\nExperiments on several benchmarks show significant improvements in optimality gap reductions and per-node efficiency under strict time constraints.", "keywords": "Reinforcement Learning;Discrete Optimization;Learning Heuristics;Bi-simulation", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/3b741c9b3061a690fea6b72d2b62e0467e1d41de.zip", "author": "Alexander Julian Mattick;Christopher Mutschler", "authorids": "~Alexander_Julian_Mattick1;~Christopher_Mutschler1", "gender": "M;M", "homepage": ";https://www.cmutschler.de", "dblp": "293/7466;118/7748", "google_scholar": ";https://scholar.google.de/citations?user=gKDSp8YAAAAJ", "orcid": "0000-0001-7805-199X;0000-0001-8108-0230", "linkedin": ";christopher-mutschler-28431576/", "or_profile": "~Alexander_Julian_Mattick1;~Christopher_Mutschler1", "aff": "Friedrich-Alexander-Universit\u00e4t, Pattern Recognition Lab;Fraunhofer IIS", "aff_domain": "cs5.fau.de;fraunhofer.de", "position": "Researcher;Principal Researcher", "bibtex": "@misc{\nmattick2024reinforcement,\ntitle={Reinforcement Learning for Node Selection in Branch-and-Bound},\nauthor={Alexander Julian Mattick and Christopher Mutschler},\nyear={2024},\nurl={https://openreview.net/forum?id=0ez68a5UqI}\n}", "github": "", "project": "", "reviewers": "Lp54;KqYv;rRw3;hSJj", "site": "https://openreview.net/forum?id=0ez68a5UqI", "pdf_size": 426340, "rating": "3;3;5;5", "confidence": "4;3;3;3", "soundness": "2;2;3;2", "contribution": "3;1;2;2", "presentation": "2;2;2;3", "wc_summary": "90;46;77;96", "wc_strengths": "121;37;87;58", "wc_weaknesses": "281;284;372;182", "wc_questions": "18;5;74;21", "wc_review": "510;372;610;357", "wc_reply_reviewers": "0;149;79;0", "wc_reply_authors": "1482;912;898;546", "reply_reviewers": "0;1;1;0", "reply_authors": "3;2;2;1", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 77.25, 19.30511590226798 ], "wc_strengths_avg": [ 75.75, 31.586191603293994 ], "wc_weaknesses_avg": [ 279.75, 67.23977617452337 ], "wc_questions_avg": [ 29.5, 26.386549603917523 ], "wc_review_avg": [ 462.25, 104.08259941027607 ], "wc_reply_reviewers_avg": [ 57.0, 62.14096877262214 ], "wc_reply_authors_avg": [ 959.5, 335.42025877993717 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 2.0, 0.7071067811865476 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 1, "gs_cited_by_link": 
"https://scholar.google.com/scholar?cites=6942358784740442277&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 4, "aff_unique_index": "0;1", "aff_unique_norm": "Friedrich-Alexander-Universit\u00e4t;Fraunhofer Institute for Integrated Circuits", "aff_unique_dep": "Pattern Recognition Lab;", "aff_unique_url": "https://www.uni-erlangen.de/;https://www.iis.fraunhofer.de/", "aff_unique_abbr": "FAU;Fraunhofer IIS", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "Germany" }, { "id": "0fSNU64FV7", "title": "Sorting Out Quantum Monte Carlo", "track": "main", "status": "Reject", "tldr": "", "abstract": "Molecular modeling at the quantum level requires choosing a parameterization of the wavefunction that both respects the required symmetries, and is scalable to systems of many particles. For the simulation of fermions, valid parameterizations must be antisymmetric with the transposition of particles. Typically, antisymmetry is enforced by leveraging the anti-symmetry of determinants with respect to exchange of matrix rows, but this involves computing a full determinant each time the wavefunction is evaluated. Instead, we introduce a new antisymmetrization layer derived from sorting, the $\\text{\\emph{sortlet}}$, which scales as $O(N \\log N )$ in the number of particles, in contrast to the $O(N^3)$ of the determinant. We show experimentally that applying this anti-symmeterization layer on top of an attention based neural-network backbone yields a flexible wavefunction parameterization capable of reaching chemical accuracy when approximating the ground state of first-row atoms and molecules.", "keywords": "quantum chemistry;scientific machine learning;quantum monte carlo;quantum statisical mechanics;inductive bias", "primary_area": "applications to physical sciences (physics, chemistry, biology, etc.)", "supplementary_material": "/attachment/424577c531fc7cfa7fce1d26b33b8ea472ecca91.pdf", "author": "Jack Richter-Powell;Luca Thiede;Alan Aspuru-Guzik;David Duvenaud", "authorids": "~Jack_Richter-Powell1;~Luca_Thiede1;~Alan_Aspuru-Guzik2;~David_Duvenaud2", "gender": "Non-Binary;M;M;M", "homepage": "https://www.jrichterpowell.ca;;http://matter.toronto.edu;https://www.cs.toronto.edu/~duvenaud/", "dblp": ";241/6690;;86/9380", "google_scholar": ";https://scholar.google.com/citations?view_op=list_works;Ag_6KEgAAAAJ;https://scholar.google.ca/citations?user=ZLpO3XQAAAAJ", "orcid": ";;0000-0002-8277-4434;", "linkedin": ";;;", "or_profile": "~Jack_Richter-Powell1;~Luca_Thiede1;~Alan_Aspuru-Guzik2;~David_Duvenaud2", "aff": "Massachusetts Institute of Technology;Vector Institute;University of Toronto;Anthropic", "aff_domain": "mit.edu;vectorinstitute.ai;utoronto.ca;anthropic.com", "position": "PhD student;PhD student;Full Professor;Researcher", "bibtex": "@misc{\nrichter-powell2024sorting,\ntitle={Sorting Out Quantum Monte Carlo},\nauthor={Jack Richter-Powell and Luca Thiede and Alan Aspuru-Guzik and David Duvenaud},\nyear={2024},\nurl={https://openreview.net/forum?id=0fSNU64FV7}\n}", "github": "", "project": "", "reviewers": "G9wz;o8Z6;1VSk;TwGB", "site": "https://openreview.net/forum?id=0fSNU64FV7", "pdf_size": 1158565, "rating": "3;3;5;6", "confidence": "4;5;3;4", "soundness": "3;2;2;3", "contribution": "1;2;3;3", "presentation": "4;2;2;3", "wc_summary": "163;52;141;27", "wc_strengths": "35;11;176;32", "wc_weaknesses": "193;186;622;55", "wc_questions": "303;7;100;159", "wc_review": "694;256;1039;273", "wc_reply_reviewers": "166;352;58;0", 
"wc_reply_authors": "257;539;394;0", "reply_reviewers": "1;3;1;0", "reply_authors": "1;4;1;0", "rating_avg": [ 4.25, 1.299038105676658 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.25, 0.82915619758885 ], "presentation_avg": [ 2.75, 0.82915619758885 ], "wc_summary_avg": [ 95.75, 57.469013389825996 ], "wc_strengths_avg": [ 63.5, 65.60678318588711 ], "wc_weaknesses_avg": [ 264.0, 213.8749634716509 ], "wc_questions_avg": [ 142.25, 107.46947240961035 ], "wc_review_avg": [ 565.5, 324.8311099633162 ], "wc_reply_reviewers_avg": [ 144.0, 134.05222862750176 ], "wc_reply_authors_avg": [ 297.5, 198.60828280814474 ], "reply_reviewers_avg": [ 1.25, 1.0897247358851685 ], "reply_authors_avg": [ 1.5, 1.5 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.5443310539518174, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=3538753825599944540&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "aff_unique_index": "0;1;2;3", "aff_unique_norm": "Massachusetts Institute of Technology;Vector Institute;University of Toronto;Anthropic", "aff_unique_dep": ";;;", "aff_unique_url": "https://web.mit.edu;https://vectorinstitute.ai/;https://www.utoronto.ca;https://www.anthropic.com", "aff_unique_abbr": "MIT;Vector Institute;U of T;Anthropic", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;1;0", "aff_country_unique": "United States;Canada" }, { "id": "0fpLLsAynh", "title": "Sporadicity in Decentralized Federated Learning: Theory and Algorithm", "track": "main", "status": "Reject", "tldr": "", "abstract": "Decentralized Federated Learning methods are a family of techniques employed by devices in a distributed setup to (i) reach consensus over a common model which (ii) is optimal with respect to the global objective function. As this is carried out without the presence of any centralized server, prominent challenges of conventional Federated Learning become even more significant, namely heterogeneous data distributions among devices and their varying resource capabilities. In this work, we propose $\\textit{Decentralized Sporadic Federated Learning}$ ($\\texttt{DSpodFL}$), which introduces sporadicity to decentralized federated learning. $\\texttt{DSpodFL}$ includes sporadic stochastic gradient calculations and model exchanges for aggregations. Our motivation is to achieve joint computation and communication savings without losing statistical performance. We prove that by using a constant step size, our method achieves a geometric convergence rate to a finite optimality gap. 
Through numerical evaluation, we demonstrate the resource savings achieved by $\\texttt{DSpodFL}$ compared to the existing baselines.", "keywords": "Decentralized Federated Learning;Distributed Optimization;Sporadicity;Resource Efficiency;Sporadic SGDs;Anarchic Federated Learning", "primary_area": "optimization", "supplementary_material": "/attachment/63b24031205cd54823f86ccbf5d1a7ebceb5631a.pdf", "author": "Shahryar Zehtabi;Rohit Parasnis;Seyyedali Hosseinalipour;Christopher Brinton", "authorids": "~Shahryar_Zehtabi1;~Rohit_Parasnis1;~Seyyedali_Hosseinalipour1;~Christopher_Brinton1", "gender": ";M;;", "homepage": ";;;https://www.cbrinton.net/", "dblp": ";;;", "google_scholar": "kmeHQn4AAAAJ;DcAdzxQAAAAJ;;vWmHA5MAAAAJ", "orcid": ";;;", "linkedin": ";;;", "or_profile": "~Shahryar_Zehtabi1;~Rohit_Parasnis1;~Seyyedali_Hosseinalipour1;~Christopher_Brinton1", "aff": "Purdue University;Massachusetts Institute of Technology;;Purdue University", "aff_domain": "purdue.edu;mit.edu;;purdue.edu", "position": "PhD student;Postdoc;;Assistant Professor", "bibtex": "@misc{\nzehtabi2024sporadicity,\ntitle={Sporadicity in Decentralized Federated Learning: Theory and Algorithm},\nauthor={Shahryar Zehtabi and Rohit Parasnis and Seyyedali Hosseinalipour and Christopher Brinton},\nyear={2024},\nurl={https://openreview.net/forum?id=0fpLLsAynh}\n}", "github": "", "project": "", "reviewers": "Mn6u;Sqyj;RbX5", "site": "https://openreview.net/forum?id=0fpLLsAynh", "pdf_size": 401422, "rating": "3;3;5", "confidence": "4;4;4", "soundness": "2;3;3", "contribution": "1;1;2", "presentation": "2;2;3", "wc_summary": "41;79;111", "wc_strengths": "11;51;50", "wc_weaknesses": "239;132;211", "wc_questions": "72;181;3", "wc_review": "363;443;375", "wc_reply_reviewers": "12;253;24", "wc_reply_authors": "671;1730;612", "reply_reviewers": "1;1;1", "reply_authors": "2;3;1", "rating_avg": [ 3.6666666666666665, 0.9428090415820634 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 1.3333333333333333, 0.4714045207910317 ], "presentation_avg": [ 2.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 77.0, 28.61235164516658 ], "wc_strengths_avg": [ 37.333333333333336, 18.624953392931992 ], "wc_weaknesses_avg": [ 194.0, 45.306364527146364 ], "wc_questions_avg": [ 85.33333333333333, 73.27725128275183 ], "wc_review_avg": [ 393.6666666666667, 35.22625283632775 ], "wc_reply_reviewers_avg": [ 96.33333333333333, 110.8883322185983 ], "wc_reply_authors_avg": [ 1004.3333333333334, 513.688837938126 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 2.0, 0.816496580927726 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:OahLiBq3M_IJ:scholar.google.com/&scioq=Sporadicity+in+Decentralized+Federated+Learning:+Theory+and+Algorithm&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;1;0", "aff_unique_norm": "Purdue University;Massachusetts Institute of Technology", "aff_unique_dep": ";", "aff_unique_url": "https://www.purdue.edu;https://web.mit.edu", "aff_unique_abbr": "Purdue;MIT", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "0gDQgwjoX0", "title": "Stochastic Gradient Discrete Langevin Dynamics", "track": "main", "status": "Reject", "tldr": "", "abstract": "Sampling via Markov chain Monte Carlo can be inefficient when each evaluation of the 
gradient of energy function depends on a large dataset. In continuous spaces, this challenge has been addressed by extending Langevin samplers with stochastic gradient estimators. However, such an approach cannot be directly applied to discrete spaces, as a naive migration leads to biased estimation with large variance. To fill this gap, we propose a new sampling strategy, \\emph{Stochastic Gradient Discrete Langevin Dynamics}, to provide the first practical method for stochastic distribution sampling in discrete spaces. Our approach mitigates the bias of naive ``gradient'' estimators via a novel caching scheme, and reduces the estimation variance by introducing a modified Polyak step size control for simulation time adaptation. We demonstrate significant efficiency improvements across various sampling problems in discrete spaces, including Bayesian learning, stochastic integer programming, and prompt tuning for text-image models.", "keywords": "Stochastic Gradient;Langevin Dynamics;Discrete Langevin Dynamics;MCMC;Discrete Sampling", "primary_area": "probabilistic methods (Bayesian methods, variational inference, sampling, UQ, etc.)", "supplementary_material": "", "author": "Haoran Sun;Bethany Yixin Wang;Katayoon Goshvadi;Yuan Xue;Dale Schuurmans;Hanjun Dai", "authorids": "~Haoran_Sun2;~Bethany_Yixin_Wang1;~Katayoon_Goshvadi1;~Yuan_Xue5;~Dale_Schuurmans1;~Hanjun_Dai1", "gender": "M;F;F;F;;M", "homepage": ";;;;;https://hanjun-dai.github.io", "dblp": ";334/1546;;;;144/7311", "google_scholar": "p7of_yoAAAAJ;;;jcatRRIAAAAJ;;obpl7GQAAAAJ", "orcid": ";;;;;", "linkedin": ";yixin-wang/;katayoon-goshvadi/;yuan-emily-xue-3483012;;hanjun-dai", "or_profile": "~Haoran_Sun2;~Bethany_Yixin_Wang1;~Katayoon_Goshvadi1;~Yuan_Xue5;~Dale_Schuurmans1;~Hanjun_Dai1", "aff": ";Google;;Google;;Google Research", "aff_domain": ";google.com;;google.com;;google.com", "position": ";Researcher;;Researcher;;Researcher", "bibtex": "@misc{\nsun2024stochastic,\ntitle={Stochastic Gradient Discrete Langevin Dynamics},\nauthor={Haoran Sun and Bethany Yixin Wang and Katayoon Goshvadi and Yuan Xue and Dale Schuurmans and Hanjun Dai},\nyear={2024},\nurl={https://openreview.net/forum?id=0gDQgwjoX0}\n}", "github": "", "project": "", "reviewers": "m4Ve;Ap8o;i63H", "site": "https://openreview.net/forum?id=0gDQgwjoX0", "pdf_size": 6662571, "rating": "3;5;6", "confidence": "2;4;2", "soundness": "2;2;3", "contribution": "2;2;2", "presentation": "1;3;3", "wc_summary": "151;54;34", "wc_strengths": "39;30;55", "wc_weaknesses": "98;35;40", "wc_questions": "154;305;2", "wc_review": "442;424;131", "wc_reply_reviewers": "0;0;19", "wc_reply_authors": "716;356;333", "reply_reviewers": "0;0;1", "reply_authors": "1;1;1", "rating_avg": [ 4.666666666666667, 1.247219128924647 ], "confidence_avg": [ 2.6666666666666665, 0.9428090415820634 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.3333333333333335, 0.9428090415820634 ], "wc_summary_avg": [ 79.66666666666667, 51.09685791600975 ], "wc_strengths_avg": [ 41.333333333333336, 10.338708279513881 ], "wc_weaknesses_avg": [ 57.666666666666664, 28.592928418676454 ], "wc_questions_avg": [ 153.66666666666666, 123.69945656936233 ], "wc_review_avg": [ 332.3333333333333, 142.55369358790938 ], "wc_reply_reviewers_avg": [ 6.333333333333333, 8.956685895029603 ], "wc_reply_authors_avg": [ 468.3333333333333, 175.37832122459022 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 
9, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.1889822365046137, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:3md5aSvelN8J:scholar.google.com/&scioq=Stochastic+Gradient+Discrete+Langevin+Dynamics&hl=en&as_sdt=0,31", "gs_version_total": 0, "aff_unique_index": "0;0;0", "aff_unique_norm": "Google", "aff_unique_dep": "Google", "aff_unique_url": "https://www.google.com", "aff_unique_abbr": "Google", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Mountain View", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "title": "TopoMLP: A Simple yet Strong Pipeline for Driving Topology Reasoning", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19610", "id": "0gTW5JUFTW", "author_site": "Dongming Wu, Jiahao Chang, Fan Jia, Yingfei Liu, Tiancai Wang, Jianbing Shen", "tldr": "", "abstract": "Topology reasoning aims to comprehensively understand road scenes and present drivable routes in autonomous driving. It requires detecting road centerlines (lane) and traffic elements, further reasoning their topology relationship, \\textit{i.e.}, lane-lane topology, and lane-traffic topology. In this work, we first present that the topology score relies heavily on detection performance on lane and traffic elements. Therefore, we introduce a powerful 3D lane detector and an improved 2D traffic element detector to extend the upper limit of topology performance. Further, we propose TopoMLP, a simple yet high-performance pipeline for driving topology reasoning. Based on the impressive detection performance, we develop two simple MLP-based heads for topology generation. TopoMLP achieves state-of-the-art performance on OpenLane-V2 dataset, \\textit{i.e.}, 41.2\\% OLS with ResNet-50 backbone. It is also the 1st solution for 1st OpenLane Topology in Autonomous Driving Challenge. We hope such simple and strong pipeline can provide some new insights to the community. 
Code is at https://github.com/wudongming97/TopoMLP.", "keywords": "Autonomous Driving;Driving Topology Understanding", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Dongming Wu;Jiahao Chang;Fan Jia;Yingfei Liu;Tiancai Wang;Jianbing Shen", "authorids": "~Dongming_Wu1;~Jiahao_Chang3;~Fan_Jia7;~Yingfei_Liu1;~Tiancai_Wang1;~Jianbing_Shen1", "gender": "M;M;M;M;M;M", "homepage": "https://wudongming97.github.io/;;;;https://www.wangeniusky.com/;https://scholar.google.com/citations?user=_Q3NTToAAAAJ&hl=en", "dblp": ";;;13/5577;179/0530;38/5435", "google_scholar": "ejFCAq0AAAAJ;HA5zLp4AAAAJ;https://scholar.google.com/citations?hl=en;https://scholar.google.com.hk/citations?hl=zh-CN;https://scholar.google.com.hk/citations?user=YI0sRroAAAAJ;_Q3NTToAAAAJ", "orcid": "0000-0003-4938-5813;0009-0009-6877-1649;0000-0002-0252-7207;0000-0002-2412-5225;;0000-0003-2656-3082", "linkedin": ";;;;;", "or_profile": "~Dongming_Wu1;~Jiahao_Chang3;~Fan_Jia7;~Yingfei_Liu1;~Tiancai_Wang1;~Jianbing_Shen1", "aff": "Beijing Institute of Technology;The Chinese University of Hong Kong, Shenzhen;Megvii Technology Inc.;Megvii Technology Inc.;Megvii Technology Inc.;University of Macau", "aff_domain": "bit.edu.cn;cuhk.edu.cn;megvii.com;megvii.com;megvii.com;um.edu.mo", "position": "PhD student;Intern;Researcher;Researcher;Researcher;Full Professor", "bibtex": "@inproceedings{\nwu2024topomlp,\ntitle={Topo{MLP}: A Simple yet Strong Pipeline for Driving Topology Reasoning},\nauthor={Dongming Wu and Jiahao Chang and Fan Jia and Yingfei Liu and Tiancai Wang and Jianbing Shen},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=0gTW5JUFTW}\n}", "github": "", "project": "", "reviewers": "bKsZ;tnze;MJLZ;Cep6", "pdf_size": 2432095, "rating": "6;6;6;8", "confidence": "5;4;3;4", "soundness": "3;3;3;3", "contribution": "2;3;3;3", "presentation": "3;3;3;3", "wc_summary": "132;54;230;87", "wc_strengths": "162;97;27;56", "wc_weaknesses": "75;126;66;73", "wc_questions": "178;235;35;48", "wc_review": "547;512;358;264", "wc_reply_reviewers": "23;28;24;15", "wc_reply_authors": "403;685;316;317", "reply_reviewers": "1;1;1;1", "reply_authors": "1;1;1;1", "rating_avg": [ 6.5, 0.8660254037844386 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 125.75, 66.25094338950956 ], "wc_strengths_avg": [ 85.5, 50.6877697280123 ], "wc_weaknesses_avg": [ 85.0, 23.90606617576384 ], "wc_questions_avg": [ 124.0, 85.04998530276181 ], "wc_review_avg": [ 420.25, 114.86160150372272 ], "wc_reply_reviewers_avg": [ 22.5, 4.716990566028302 ], "wc_reply_authors_avg": [ 430.25, 151.2603302257403 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 30, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=15140104278097721464&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=0gTW5JUFTW", "pdf": "https://openreview.net/pdf?id=0gTW5JUFTW", "email": "bit.edu.cn;cuhk.edu.cn;megvii.com;megvii.com;megvii.com;um.edu.mo", "author_num": 6, "aff_unique_index": "0;1;2;2;2;3", "aff_unique_norm": "Beijing Institute of Technology;Chinese University of Hong Kong;Megvii Technology;University of Macau", 
"aff_unique_dep": ";;;", "aff_unique_url": "http://www.bit.edu.cn/;https://www.cuhk.edu.cn;https://www.megvii.com;https://www.um.edu.mo", "aff_unique_abbr": "BIT;CUHK;Megvii;UM", "aff_campus_unique_index": "1;2", "aff_campus_unique": ";Shenzhen;Macau SAR", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "China" }, { "title": "Variance Reduced Halpern Iteration for Finite-Sum Monotone Inclusions", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19609", "id": "0i6Z9N5MLY", "author_site": "Xufeng Cai, Ahmet Alacaoglu, Jelena Diakonikolas", "tldr": "", "abstract": "Machine learning approaches relying on such criteria as adversarial robustness or multi-agent settings have raised the need for solving game-theoretic equilibrium problems. Of particular relevance to these applications are methods targeting finite-sum structure, which generically arises in empirical variants of learning problems in these contexts. Further, methods with computable approximation errors are highly desirable, as they provide verifiable exit criteria. Motivated by these applications, we study finite-sum monotone inclusion problems, which model broad classes of equilibrium problems. Our main contributions are variants of the classical Halpern iteration that employ variance reduction to obtain improved complexity guarantees in which $n$ component operators in the finite sum are ``on average'' either cocoercive or Lipschitz continuous and monotone, with parameter $L$. The resulting oracle complexity of our methods, which provide guarantees for the last iterate and for a (computable) operator norm residual, is $\\widetilde{\\mathcal{O}}( n + \\sqrt{n}L\\varepsilon^{-1})$, which improves upon existing methods by a factor up to $\\sqrt{n}$. This constitutes the first variance reduction-type result for general finite-sum monotone inclusions and for more specific problems such as convex-concave optimization when operator norm residual is the optimality measure. 
We further argue that, up to poly-logarithmic factors, this complexity is unimprovable in the monotone Lipschitz setting; i.e., the provided result is near-optimal.", "keywords": "finite-sum problems;monotone inclusion;operator norm residual;stochastic Halpern iteration;last iterate convergence;variance reduction;min-max optimization", "primary_area": "optimization", "supplementary_material": "/attachment/279e1f4321206702dce0ad254d5fbaebb5cc217f.zip", "author": "Xufeng Cai;Ahmet Alacaoglu;Jelena Diakonikolas", "authorids": "~Xufeng_Cai1;~Ahmet_Alacaoglu2;~Jelena_Diakonikolas2", "gender": ";;F", "homepage": ";https://ahmetalacaoglu.github.io;http://www.jelena-diakonikolas.com/", "dblp": ";209/4889;147/5178", "google_scholar": ";-yRi8D4AAAAJ;J8ixfu8AAAAJ", "orcid": ";;0000-0003-3439-0310", "linkedin": ";;", "or_profile": "~Xufeng_Cai1;~Ahmet_Alacaoglu2;~Jelena_Diakonikolas2", "aff": ";University of Wisconsin-Madison;University of Wisconsin, Madison", "aff_domain": ";wisc.edu;wisc.edu", "position": ";Postdoc;Assistant Professor", "bibtex": "@inproceedings{\ncai2024variance,\ntitle={Variance Reduced Halpern Iteration for Finite-Sum Monotone Inclusions},\nauthor={Xufeng Cai and Ahmet Alacaoglu and Jelena Diakonikolas},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=0i6Z9N5MLY}\n}", "github": "", "project": "", "reviewers": "9YKM;wjm9;P51Q", "pdf_size": 689876, "rating": "6;6;6", "confidence": "3;3;3", "soundness": "3;3;3", "contribution": "3;3;2", "presentation": "3;2;3", "wc_summary": "69;48;69", "wc_strengths": "56;28;59", "wc_weaknesses": "412;635;149", "wc_questions": "2;308;42", "wc_review": "539;1019;319", "wc_reply_reviewers": "21;495;0", "wc_reply_authors": "2298;2809;1528", "reply_reviewers": "1;1;0", "reply_authors": "5;6;3", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 3.0, 0.0 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 62.0, 9.899494936611665 ], "wc_strengths_avg": [ 47.666666666666664, 13.960261060914616 ], "wc_weaknesses_avg": [ 398.6666666666667, 198.63254740572825 ], "wc_questions_avg": [ 117.33333333333333, 135.80705267236883 ], "wc_review_avg": [ 625.6666666666666, 292.27080289043965 ], "wc_reply_reviewers_avg": [ 172.0, 228.55633878761708 ], "wc_reply_authors_avg": [ 2211.6666666666665, 526.5170673608048 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 4.666666666666667, 1.247219128924647 ], "replies_avg": [ 25, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 12, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6364381838039303577&as_sdt=5,47&sciodt=0,47&hl=en", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=0i6Z9N5MLY", "pdf": "https://openreview.net/pdf?id=0i6Z9N5MLY", "email": ";wisc.edu;wisc.edu", "author_num": 3, "aff_unique_index": "0;1", "aff_unique_norm": "University of Wisconsin-Madison;University of Wisconsin", "aff_unique_dep": ";", "aff_unique_url": "https://www.wisc.edu;https://www.wisc.edu", "aff_unique_abbr": "UW-Madison;UW", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Madison", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "title": "UNR-Explainer: Counterfactual Explanations for Unsupervised Node Representation Learning Models", "status": "Poster", "track": "main", "site": 
"https://iclr.cc/virtual/2024/poster/19608", "id": "0j9ZDzMPqr", "author_site": "Hyunju Kang, Geonhee Han, Hogun Park", "tldr": "", "abstract": "Node representation learning, such as Graph Neural Networks (GNNs), has become one of the important learning methods in machine learning, and the demand for reliable explanation generation is growing. Despite extensive research on explanation generation for supervised node representation learning, explaining unsupervised models has been less explored. To address this gap, we propose a method for generating counterfactual (CF) explanations in unsupervised node representation learning, aiming to identify the most important subgraphs that cause a significant change in the $k$-nearest neighbors of a node of interest in the learned embedding space upon perturbation. The $k$-nearest neighbor-based CF explanation method provides simple, yet pivotal, information for understanding unsupervised downstream tasks, such as top-$k$ link prediction and clustering. Furthermore, we introduce a Monte Carlo Tree Search (MCTS)-based explainability method for generating expressive CF explanations for **U**nsupervised **N**ode **R**epresentation learning methods, which we call **UNR-Explainer**. The proposed method demonstrates improved performance on six datasets for both unsupervised GraphSAGE and DGI.", "keywords": "XAI;Unsupervised node representation learning;Counterfactual Explanations", "primary_area": "visualization or interpretation of learned representations", "supplementary_material": "", "author": "Hyunju Kang;Geonhee Han;Hogun Park", "authorids": "~Hyunju_Kang1;~Geonhee_Han1;~Hogun_Park2", "gender": ";M;", "homepage": ";https://learndatalab.github.io/;https://hogunpark.com", "dblp": "382/4096;382/3962;05/3540", "google_scholar": "yI623McAAAAJ;1IbJqfkAAAAJ;0YEYuGIAAAAJ", "orcid": ";0009-0000-8967-5255;0000-0003-0576-5806", "linkedin": ";;hogunpark/en", "or_profile": "~Hyunju_Kang1;~Geonhee_Han1;~Hogun_Park2", "aff": "Sungkyunkwan University;Sung Kyun Kwan University;Sungkyunkwan University", "aff_domain": "skku.edu;skku.edu;skku.edu", "position": "PhD student;MS student;Assistant Professor", "bibtex": "@inproceedings{\nkang2024unrexplainer,\ntitle={{UNR}-Explainer: Counterfactual Explanations for Unsupervised Node Representation Learning Models},\nauthor={Hyunju Kang and Geonhee Han and Hogun Park},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=0j9ZDzMPqr}\n}", "github": "", "project": "", "reviewers": "TnSw;8JCL;eAe7;WfpS", "pdf_size": 1935301, "rating": "6;6;6;8", "confidence": "3;3;4;3", "soundness": "2;3;3;3", "contribution": "2;3;2;3", "presentation": "2;2;3;3", "wc_summary": "80;87;70;392", "wc_strengths": "52;109;51;169", "wc_weaknesses": "77;109;174;120", "wc_questions": "27;105;70;94", "wc_review": "236;410;365;775", "wc_reply_reviewers": "0;13;11;0", "wc_reply_authors": "474;995;1523;284", "reply_reviewers": "0;1;1;0", "reply_authors": "1;2;3;1", "rating_avg": [ 6.5, 0.8660254037844386 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 157.25, 135.66756244585514 ], "wc_strengths_avg": [ 95.25, 48.6229112661922 ], "wc_weaknesses_avg": [ 120.0, 34.94996423460259 ], "wc_questions_avg": [ 74.0, 29.941609843159736 ], "wc_review_avg": [ 446.5, 200.12308712389984 ], "wc_reply_reviewers_avg": [ 6.0, 6.041522986797286 ], 
"wc_reply_authors_avg": [ 819.0, 482.6598180913758 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.75, 0.82915619758885 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.3333333333333333, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14211516623000206023&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 2, "openreview": "https://openreview.net/forum?id=0j9ZDzMPqr", "pdf": "https://openreview.net/pdf?id=0j9ZDzMPqr", "email": "skku.edu;skku.edu;skku.edu", "author_num": 3, "aff_unique_index": "0;0;0", "aff_unique_norm": "Sungkyunkwan University", "aff_unique_dep": "", "aff_unique_url": "https://www.skku.edu", "aff_unique_abbr": "SKKU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "South Korea" }, { "title": "Magic123: One Image to High-Quality 3D Object Generation Using Both 2D and 3D Diffusion Priors", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19607", "id": "0jHkUDyEO9", "author_site": "Guocheng Qian, Jinjie Mai, Abdullah Hamdi, Jian Ren, Aliaksandr Siarohin, Bing Li, Hsin-Ying Lee, Ivan Skorokhodov, Peter Wonka, Sergey Tulyakov, Bernard Ghanem", "tldr": "", "abstract": "We present ``Magic123'', a two-stage coarse-to-fine approach for high-quality, textured 3D mesh generation from a single image in the wild using *both 2D and 3D priors*. In the first stage, we optimize a neural radiance field to produce a coarse geometry. In the second stage, we adopt a memory-efficient differentiable mesh representation to yield a high-resolution mesh with a visually appealing texture. In both stages, the 3D content is learned through reference-view supervision and novel-view guidance by a joint 2D and 3D diffusion prior. We introduce a trade-off parameter between the 2D and 3D priors to control the details and 3D consistencies of the generation. 
Magic123 demonstrates a significant improvement over previous image-to-3D techniques, as validated through extensive experiments on diverse synthetic and real-world images.", "keywords": "Neural Radiance Fields;Shape from Image;Generative 3D models", "primary_area": "generative models", "supplementary_material": "/attachment/4ad77057b440a0face0239bab4dbc19a1d7954d8.zip", "author": "Guocheng Qian;Jinjie Mai;Abdullah Hamdi;Jian Ren;Aliaksandr Siarohin;Bing Li;Hsin-Ying Lee;Ivan Skorokhodov;Peter Wonka;Sergey Tulyakov;Bernard Ghanem", "authorids": "~Guocheng_Qian1;~Jinjie_Mai1;~Abdullah_Hamdi1;~Jian_Ren2;~Aliaksandr_Siarohin1;~Bing_Li7;~Hsin-Ying_Lee2;~Ivan_Skorokhodov1;~Peter_Wonka1;~Sergey_Tulyakov1;~Bernard_Ghanem1", "gender": "M;M;M;M;F;M;M;M;M;M;M", "homepage": "https://guochengqian.github.io/;;https://alanspike.github.io/;;https://cemse.kaust.edu.sa/vcc/people/person/bing-li;http://hsinyinglee.com/;https://universome.github.io/;http://peterwonka.net;http://www.stulyakov.com/;https://ivul.kaust.edu.sa;https://abdullahamdi.com/", "dblp": "241/7000;272/0975;59/2180-5;199/1971;13/2692-24;149/7976-1.html;223/0010;98/5522;40/6115;37/2516;205/2625", "google_scholar": "DUDaxg4AAAAJ;;https://scholar.google.co.jp/citations?user=vDALiU4AAAAJ;https://scholar.google.it/citations?user=uMl5-k4AAAAJ;;;https://scholar.google.com/citations?hl=en;https://scholar.google.com.tw/citations?user=0EKXSXgAAAAJ;mgzXR0sAAAAJ;rVsGTeEAAAAJ;tQkWPKAAAAAJ", "orcid": "0000-0002-2935-8570;0000-0002-3396-1970;;;;;0000-0002-7611-9310;0000-0003-0627-9746;;0000-0002-5534-587X;0000-0003-3989-7540", "linkedin": "guochengqian/;;;;;;ivan-skorokhodov;;sergeytulyakov/;bernardghanem/;ajhamdi/", "or_profile": "~Guocheng_Qian1;~Jinjie_Mai1;~Jian_Ren2;~Aliaksandr_Siarohin1;~Bing_Li7;~Hsin-Ying_Lee2;~Ivan_Skorokhodov1;~Peter_Wonka1;~Sergey_Tulyakov1;~Bernard_Ghanem1;~Abdullah_Jamal_Hamdi1", "aff": "Snap Inc.;King Abdullah University of Science and Technology;Snap Inc.;Snap Inc.;KAUST;Snap Inc.;Snap Inc.;KAUST;Snap Inc.;King Abdullah University of Science and Technology;University of Oxford", "aff_domain": "snapchat.com;kaust.edu.sa;snapchat.com;snapchat.com;kaust.edu.sa;snap.com;snap.com;kaust.edu.sa;snapchat.com;kaust.edu.sa;eng.ox.ac.uk", "position": "Researcher;MS student;Research Scientist;Intern;Postdoc;Researcher;Researcher;Full Professor;Director of Research;Full Professor;Postdoc", "bibtex": "@inproceedings{\nqian2024magic,\ntitle={Magic123: One Image to High-Quality 3D Object Generation Using Both 2D and 3D Diffusion Priors},\nauthor={Guocheng Qian and Jinjie Mai and Abdullah Hamdi and Jian Ren and Aliaksandr Siarohin and Bing Li and Hsin-Ying Lee and Ivan Skorokhodov and Peter Wonka and Sergey Tulyakov and Bernard Ghanem},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=0jHkUDyEO9}\n}", "github": "", "project": "", "reviewers": "jWBN;UQdQ;25qf;Ea4Z", "pdf_size": 26253959, "rating": "5;5;8;8", "confidence": "4;5;5;4", "soundness": "2;3;3;4", "contribution": "2;2;3;4", "presentation": "2;3;3;4", "wc_summary": "66;54;84;85", "wc_strengths": "48;40;259;116", "wc_weaknesses": "224;140;321;225", "wc_questions": "120;19;25;35", "wc_review": "458;253;689;461", "wc_reply_reviewers": "0;133;82;10", "wc_reply_authors": "951;626;945;387", "reply_reviewers": "0;2;1;1", "reply_authors": "2;2;2;1", "rating_avg": [ 6.5, 1.5 ], "confidence_avg": [ 4.5, 0.5 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 2.75, 0.82915619758885 ], 
"presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 72.25, 12.968712349342937 ], "wc_strengths_avg": [ 115.75, 87.81906114278381 ], "wc_weaknesses_avg": [ 227.5, 64.06442070291435 ], "wc_questions_avg": [ 49.75, 40.959583738119214 ], "wc_review_avg": [ 465.25, 154.26012932705586 ], "wc_reply_reviewers_avg": [ 56.25, 54.444352324185104 ], "wc_reply_authors_avg": [ 727.25, 236.37932968007163 ], "reply_reviewers_avg": [ 1.0, 0.7071067811865476 ], "reply_authors_avg": [ 1.75, 0.4330127018922193 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 11, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 356, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=9455191109482969642&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=0jHkUDyEO9", "pdf": "https://openreview.net/pdf?id=0jHkUDyEO9", "email": "snapchat.com;kaust.edu.sa;snapchat.com;snapchat.com;kaust.edu.sa;snap.com;snap.com;kaust.edu.sa;snapchat.com;kaust.edu.sa;eng.ox.ac.uk", "author_num": 11, "aff_unique_index": "0;1;0;0;1;0;0;1;0;1;2", "aff_unique_norm": "Snap Inc.;King Abdullah University of Science and Technology;University of Oxford", "aff_unique_dep": ";;", "aff_unique_url": "https://www.snapinc.com;https://www.kast.kau.edu.sa;https://www.ox.ac.uk", "aff_unique_abbr": "Snap;KAUST;Oxford", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;0;0;1;0;0;1;0;1;2", "aff_country_unique": "United States;Saudi Arabia;United Kingdom" }, { "title": "Sparse Spiking Neural Network: Exploiting Heterogeneity in Timescales for Pruning Recurrent SNN", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19606", "id": "0jsfesDZDq", "author_site": "Biswadeep Chakraborty, Beomseok Kang, Harshit Kumar, Saibal Mukhopadhyay", "tldr": "", "abstract": "Recurrent Spiking Neural Networks (RSNNs) have emerged as a computationally efficient and brain-inspired machine learning model. The design of sparse RSNNs with fewer neurons and synapses helps reduce the computational complexity of RSNNs. Traditionally, sparse SNNs are obtained by first training a dense and complex SNN for a target task and, next, eliminating neurons with low activity (activity-based pruning) while maintaining task performance. In contrast, this paper presents a task-agnostic methodology for designing sparse RSNNs by pruning an untrained (arbitrarily initialized) large model. \nWe introduce a novel Lyapunov Noise Pruning (LNP) algorithm that uses graph sparsification methods and utilizes Lyapunov exponents to design a stable sparse RSNN from an untrained RSNN. We show that the LNP can leverage diversity in neuronal timescales to design a sparse Heterogeneous RSNN (HRSNN). Further, we show that the same sparse HRSNN model can be trained for different tasks, such as image classification and time-series prediction. 
The experimental results show that, in spite of being task-agnostic, LNP increases computational efficiency (fewer neurons and synapses) and prediction performance of RSNNs compared to traditional activity-based pruning of trained dense models.", "keywords": "spiking neural network;SNN;network pruning;stability;neuromorphic;leaky integrate and fire;STDP;sparsification;task-agnostic pruning;timescale optimization", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/d86e0dbdc96d62a023bc91a41b638f899c25509b.zip", "author": "Biswadeep Chakraborty;Beomseok Kang;Harshit Kumar;Saibal Mukhopadhyay", "authorids": "~Biswadeep_Chakraborty1;~Beomseok_Kang1;hkumar64@gatech.edu;~Saibal_Mukhopadhyay2", "gender": "M;M;;M", "homepage": ";https://sites.google.com/view/beomseok-kang;;https://greenlab.ece.gatech.edu", "dblp": "238/0554;309/1053;;66/1210", "google_scholar": "8soIjY8AAAAJ;kbqaf1EAAAAJ;;5KRtMEkAAAAJ", "orcid": ";;;0000-0002-8894-3390", "linkedin": ";;;", "or_profile": "~Biswadeep_Chakraborty1;~Beomseok_Kang1;hkumar64@gatech.edu;~Saibal_Mukhopadhyay2", "aff": "Georgia Institute of Technology;Georgia Institute of Technology;;Georgia Institute of Technology", "aff_domain": "gatech.edu;gatech.edu;;gatech.edu", "position": "PhD student;PhD student;;Full Professor", "bibtex": "@inproceedings{\nchakraborty2024sparse,\ntitle={Sparse Spiking Neural Network: Exploiting Heterogeneity in Timescales for Pruning Recurrent {SNN}},\nauthor={Biswadeep Chakraborty and Beomseok Kang and Harshit Kumar and Saibal Mukhopadhyay},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=0jsfesDZDq}\n}", "github": "", "project": "", "reviewers": "mdv5;MeNm;YTsp;udA5", "pdf_size": 12466223, "rating": "5;6;8;8", "confidence": "4;3;4;4", "soundness": "3;3;3;3", "contribution": "2;3;3;3", "presentation": "2;3;3;3", "wc_summary": "145;40;113;83", "wc_strengths": "18;64;63;69", "wc_weaknesses": "157;79;121;105", "wc_questions": "4;101;25;164", "wc_review": "324;284;322;421", "wc_reply_reviewers": "0;0;80;50", "wc_reply_authors": "1684;1534;1557;2817", "reply_reviewers": "0;0;1;1", "reply_authors": "3;3;3;6", "rating_avg": [ 6.75, 1.299038105676658 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 95.25, 38.70642711488623 ], "wc_strengths_avg": [ 53.5, 20.62159062730128 ], "wc_weaknesses_avg": [ 115.5, 28.26216552212516 ], "wc_questions_avg": [ 73.5, 63.5 ], "wc_review_avg": [ 337.75, 50.637807022026536 ], "wc_reply_reviewers_avg": [ 32.5, 34.18698582794336 ], "wc_reply_authors_avg": [ 1898.0, 533.6511032500542 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 3.75, 1.299038105676658 ], "replies_avg": [ 25, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.3333333333333333, "gs_citation": 14, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14817744695773258013&as_sdt=805&sciodt=0,3&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=0jsfesDZDq", "pdf": "https://openreview.net/pdf?id=0jsfesDZDq", "email": "gatech.edu;gatech.edu;;gatech.edu", "author_num": 4, "aff_unique_index": "0;0;0", "aff_unique_norm": "Georgia Institute of Technology", "aff_unique_dep": "", "aff_unique_url": "https://www.gatech.edu", "aff_unique_abbr": "Georgia Tech", 
"aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "0k85noSawb", "title": "Variance-Covariance Regularization Improves Representation Learning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Transfer learning plays a key role in advancing machine learning models, yet conventional supervised pretraining often undermines feature transferability by prioritizing features that minimize the pretraining loss. Recent progress in self-supervised learning (SSL) has introduced regularization techniques that bolster feature transferability. In this work, we adapt an SSL regularization technique from the VICReg method to supervised learning contexts, introducing Variance-Covariance Regularization (VCReg). This adaptation encourages the network to learn a high-variance, low-covariance representation, promoting the learning of more diverse features. We outline best practices for implementing this regularization framework into various neural network architectures and present an optimized strategy for regularizing intermediate representations. Through extensive empirical evaluation, we demonstrate that our method significantly enhances transfer learning, achieving excellent performance across numerous tasks and datasets. VCReg also improves performance in scenarios like long-tail learning, and hierarchical classification. Additionally, we conduct analyses to suggest that its effectiveness may stem from its success in addressing challenges like gradient starvation and neural collapse. In summary, VCReg offers a universally applicable regularization framework that significantly advances the state of transfer learning, highlights the connection between gradient starvation, neural collapse, and feature transferability, and potentially opens a new avenue for regularization in this domain.", "keywords": "Representation Learning;Transfer Learning;Regularization", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "", "author": "Jiachen Zhu;Ravid Shwartz-Ziv;Yubei Chen;Yann LeCun", "authorids": "~Jiachen_Zhu1;~Ravid_Shwartz-Ziv2;~Yubei_Chen1;~Yann_LeCun1", "gender": "M;M;M;M", "homepage": "https://cs.nyu.edu/~jz3224/;https://redwood.berkeley.edu/people/yubei-chen/;http://yann.lecun.com;https://www.ravid-shwartz-ziv.com/", "dblp": "250/0741-2;30/10064;l/YannLeCun;", "google_scholar": "https://scholar.google.com/citations?hl=en;WeyLqFUAAAAJ;WLN3QrAAAAAJ;https://scholar.google.co.il/citations?user=SqsLFwMAAAAJ", "orcid": ";;;", "linkedin": ";yubei-chen-05998a39/;;", "or_profile": "~Jiachen_Zhu1;~Yubei_Chen1;~Yann_LeCun1;~ravid_ziv1", "aff": "New York University;University of California, Davis;New York University;New York University", "aff_domain": "nyu.edu;ucdavis.edu;nyu.edu;nyu.edu", "position": "PhD student;Assistant Professor;Full Professor;Postdoc", "bibtex": "@misc{\nzhu2024variancecovariance,\ntitle={Variance-Covariance Regularization Improves Representation Learning},\nauthor={Jiachen Zhu and Ravid Shwartz-Ziv and Yubei Chen and Yann LeCun},\nyear={2024},\nurl={https://openreview.net/forum?id=0k85noSawb}\n}", "github": "", "project": "", "reviewers": "NHSr;qZNE;mHKo;DtqU", "site": "https://openreview.net/forum?id=0k85noSawb", "pdf_size": 378590, "rating": "3;3;5;5", "confidence": "4;4;4;3", "soundness": "1;2;2;2", "contribution": "1;2;2;2", "presentation": "1;4;3;3", "wc_summary": "49;85;27;102", "wc_strengths": "9;70;33;115", "wc_weaknesses": 
"224;127;189;233", "wc_questions": "760;168;2;106", "wc_review": "1042;450;251;556", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 1.75, 0.4330127018922193 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 2.75, 1.0897247358851685 ], "wc_summary_avg": [ 65.75, 29.439556722206262 ], "wc_strengths_avg": [ 56.75, 40.03982392568679 ], "wc_weaknesses_avg": [ 193.25, 41.63156855080049 ], "wc_questions_avg": [ 259.0, 295.2710619075293 ], "wc_review_avg": [ 574.75, 291.1403226968054 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 10, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=3137145687617437765&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "aff_unique_index": "0;1;0;0", "aff_unique_norm": "New York University;University of California, Davis", "aff_unique_dep": ";", "aff_unique_url": "https://www.nyu.edu;https://www.ucdavis.edu", "aff_unique_abbr": "NYU;UC Davis", "aff_campus_unique_index": "1", "aff_campus_unique": ";Davis", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "title": "MINDE: Mutual Information Neural Diffusion Estimation", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19605", "id": "0kWd8SJq8d", "author_site": "Giulio Franzese, Mustapha BOUNOUA, Pietro Michiardi", "tldr": "", "abstract": "In this work we present a new method for the estimation of Mutual Information (MI) between random variables. Our approach is based on an original interpretation of the Girsanov theorem, which allows us to use score-based diffusion models to estimate the KL divergence between two densities as a difference between their score functions. As a by-product, our method also enables the estimation of the entropy of random variables. \nArmed with such building blocks, we present a general recipe to measure MI, which unfolds in two directions: one uses conditional diffusion process, whereas the other uses joint diffusion processes that allow simultaneous modelling of two random variables. \nOur results, which derive from a thorough experimental protocol over all the variants of our approach, indicate that our method is more accurate than the main alternatives from the literature, especially for challenging distributions. 
Furthermore, our methods pass MI self-consistency tests, including data processing and additivity under independence, which instead are a pain-point of existing methods", "keywords": "mutual information;score matching;diffusion models", "primary_area": "probabilistic methods (Bayesian methods, variational inference, sampling, UQ, etc.)", "supplementary_material": "/attachment/21f8712040fa29b7638eb83c95cfc3888fe59c7b.zip", "author": "Giulio Franzese;Mustapha BOUNOUA;Pietro Michiardi", "authorids": "~Giulio_Franzese1;~Mustapha_BOUNOUA1;~Pietro_Michiardi1", "gender": "M;M;M", "homepage": ";https://mustaphabounoua.github.io/;http://www.eurecom.fr/~michiard/", "dblp": "217/1859.html;348/9789;54/3028", "google_scholar": "kEtx_WwAAAAJ;1ooHDEMAAAAJ;https://scholar.google.com.tw/citations?user=mlx1eCgAAAAJ", "orcid": "0000-0003-4244-2053;0009-0003-5244-8528;", "linkedin": ";mustb/;", "or_profile": "~Giulio_Franzese1;~Mustapha_BOUNOUA1;~Pietro_Michiardi1", "aff": "Eurecom;Eurecom;EURECOM", "aff_domain": "eurecom.fr;eurecom.fr;eurecom.fr", "position": "Postdoc;PhD student;Full Professor", "bibtex": "@inproceedings{\nfranzese2024minde,\ntitle={{MINDE}: Mutual Information Neural Diffusion Estimation},\nauthor={Giulio Franzese and Mustapha BOUNOUA and Pietro Michiardi},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=0kWd8SJq8d}\n}", "github": "", "project": "", "reviewers": "QLQ9;hHbr;N2Vu;a1nb", "pdf_size": 19358556, "rating": "6;6;6;8", "confidence": "2;2;3;3", "soundness": "3;2;4;4", "contribution": "2;2;3;3", "presentation": "2;3;2;3", "wc_summary": "83;121;11;76", "wc_strengths": "88;57;32;79", "wc_weaknesses": "106;93;734;249", "wc_questions": "460;86;57;74", "wc_review": "737;357;834;478", "wc_reply_reviewers": "352;27;500;151", "wc_reply_authors": "1672;616;1665;989", "reply_reviewers": "1;1;3;1", "reply_authors": "4;2;5;3", "rating_avg": [ 6.5, 0.8660254037844386 ], "confidence_avg": [ 2.5, 0.5 ], "soundness_avg": [ 3.25, 0.82915619758885 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 72.75, 39.5498103661699 ], "wc_strengths_avg": [ 64.0, 21.644860821913362 ], "wc_weaknesses_avg": [ 295.5, 260.4616094552132 ], "wc_questions_avg": [ 169.25, 168.18052057238972 ], "wc_review_avg": [ 601.5, 191.99544265424635 ], "wc_reply_reviewers_avg": [ 257.5, 181.80277775655685 ], "wc_reply_authors_avg": [ 1235.5, 452.6436236157536 ], "reply_reviewers_avg": [ 1.5, 0.8660254037844386 ], "reply_authors_avg": [ 3.5, 1.118033988749895 ], "replies_avg": [ 29, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.5773502691896257, "gs_citation": 12, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12753365406615297679&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=0kWd8SJq8d", "pdf": "https://openreview.net/pdf?id=0kWd8SJq8d", "email": "eurecom.fr;eurecom.fr;eurecom.fr", "author_num": 3, "aff_unique_index": "0;0;0", "aff_unique_norm": "EURECOM", "aff_unique_dep": "", "aff_unique_url": "https://www.eurecom.fr", "aff_unique_abbr": "", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "France" }, { "id": "0kvrymILfy", "title": "Making Predictors More Reliable with Selective Recalibration", "track": "main", "status": "Reject", "tldr": "", "abstract": "A reliable deep learning system should be able to accurately express its confidence with respect to its 
predictions, a quality known as calibration. One of the most effective ways to produce reliable confidence estimates with a pre-trained model is by applying a post-hoc recalibration method. Popular recalibration methods like temperature scaling are typically fit on a small amount of data and work in the model's output space, as opposed to the more expressive feature embedding space, and thus usually have only one or a handful of parameters. However, the target distribution to which they are applied is often complex and difficult to fit well with such a function. To this end we propose selective recalibration, where a selection model learns to reject some user-chosen proportion of the data in order to allow the recalibrator to focus on regions of the input space that can be well-captured by such a model. We provide theoretical analysis to motivate our algorithm, and test our method through comprehensive experiments on difficult medical imaging and zero-shot classification tasks. Our results show that selective recalibration consistently leads to significantly lower calibration error than a wide range of selection and recalibration baselines.", "keywords": "calibration;statistical learning", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/87fbedc398ec82602df4467c794e39d1ddcc41fa.zip", "author": "Thomas P Zollo;Zhun Deng;Jake Snell;Toniann Pitassi;Richard Zemel", "authorids": "~Thomas_P_Zollo1;~Zhun_Deng1;~Jake_Snell1;~Toniann_Pitassi3;~Richard_Zemel1", "gender": "M;M;M;F;M", "homepage": "https://www.thomaszollo.com/;https://www.zhundeng.org/;https://www.jakesnell.com;http://www.cs.columbia.edu/~toni;http://www.cs.columbia.edu/~zemel", "dblp": "336/8946;204/4353;172/1406;p/TPitassi;16/6366", "google_scholar": "Xp7LgAwAAAAJ;nkmi-moAAAAJ;MbXKAK8AAAAJ;;https://scholar.google.ca/citations?user=iBeDoRAAAAAJ", "orcid": ";;;;", "linkedin": "thomas-zollo/;;;;", "or_profile": "~Thomas_P_Zollo1;~Zhun_Deng1;~Jake_Snell1;~Toniann_Pitassi3;~Richard_Zemel1", "aff": "Columbia University;Columbia University;Princeton University;Columbia University;Department of Computer Science, University of Toronto", "aff_domain": "columbia.edu;columbia.edu;princeton.edu;columbia.edu;cs.toronto.edu", "position": "PhD student;Postdoc;Postdoc;Full Professor;Full Professor", "bibtex": "@misc{\nzollo2024making,\ntitle={Making Predictors More Reliable with Selective Recalibration},\nauthor={Thomas P Zollo and Zhun Deng and Jake Snell and Toniann Pitassi and Richard Zemel},\nyear={2024},\nurl={https://openreview.net/forum?id=0kvrymILfy}\n}", "github": "", "project": "", "reviewers": "NrpW;RXXm;6mVa;DcsN", "site": "https://openreview.net/forum?id=0kvrymILfy", "pdf_size": 868824, "rating": "3;5;5;8", "confidence": "3;4;2;5", "soundness": "3;3;2;3", "contribution": "2;2;2;3", "presentation": "3;3;2;4", "wc_summary": "119;82;86;203", "wc_strengths": "18;165;73;67", "wc_weaknesses": "260;193;161;279", "wc_questions": "1;101;6;281", "wc_review": "398;541;326;830", "wc_reply_reviewers": "81;106;291;22", "wc_reply_authors": "555;252;322;180", "reply_reviewers": "2;1;1;1", "reply_authors": "3;2;2;2", "rating_avg": [ 5.25, 1.7853571071357126 ], "confidence_avg": [ 3.5, 1.118033988749895 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 122.5, 48.64411577981452 ], "wc_strengths_avg": [ 80.75, 53.11485197192966 ], "wc_weaknesses_avg": [ 223.25, 48.0852108241193 ], 
"wc_questions_avg": [ 97.25, 113.32337578805178 ], "wc_review_avg": [ 523.75, 193.00566701524596 ], "wc_reply_reviewers_avg": [ 125.0, 100.57584202978367 ], "wc_reply_authors_avg": [ 327.25, 140.75044404903312 ], "reply_reviewers_avg": [ 1.25, 0.4330127018922193 ], "reply_authors_avg": [ 2.25, 0.4330127018922193 ], "replies_avg": [ 21, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.6888467201936643, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:FDLPOlQ8bYMJ:scholar.google.com/&scioq=Making+Predictors+More+Reliable+with+Selective+Recalibration&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;1;0;2", "aff_unique_norm": "Columbia University;Princeton University;University of Toronto", "aff_unique_dep": ";;Department of Computer Science", "aff_unique_url": "https://www.columbia.edu;https://www.princeton.edu;https://www.utoronto.ca", "aff_unique_abbr": "Columbia;Princeton;U of T", "aff_campus_unique_index": "1", "aff_campus_unique": ";Toronto", "aff_country_unique_index": "0;0;0;0;1", "aff_country_unique": "United States;Canada" }, { "id": "0lW9cDUtf8", "title": "FairReweighing: density estimation-based reweighing framework for improving separation in fair regression", "track": "main", "status": "Reject", "tldr": "", "abstract": "There has been a prevalence of implementing machine learning technologies in both high-stakes public-sector and industrial contexts. However, the lack of transparency in these algorithmic solutions has raised concerns over whether these data-informed decisions secure fairness against people from all racial, gender, or age groups. Despite the extensive research and work that emerged on fairness-aware machine learning, up till now, most efforts on solving this issue have been dedicated to binary classification tasks. In this work, we propose a density estimation-based pre-processing algorithm to train regression models satisfying the separation criterion $\\hat{Y} \\perp A \\mid Y$. 
Evaluated by the ratio estimation of separation via probabilistic classification on both synthetic and real world data, we show that the proposed algorithm outperforms existing state-of-the-art regression fairness solutions in terms of maintaining high predicting accuracy while improving separation in fair regression.", "keywords": "fairness;separation;reweighing;machine learning", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "XIAOYIN XI;Zhe Yu", "authorids": "~XIAOYIN_XI1;~Zhe_Yu3", "gender": "M;M", "homepage": ";https://zhe-yu.github.io/", "dblp": ";", "google_scholar": "h9693fMAAAAJ;MWWd15EAAAAJ", "orcid": ";0000-0002-6841-1725", "linkedin": ";", "or_profile": "~XIAOYIN_XI1;~Zhe_Yu3", "aff": "Rochester Institute of Technology;Rochester Institute of Technology", "aff_domain": "rit.edu;rit.edu", "position": "PhD student;Assistant Professor", "bibtex": "@misc{\nxi2024fairreweighing,\ntitle={FairReweighing: density estimation-based reweighing framework for improving separation in fair regression},\nauthor={XIAOYIN XI and Zhe Yu},\nyear={2024},\nurl={https://openreview.net/forum?id=0lW9cDUtf8}\n}", "github": "", "project": "", "reviewers": "gSA5;xkbJ;7rTx;NWYi", "site": "https://openreview.net/forum?id=0lW9cDUtf8", "pdf_size": 330958, "rating": "3;3;3;6", "confidence": "4;5;5;4", "soundness": "3;1;1;3", "contribution": "1;1;2;3", "presentation": "1;3;2;4", "wc_summary": "55;72;89;89", "wc_strengths": "18;29;59;71", "wc_weaknesses": "273;279;730;56", "wc_questions": "6;2;193;150", "wc_review": "352;382;1071;366", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "549;460;584;298", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 3.75, 1.299038105676658 ], "confidence_avg": [ 4.5, 0.5 ], "soundness_avg": [ 2.0, 1.0 ], "contribution_avg": [ 1.75, 0.82915619758885 ], "presentation_avg": [ 2.5, 1.118033988749895 ], "wc_summary_avg": [ 76.25, 14.095655359010449 ], "wc_strengths_avg": [ 44.25, 21.533404282648853 ], "wc_weaknesses_avg": [ 334.5, 245.37980764520947 ], "wc_questions_avg": [ 87.75, 85.13041465892199 ], "wc_review_avg": [ 542.75, 305.16993216894747 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 472.75, 110.5562639564127 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:1WsgfzHK320J:scholar.google.com/&scioq=FairReweighing:+density+estimation-based+reweighing+framework+for+improving+separation+in+fair+regression&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "Rochester Institute of Technology", "aff_unique_dep": "", "aff_unique_url": "https://www.rit.edu", "aff_unique_abbr": "RIT", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "id": "0oIkKERYhH", "title": "DOG: Discriminator-only Generation Beats GANs on Graphs", "track": "main", "status": "Reject", "tldr": "", "abstract": "We propose discriminator-only generation (DOG) as a generative modeling approach that bridges the gap between energy-based models (EBMs) and generative adversarial networks (GANs). DOG generates samples through iterative gradient descent on a discriminator's input, eliminating the need for a separate generator model. 
This simplification obviates the extensive tuning of generator architectures required by GANs. In the graph domain, where GANs have lagged behind diffusion approaches in generation quality, DOG demonstrates significant improvements over GANs using the same discriminator architectures. Surprisingly, despite its computationally intensive iterative generation, DOG produces higher-quality samples than GANs on the QM9 molecule dataset in less training time.", "keywords": "generative modeling;graph generation", "primary_area": "generative models", "supplementary_material": "/attachment/3dc2692c0fc643ad08ba8cb3e86ddd1ea0667108.zip", "author": "Franz Rieger;Joergen Kornfeld", "authorids": "~Franz_Rieger1;~Joergen_Kornfeld1", "gender": "M;M", "homepage": ";https://www.bi.mpg.de/kornfeld", "dblp": ";164/5639.html", "google_scholar": ";aT2MvAEAAAAJ", "orcid": ";0000-0002-2547-8700", "linkedin": "riegerfr/;", "or_profile": "~Franz_Rieger1;~J\u00f6rgen_Kornfeld1", "aff": "Max-Planck Institute for Biological Intelligence;MPI for Biological Intelligence", "aff_domain": "bi.mpg.de;bi.mpg.de", "position": "PhD student;Principal Researcher", "bibtex": "@misc{\nrieger2024dog,\ntitle={{DOG}: Discriminator-only Generation Beats {GAN}s on Graphs},\nauthor={Franz Rieger and Joergen Kornfeld},\nyear={2024},\nurl={https://openreview.net/forum?id=0oIkKERYhH}\n}", "github": "", "project": "", "reviewers": "8BtC;SsB3;2QS2;5Xb1", "site": "https://openreview.net/forum?id=0oIkKERYhH", "pdf_size": 6692319, "rating": "3;3;5;6", "confidence": "4;4;4;3", "soundness": "3;2;2;2", "contribution": "2;2;2;3", "presentation": "2;3;3;2", "wc_summary": "52;67;70;129", "wc_strengths": "74;37;39;75", "wc_weaknesses": "152;112;404;79", "wc_questions": "198;33;74;6", "wc_review": "476;249;587;289", "wc_reply_reviewers": "97;0;269;47", "wc_reply_authors": "861;211;848;124", "reply_reviewers": "1;0;1;1", "reply_authors": "2;1;2;1", "rating_avg": [ 4.25, 1.299038105676658 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 79.5, 29.381116384507923 ], "wc_strengths_avg": [ 56.25, 18.267115262131565 ], "wc_weaknesses_avg": [ 186.75, 128.06516895705875 ], "wc_questions_avg": [ 77.75, 73.52678083528477 ], "wc_review_avg": [ 400.25, 137.7195973708898 ], "wc_reply_reviewers_avg": [ 103.25, 101.65720584395383 ], "wc_reply_authors_avg": [ 511.0, 344.90505940040947 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.7777777777777777, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:YnXbYPZHPeoJ:scholar.google.com/&scioq=DOG:+Discriminator-only+Generation+Beats+GANs+on+Graphs&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1", "aff_unique_norm": "Max-Planck Institute for Biological Intelligence;Max Planck Institute for Biological Cybernetics", "aff_unique_dep": ";Biological Cybernetics", "aff_unique_url": "https://www mpi-bi.de;https://www.biological-cybernetics.de", "aff_unique_abbr": ";MPIBC", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "Germany" }, { "id": "0pBX9FLGRR", "title": "Decoupled Diffusion Models: Image to Zero and Zero to Noise", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "This paper proposes decoupled diffusion models (DDMs), 
featuring a new diffusion paradigm that allows for high-quality (un)conditioned image generation in less than 10 function evaluations. In a nutshell, DDMs decouple the forward image-to-noise mapping into image-to-zero mapping and zero-to-noise mapping. Under this framework, we mathematically derive 1) the training objectives and 2) the reverse-time sampling formula based on an analytic transition probability which models the image-to-zero transition. The former enables DDMs to learn noise and image components separately, which simplifies learning. Importantly, because of the latter's analyticity in the zero-to-image sampling function, DDMs can avoid the ordinary differential equation based accelerators and instead naturally perform sampling with an arbitrary step size. Under the few function evaluation setup, DDMs experimentally yield very competitive performance compared with the state of the art in 1) unconditioned image generation, e.g., CIFAR-10 and CelebA-HQ-256 and 2) image-conditioned downstream tasks such as super-resolution, saliency detection, and image inpainting.", "keywords": "Diffusion Probabilistic Models; Decoupled Diffusion Models", "primary_area": "generative models", "supplementary_material": "", "author": "Yuhang Huang;Liang Zheng;Zheng Qin;Xinwang Liu;Kai Xu", "authorids": "~Yuhang_Huang1;~Liang_Zheng4;~Zheng_Qin2;~Xinwang_Liu1;~Kai_Xu5", "gender": "M;M;M;M;M", "homepage": ";http://zheng-lab.cecs.anu.edu.au/;;https://xinwangliu.github.io/;http://kevinkaixu.net/", "dblp": ";61/7360-1;95/6861-2;45/6569-2.html;Xu_0004:Kai", "google_scholar": "https://scholar.google.com/citations?hl=zh-CN;https://scholar.google.com.au/citations?user=vNHqr3oAAAAJ;DnHBAN0AAAAJ;A56vWC4AAAAJ;https://scholar.google.com.hk/citations?user=GuVkg-8AAAAJ", "orcid": ";;0000-0003-4373-4111;;", "linkedin": ";liang-zheng-76341311a/;;;", "or_profile": "~Yuhang_Huang1;~Liang_Zheng4;~Zheng_Qin2;~Xinwang_Liu1;~Kevin_Xu1", "aff": "National University of Defense Technology;Australian National University;National University of Defense Technology;National University of Defense Technology;National University of Defense Technology", "aff_domain": "nudt.edu.cn;anu.edu.au;nudt.edu.cn;nudt.edu.cn;nudt.edu.cn", "position": "PhD student;Associate Professor;Assistant Professor;Full Professor;Professor", "bibtex": "@misc{\nhuang2024decoupled,\ntitle={Decoupled Diffusion Models: Image to Zero and Zero to Noise},\nauthor={Yuhang Huang and Liang Zheng and Zheng Qin and Xinwang Liu and Kai Xu},\nyear={2024},\nurl={https://openreview.net/forum?id=0pBX9FLGRR}\n}", "github": "", "project": "", "reviewers": "7ZTA;UWnj;D5Rq;Jv4X", "site": "https://openreview.net/forum?id=0pBX9FLGRR", "pdf_size": 14956234, "rating": "3;3;3;5", "confidence": "5;3;4;4", "soundness": "2;3;2;3", "contribution": "1;2;2;2", "presentation": "2;3;2;2", "wc_summary": "82;51;106;136", "wc_strengths": "42;45;47;60", "wc_weaknesses": "944;315;552;121", "wc_questions": "12;3;6;139", "wc_review": "1080;414;711;456", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 3.5, 0.8660254037844386 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 93.75, 31.227992250543423 ], "wc_strengths_avg": [ 48.5, 6.87386354243376 ], "wc_weaknesses_avg": [ 483.0,
306.818350168304 ], "wc_questions_avg": [ 40.0, 57.24945414586937 ], "wc_review_avg": [ 665.25, 265.0578946192699 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:Ll7rPf4M4qMJ:scholar.google.com/&scioq=Decoupled+Diffusion+Models:+Image+to+Zero+and+Zero+to+Noise&hl=en&as_sdt=0,44", "gs_version_total": 0, "aff_unique_index": "0;1;0;0;0", "aff_unique_norm": "National University of Defense Technology;Australian National University", "aff_unique_dep": ";", "aff_unique_url": "http://www.nudt.edu.cn/;https://www.anu.edu.au", "aff_unique_abbr": "NUDT;ANU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;0;0;0", "aff_country_unique": "China;Australia" }, { "id": "0rXGGYNVAw", "title": "Unlocking the Potential of Federated Learning for Deeper Models", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Federated learning (FL) is a new paradigm for distributed machine learning that allows a global model to be trained across multiple clients without compromising their privacy. Although FL has demonstrated remarkable success in various scenarios, recent studies mainly utilize shallow and small neural networks. In our research, we discover a significant performance decline when applying the existing FL framework to deeper neural networks, even when client data are independently and identically distributed. Our further investigation shows that the decline is due to the continuous accumulation of dissimilarities among client models during the layer-by-layer back-propagation process, which we refer to as \"divergence accumulation.\" As deeper models involve a longer chain of divergence accumulation, they tend to exhibit more significant divergence, subsequently leading to performance decline. Both theoretical derivations and empirical evidence are proposed to support the existence of divergence accumulation and its amplified effects in deeper models. To tackle this challenge, we propose a set of technical guidelines centered on minimizing divergence. These guidelines, consisting of strategies such as employing wider models and reducing the receptive field, greatly improve the performance of FL on deeper models. Their effectiveness is validated via extensive evaluation with various metrics. 
For example, applying the guidelines can boost the performance of ResNet101 on the Tiny-ImageNet dataset by as much as 43\\%.", "keywords": "Federated Learning;Distributed Model Optimization", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Haolin Wang;Xuefeng Liu;Jianwei Niu;Shaojie Tang;Jiaxing Shen", "authorids": "~Haolin_Wang6;~Xuefeng_Liu5;~Jianwei_Niu3;~Shaojie_Tang2;~Jiaxing_Shen2", "gender": "M;M;M;;M", "homepage": ";;https://shi.buaa.edu.cn/jwniu/zh_CN/index.htm;;https://shenjiaxing.github.io", "dblp": ";96/600-1;25/4653-2;;", "google_scholar": "https://scholar.google.com/citations?hl=zh-CN;https://scholar.google.com/citations?hl=en;KOciOtEAAAAJ;;amJMlVoAAAAJ", "orcid": "0000-0002-0659-2006;;0000-0003-3946-5107;;0000-0002-0833-0288", "linkedin": ";;;;", "or_profile": "~Haolin_Wang6;~Xuefeng_Liu5;~Jianwei_Niu3;~Shaojie_Tang2;~Jiaxing_Shen2", "aff": "Beihang University;Behang University;Beihang University;;Lingnan University", "aff_domain": "buaa.edu.cn;buaa.edu.cn;buaa.edu.cn;;ln.edu.hk", "position": "MS student;Associate Professor;Full Professor;;Assistant Professor", "bibtex": "@misc{\nwang2024unlocking,\ntitle={Unlocking the Potential of Federated Learning for Deeper Models},\nauthor={Haolin Wang and Xuefeng Liu and Jianwei Niu and Shaojie Tang and Jiaxing Shen},\nyear={2024},\nurl={https://openreview.net/forum?id=0rXGGYNVAw}\n}", "github": "", "project": "", "reviewers": "wvyK;w79q;pCdo", "site": "https://openreview.net/forum?id=0rXGGYNVAw", "pdf_size": 444445, "rating": "1;3;6", "confidence": "4;4;2", "soundness": "1;2;2", "contribution": "1;3;2", "presentation": "2;3;3", "wc_summary": "63;38;62", "wc_strengths": "26;38;28", "wc_weaknesses": "405;220;56", "wc_questions": "77;89;166", "wc_review": "571;385;312", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 3.3333333333333335, 2.0548046676563256 ], "confidence_avg": [ 3.3333333333333335, 0.9428090415820634 ], "soundness_avg": [ 1.6666666666666667, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.816496580927726 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 54.333333333333336, 11.55662388223981 ], "wc_strengths_avg": [ 30.666666666666668, 5.2493385826745405 ], "wc_weaknesses_avg": [ 227.0, 142.56460523799961 ], "wc_questions_avg": [ 110.66666666666667, 39.43207943906698 ], "wc_review_avg": [ 422.6666666666667, 109.03923860498823 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 3, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.9176629354822472, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=2558871393691791377&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "aff_unique_index": "0;1;0;2", "aff_unique_norm": "Beihang University;Behang University;Lingnan University", "aff_unique_dep": ";;", "aff_unique_url": "http://www.buaa.edu.cn/;;http://www.lingnan.edu.cn", "aff_unique_abbr": "BUAA;;LNU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "China;" }, { "id": "0sO2euxhUQ", "title": "Learning Latent Structural Causal Models", "track": "main", "status": "Reject", "tldr": "", "abstract": "Causal learning has long concerned itself with the recovery of underlying causal mechanisms. 
Such causal modelling enables better explanations of out-of-distribution data. Prior works on causal learning assume that the causal variables are given. However, in machine learning tasks, one often operates on low-level data like image pixels or high-dimensional vectors. In such settings, the entire Structural Causal Model (SCM) -- structure, parameters, \\textit{and} high-level causal variables -- is latent and needs to be learnt from low-level data. We treat this problem as Bayesian inference of the latent SCM, given low-level data. We present BIOLS, a tractable approximate inference method which performs joint inference over the causal variables, structure and parameters of the latent SCM from known interventions. Experiments are performed on synthetic datasets and a causal benchmark image dataset to demonstrate the efficacy of our approach. We also demonstrate the ability of BIOLS to generate images from unseen interventional distributions.", "keywords": "Bayesian Causal Discovery;Latent variable models", "primary_area": "probabilistic methods (Bayesian methods, variational inference, sampling, UQ, etc.)", "supplementary_material": "", "author": "Jithendaraa Subramanian;Yashas Annadani;Tristan Deleu;Ivaxi Sheth;Nan Rosemary Ke;Stefan Bauer;Derek Nowrouzezahrai;Samira Ebrahimi Kahou", "authorids": "~Jithendaraa_Subramanian1;~Yashas_Annadani1;~Tristan_Deleu1;~Ivaxi_Sheth1;~Nan_Rosemary_Ke1;~Stefan_Bauer1;~Derek_Nowrouzezahrai1;~Samira_Ebrahimi_Kahou1", "gender": "M;;;F;F;;Not Specified;F", "homepage": "https://jithendaraa.github.io/;https://yashasannadani.com;https://tristandeleu.github.io/;;https://nke001.github.io/;https://cifar.ca/bios/stefan-bauer/;https://www.cim.mcgill.ca/~derek/;https://saebrahimi.github.io", "dblp": "281/6755;190/7411;192/1896;291/2912.html;120/5291;;30/4225;20/11069", "google_scholar": "s0BzYvYAAAAJ;ExgzcVMAAAAJ;nLNwh-wAAAAJ;Isz5M1UAAAAJ;https://scholar.google.ca/citations?user=dxwPYhQAAAAJ;O-oICE8AAAAJ;https://scholar.google.ca/citations?user=nCZ2PMcAAAAJ;https://scholar.google.ca/citations?user=F99FuaAAAAAJ", "orcid": ";;;;;;;", "linkedin": "jithendaraa-subramanian-85a22b176/;;;;;;;", "or_profile": "~Jithendaraa_Subramanian1;~Yashas_Annadani1;~Tristan_Deleu1;~Ivaxi_Sheth1;~Nan_Rosemary_Ke1;~Stefan_Bauer1;~Derek_Nowrouzezahrai1;~Samira_Ebrahimi_Kahou1", "aff": "McGill University, McGill University;Max Planck Institute for Intelligent Systems, Max-Planck Institute;University of Montreal;CISPA, saarland university, saarland informatics campus;Google DeepMind;Technische Universit\u00e4t M\u00fcnchen;McGill University;\u00c9cole de technologie sup\u00e9rieure", "aff_domain": "mail.mcgill.ca;tuebingen.mpg.de;umontreal.ca;cispa.saarland;deepmind.com;tum.de;mcgill.ca;etsmtl.ca", "position": "MS student;PhD student;PhD student;PhD student;Researcher;Associate Professor;Full Professor;Associate Professor", "bibtex": "@misc{\nsubramanian2024learning,\ntitle={Learning Latent Structural Causal Models},\nauthor={Jithendaraa Subramanian and Yashas Annadani and Tristan Deleu and Ivaxi Sheth and Nan Rosemary Ke and Stefan Bauer and Derek Nowrouzezahrai and Samira Ebrahimi Kahou},\nyear={2024},\nurl={https://openreview.net/forum?id=0sO2euxhUQ}\n}", "github": "", "project": "", "reviewers": "DxH4;YGzo;WQKo;h7nM", "site": "https://openreview.net/forum?id=0sO2euxhUQ", "pdf_size": 833989, "rating": "3;3;5;5", "confidence": "4;4;3;3", "soundness": "2;2;1;2", "contribution": "1;2;2;2", "presentation": "3;3;3;2", "wc_summary": "39;55;91;65", "wc_strengths": "19;27;46;331", 
"wc_weaknesses": "68;92;490;2", "wc_questions": "56;52;231;2", "wc_review": "182;226;858;400", "wc_reply_reviewers": "0;25;212;290", "wc_reply_authors": "971;1318;4433;1439", "reply_reviewers": "0;1;1;1", "reply_authors": "2;2;8;3", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 1.75, 0.4330127018922193 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 62.5, 18.887826767524103 ], "wc_strengths_avg": [ 105.75, 130.41735889060166 ], "wc_weaknesses_avg": [ 163.0, 191.64811504421326 ], "wc_questions_avg": [ 85.25, 86.79681733796464 ], "wc_review_avg": [ 416.5, 267.6167969317322 ], "wc_reply_reviewers_avg": [ 131.75, 122.71588120532729 ], "wc_reply_authors_avg": [ 2040.25, 1392.0932754309247 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 3.75, 2.48746859276655 ], "replies_avg": [ 24, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": -1.0, "gs_citation": 5, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12399942743285689830&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "aff_unique_index": "0;1;2;3;4;5;0;6", "aff_unique_norm": "McGill University;Max Planck Institute for Intelligent Systems;University of Montreal;Saarland University;Google;Technische Universit\u00e4t M\u00fcnchen;\u00c9cole de technologie sup\u00e9rieure", "aff_unique_dep": ";Intelligent Systems;;CISPA;Google DeepMind;;", "aff_unique_url": "https://www.mcgill.ca;https://www.mpi-is.mpg.de;https://wwwumontreal.ca;https://www.uni-saarland.de;https://deepmind.com;https://www.tum.de;https://www.etsmtl.ca", "aff_unique_abbr": "McGill;MPI-IS;UM;Saarland U;DeepMind;TUM;ETS", "aff_campus_unique_index": "1", "aff_campus_unique": ";Saarland Informatics Campus", "aff_country_unique_index": "0;1;0;1;2;1;0;0", "aff_country_unique": "Canada;Germany;United Kingdom" }, { "id": "0sbIEkIutN", "title": "From Interpolation to Extrapolation: Complete Length Generalization for Arithmetic Transformers", "track": "main", "status": "Reject", "tldr": "", "abstract": "Since its introduction, the transformer model has demonstrated outstanding performance across various tasks. However, there are still unresolved issues regarding length generalization, particularly in algorithmic tasks. In this paper, we focus on investigating the inherent capabilities of transformer models in learning arithmetic algorithms, such as addition and multiplication. Through experiments and attention analysis, we identify a number of crucial factors for achieving optimal length generalization. We show that transformer models are able to generalize to arbitrarily long lengths with the help of targeted attention biasing. Building on this, we introduce Attention Bias Calibration (ABC), a calibration stage that enables the model to automatically learn the proper attention biases, which we link to mechanisms in relative position encoding. 
We demonstrate that using ABC, the transformer model can achieve unprecedented perfect length generalization on certain arithmetic tasks.", "keywords": "Transformer;Length Generalization;Attention;Arithmetic", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Shaoxiong Duan;Yining Shi", "authorids": "~Shaoxiong_Duan1;~Yining_Shi2", "gender": "M;", "homepage": "https://github.com/shaoxiongduan;https://icc.rdfz.cn/CHN_RDFZ_SZLL/CHN_RDFZ_SLKJXK/index_2.html", "dblp": ";", "google_scholar": ";", "orcid": ";", "linkedin": ";", "or_profile": "~Shaoxiong_Duan1;~Yining_Shi2", "aff": "International Curriculum Centre, RDFZ;", "aff_domain": "icc.rdfz.cn;", "position": "Undergrad student;", "bibtex": "@misc{\nduan2024from,\ntitle={From Interpolation to Extrapolation: Complete Length Generalization for Arithmetic Transformers},\nauthor={Shaoxiong Duan and Yining Shi},\nyear={2024},\nurl={https://openreview.net/forum?id=0sbIEkIutN}\n}", "github": "", "project": "", "reviewers": "usKR;69hA;hH7Y;25Z2", "site": "https://openreview.net/forum?id=0sbIEkIutN", "pdf_size": 954799, "rating": "5;5;6;6", "confidence": "4;4;4;4", "soundness": "3;2;3;3", "contribution": "2;2;3;3", "presentation": "2;2;3;2", "wc_summary": "63;57;88;168", "wc_strengths": "26;20;45;70", "wc_weaknesses": "241;174;208;248", "wc_questions": "27;4;267;168", "wc_review": "357;255;608;654", "wc_reply_reviewers": "157;0;201;24", "wc_reply_authors": "565;272;662;692", "reply_reviewers": "1;0;1;1", "reply_authors": "1;1;1;1", "rating_avg": [ 5.5, 0.5 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 94.0, 44.27753380666091 ], "wc_strengths_avg": [ 40.25, 19.49839737004044 ], "wc_weaknesses_avg": [ 217.75, 29.431063521388417 ], "wc_questions_avg": [ 116.5, 107.2019122963765 ], "wc_review_avg": [ 468.5, 167.24607618715604 ], "wc_reply_reviewers_avg": [ 95.5, 85.35953373818299 ], "wc_reply_authors_avg": [ 547.75, 165.97947915329775 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 7, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11404935692635392920&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "aff_unique_index": "0", "aff_unique_norm": "RDFZ International Curriculum Centre", "aff_unique_dep": "International Curriculum Centre", "aff_unique_url": "", "aff_unique_abbr": "RDFZ ICC", "aff_country_unique_index": "0", "aff_country_unique": "China" }, { "title": "Retrieval-Guided Reinforcement Learning for Boolean Circuit Minimization", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19604", "id": "0t1O8ziRZp", "author_site": "Animesh Basak Chowdhury, Marco Romanelli, Benjamin Tan, Ramesh Karri, Siddharth Garg", "tldr": "", "abstract": "Logic synthesis, a pivotal stage in chip design, entails optimizing chip specifications encoded in hardware description languages like Verilog into highly efficient implementations using Boolean logic gates. The process involves a sequential application of logic minimization heuristics (``synthesis recipe\"), with their arrangement significantly impacting crucial metrics such as area and delay. 
Addressing the challenge posed by the broad spectrum of hardware design complexities \u2014 from variations of past designs (e.g., adders and multipliers) to entirely novel configurations (e.g., innovative processor instructions) \u2014 requires a nuanced 'synthesis recipe' guided by human expertise and intuition. This study conducts a thorough examination of learning and search techniques for logic synthesis, unearthing a surprising revelation: pre-trained agents, when confronted with entirely novel designs, may veer off course, detrimentally affecting the search trajectory. We present ABC-RL, a meticulously tuned $\\alpha$ parameter that adeptly adjusts recommendations from pre-trained agents during the search process. Computed based on similarity scores through nearest neighbor retrieval from the training dataset, ABC-RL yields superior synthesis recipes tailored for a wide array of hardware designs. Our findings showcase substantial enhancements in the Quality of Result (QoR) of synthesized circuits, boasting improvements of up to 24.8\\% compared to state-of-the-art techniques. Furthermore, ABC-RL achieves an impressive up to 9x reduction in runtime (iso-QoR) when compared to current state-of-the-art methodologies.", "keywords": "Electronics Design Automation (EDA);Logic Synthesis;Reinforcement Learning;Hardware design;Circuits", "primary_area": "infrastructure, software libraries, hardware, etc.", "supplementary_material": "/attachment/96d64b30ce8657cadea469fc4c3cdb5c78c4313c.zip", "author": "Animesh Basak Chowdhury;Marco Romanelli;Benjamin Tan;Ramesh Karri;Siddharth Garg", "authorids": "~Animesh_Basak_Chowdhury1;~Marco_Romanelli1;~Benjamin_Tan1;~Ramesh_Karri1;~Siddharth_Garg1", "gender": "M;;M;M;M", "homepage": "https://gitlab.com/animeshbchowdhury;;;http://engineering.nyu.edu/people/ramesh-karri/;http://engineering.nyu.edu/people/siddharth-garg/", "dblp": "217/4860;;https://dblp.uni-trier.de/pid/195/3070;;94/3807", "google_scholar": "_7dNuMwAAAAJ;;GOjr_RAAAAAJ;https://scholar.google.com.tw/citations?user=o60TaTEAAAAJ;https://scholar.google.com.tw/citations?user=Yf8OqQQAAAAJ", "orcid": ";;0000-0002-7642-3638;;", "linkedin": ";;;;", "or_profile": "~Animesh_Basak_Chowdhury1;~Marco_Romanelli1;~Benjamin_Tan1;~Ramesh_Karri1;~Siddharth_Garg1", "aff": "Qualcomm Inc, QualComm;;University of Calgary;New York University;New York University", "aff_domain": "qti.qualcomm.com;;ucalgary.ca;nyu.edu;nyu.edu", "position": "Researcher;;Assistant Professor;Full Professor;Associate Professor", "bibtex": "@inproceedings{\nchowdhury2024retrievalguided,\ntitle={Retrieval-Guided Reinforcement Learning for Boolean Circuit Minimization},\nauthor={Animesh Basak Chowdhury and Marco Romanelli and Benjamin Tan and Ramesh Karri and Siddharth Garg},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=0t1O8ziRZp}\n}", "github": "", "project": "", "reviewers": "3ENJ;yxFf;qBwB;Pwwd;pgL7", "pdf_size": 1216286, "rating": "5;6;6;6;8", "confidence": "4;5;4;3;4", "soundness": "2;2;2;3;4", "contribution": "2;2;3;2;3", "presentation": "3;3;3;3;4", "wc_summary": "65;51;58;107;144", "wc_strengths": "69;38;70;62;121", "wc_weaknesses": "149;109;231;64;24", "wc_questions": "6;23;7;34;48", "wc_review": "289;221;366;267;337", "wc_reply_reviewers": "419;0;0;0;0", "wc_reply_authors": "3119;402;1408;473;174", "reply_reviewers": "4;0;0;0;0", "reply_authors": "7;2;3;2;1", "rating_avg": [ 6.2, 0.9797958971132712 ], "confidence_avg": [ 4.0, 0.6324555320336759 
], "soundness_avg": [ 2.6, 0.8 ], "contribution_avg": [ 2.4, 0.4898979485566356 ], "presentation_avg": [ 3.2, 0.39999999999999997 ], "wc_summary_avg": [ 85.0, 35.35533905932738 ], "wc_strengths_avg": [ 72.0, 27.09243436828813 ], "wc_weaknesses_avg": [ 115.4, 71.4551607653359 ], "wc_questions_avg": [ 23.6, 16.057397049335236 ], "wc_review_avg": [ 296.0, 51.17812032499826 ], "wc_reply_reviewers_avg": [ 83.8, 167.6 ], "wc_reply_authors_avg": [ 1115.2, 1087.0031094711735 ], "reply_reviewers_avg": [ 0.8, 1.6000000000000003 ], "reply_authors_avg": [ 3.0, 2.0976176963403033 ], "replies_avg": [ 27, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 5, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=4042388069948974798&as_sdt=5,47&sciodt=0,47&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=0t1O8ziRZp", "pdf": "https://openreview.net/pdf?id=0t1O8ziRZp", "email": "qti.qualcomm.com;;ucalgary.ca;nyu.edu;nyu.edu", "author_num": 5, "aff_unique_index": "0;1;2;2", "aff_unique_norm": "Qualcomm Incorporated;University of Calgary;New York University", "aff_unique_dep": ";;", "aff_unique_url": "https://www.qualcomm.com;https://www.ucalgary.ca;https://www.nyu.edu", "aff_unique_abbr": "Qualcomm;U of C;NYU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;0;0", "aff_country_unique": "United States;Canada" }, { "title": "Distributional Preference Learning: Understanding and Accounting for Hidden Context in RLHF", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19603", "id": "0tWTxYYPnW", "author_site": "Anand Siththaranjan, Cassidy Laidlaw, Dylan Hadfield-Menell", "tldr": "", "abstract": "In practice, preference learning from human feedback depends on incomplete data with hidden context. Hidden context refers to data that affects the feedback received, but which is not represented in the data used to train a preference model. This captures common issues of data collection, such as having human annotators with varied preferences, cognitive processes that result in seemingly irrational behavior, and combining data labeled according to different criteria. We prove that standard applications of preference learning, including reinforcement learning from human feedback (RLHF), implicitly aggregate over hidden contexts according to a well-known voting rule called *Borda count*. We show this can produce counter-intuitive results that are very different from other methods which implicitly aggregate via expected utility. Furthermore, our analysis formalizes the way that preference learning from users with diverse values tacitly implements a social choice function. A key implication of this result is that annotators have an incentive to misreport their preferences in order to influence the learned model, leading to vulnerabilities in the deployment of RLHF. As a step towards mitigating these problems, we introduce a class of methods called *distributional preference learning* (DPL). DPL methods estimate a distribution of possible score values for each alternative in order to better account for hidden context. 
Experimental results indicate that applying DPL to RLHF for LLM chatbots identifies hidden context in the data and significantly reduces subsequent jailbreak vulnerability.", "keywords": "Preference Learning;Reinforcement Learning from Human Feedback;Social Choice Theory", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Anand Siththaranjan;Cassidy Laidlaw;Dylan Hadfield-Menell", "authorids": "~Anand_Siththaranjan1;~Cassidy_Laidlaw1;~Dylan_Hadfield-Menell2", "gender": "M;M;M", "homepage": ";https://cassidylaidlaw.com;http://people.csail.mit.edu/dhm/", "dblp": ";241/5375;135/8332", "google_scholar": "qYXPDjQAAAAJ;DzeJ67UAAAAJ;4mVPFQ8AAAAJ", "orcid": ";;0000-0002-6168-4763", "linkedin": ";;", "or_profile": "~Anand_Siththaranjan1;~Cassidy_Laidlaw1;~Dylan_Hadfield-Menell2", "aff": "University of California, Berkeley;University of California, Berkeley;Massachusetts Institute of Technology", "aff_domain": "berkeley.edu;berkeley.edu;mit.edu", "position": "PhD student;PhD student;Assistant Professor", "bibtex": "@inproceedings{\nsiththaranjan2024distributional,\ntitle={Distributional Preference Learning: Understanding and Accounting for Hidden Context in {RLHF}},\nauthor={Anand Siththaranjan and Cassidy Laidlaw and Dylan Hadfield-Menell},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=0tWTxYYPnW}\n}", "github": "", "project": "", "reviewers": "i1j8;9LkN;fmx5;PKnu", "pdf_size": 443558, "rating": "5;6;6;8", "confidence": "3;2;3;2", "soundness": "2;3;3;3", "contribution": "2;3;3;3", "presentation": "3;2;3;3", "wc_summary": "83;121;123;55", "wc_strengths": "22;67;127;117", "wc_weaknesses": "161;34;100;62", "wc_questions": "7;713;125;3", "wc_review": "273;935;475;237", "wc_reply_reviewers": "128;63;0;4", "wc_reply_authors": "551;1126;977;236", "reply_reviewers": "1;1;0;1", "reply_authors": "1;2;2;1", "rating_avg": [ 6.25, 1.0897247358851685 ], "confidence_avg": [ 2.5, 0.5 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 95.5, 28.297526393662043 ], "wc_strengths_avg": [ 83.25, 42.03792930200059 ], "wc_weaknesses_avg": [ 89.25, 47.58873291021731 ], "wc_questions_avg": [ 212.0, 293.3751864081214 ], "wc_review_avg": [ 480.0, 277.91545476997135 ], "wc_reply_reviewers_avg": [ 48.75, 52.112258634605354 ], "wc_reply_authors_avg": [ 722.5, 351.31075986937833 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.6882472016116854, "gs_citation": 58, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=4301635191466793158&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=0tWTxYYPnW", "pdf": "https://openreview.net/pdf?id=0tWTxYYPnW", "email": "berkeley.edu;berkeley.edu;mit.edu", "author_num": 3, "aff_unique_index": "0;0;1", "aff_unique_norm": "University of California, Berkeley;Massachusetts Institute of Technology", "aff_unique_dep": ";", "aff_unique_url": "https://www.berkeley.edu;https://web.mit.edu", "aff_unique_abbr": "UC Berkeley;MIT", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Berkeley;", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "0tsJ7Nv5hk", "title": "Harnessing Orthogonality 
to Train Low-Rank Neural Networks", "track": "main", "status": "Reject", "tldr": "", "abstract": "In the realm of neural network training, the question of what is truly being learned beyond mathematical optimization has intrigued researchers for decades. \nThis study delves into the essence of neural network weights. \nBy leveraging the principles of singular value decomposition, we explore the hypothesis that the orthogonal bases of the low-rank decomposition of neural network weights stabilize during training, and provide experimental evidence to support this notion. \nBuilding upon this insight, we introduce Orthogonality-Informed Adaptive Low-Rank neural network training. \nOur novel approach seamlessly integrates into existing training workflows with minimal accuracy loss, as demonstrated by benchmarking on various datasets and well-established network architectures. \nWe find that, through standard tuning procedures, our method surpasses the performance of conventional training setups. \nFinally, we showcase the effectiveness of our tuned low-rank training procedure by applying it to a state-of-the-art transformer model for time series prediction.", "keywords": "orthogonal;low rank;low-rank;svd;compression;optimization", "primary_area": "learning theory", "supplementary_material": "/attachment/acee7a6f965fc83b773aa14440a746ece0302445.pdf", "author": "Daniel Coquelin;Katharina Fl\u00fcgel;Marie Weiel;Nicholas Kiefer;Charlotte Debus;Achim Streit;Markus G\u00f6tz", "authorids": "~Daniel_Coquelin1;~Katharina_Fl\u00fcgel1;~Marie_Weiel1;~Nicholas_Kiefer1;~Charlotte_Debus1;~Achim_Streit1;~Markus_G\u00f6tz1", "gender": ";;F;M;F;M;M", "homepage": ";;;https://scholar.google.com/citations?view_op=list_works&hl=de&user=nfgHgAQAAAAJ;;http://www.scc.kit.edu/personen/achim.streit.php;https://www.scc.kit.edu/personen/11452.php", "dblp": "271/0898;;269/0868;;;s/AchimStreit;70/8283", "google_scholar": "6dHRVREAAAAJ;;xCAzgAIAAAAJ;https://scholar.google.com/citations?view_op=list_works;https://scholar.google.com/citations?hl=de;https://scholar.google.de/citations?user=i72A44MAAAAJ;https://scholar.google.de/citations?user=eD2svJQAAAAJ", "orcid": "0000-0001-8552-5153;;0000-0001-9648-4385;;0000-0002-7156-2022;0000-0002-5065-469X;0000-0002-2233-1041", "linkedin": ";;;;;achimstreit/;", "or_profile": "~Daniel_Coquelin1;~Katharina_Fl\u00fcgel1;~Marie_Weiel1;~Nicholas_Kiefer1;~Charlotte_Debus1;~Achim_Streit1;~Markus_G\u00f6tz1", "aff": "Karlsruher Institut f\u00fcr Technologie;;Karlsruher Institut f\u00fcr Technologie;Karlsruher Institut f\u00fcr Technologie;Karlsruher Institut f\u00fcr Technologie;Karlsruhe Institute of Technology;Karlsruhe Institute of Technology", "aff_domain": "kit.edu;;kit.edu;kit.edu;kit.edu;kit.edu;kit.edu", "position": "Researcher;;Postdoc;PhD student;Principal Researcher;Full Professor;Principal Researcher", "bibtex": "@misc{\ncoquelin2024harnessing,\ntitle={Harnessing Orthogonality to Train Low-Rank Neural Networks},\nauthor={Daniel Coquelin and Katharina Fl{\\\"u}gel and Marie Weiel and Nicholas Kiefer and Charlotte Debus and Achim Streit and Markus G{\\\"o}tz},\nyear={2024},\nurl={https://openreview.net/forum?id=0tsJ7Nv5hk}\n}", "github": "", "project": "", "reviewers": "LcGV;uXNh;Mh5x;ViAF", "site": "https://openreview.net/forum?id=0tsJ7Nv5hk", "pdf_size": 615340, "rating": "3;3;5;6", "confidence": "4;4;4;1", "soundness": "2;2;3;3", "contribution": "2;2;2;3", "presentation": "3;3;3;3", "wc_summary": "67;37;95;80", "wc_strengths": "19;20;34;85", "wc_weaknesses": "113;147;187;53", 
"wc_questions": "8;159;133;24", "wc_review": "207;363;449;242", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "121;222;233;133", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 4.25, 1.299038105676658 ], "confidence_avg": [ 3.25, 1.299038105676658 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 69.75, 21.34683817336891 ], "wc_strengths_avg": [ 39.5, 26.93046601899046 ], "wc_weaknesses_avg": [ 125.0, 49.13247398615299 ], "wc_questions_avg": [ 81.0, 65.89005994837157 ], "wc_review_avg": [ 315.25, 96.50485739070339 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 177.25, 50.57852805291985 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.7777777777777778, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=2377516874846279502&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 6, "aff_unique_index": "0;0;0;0;1;1", "aff_unique_norm": "Karlsruher Institut f\u00fcr Technologie;Karlsruhe Institute of Technology", "aff_unique_dep": ";", "aff_unique_url": "https://www.kit.edu;https://www.kit.edu", "aff_unique_abbr": "KIT;KIT", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "Germany" }, { "id": "0u9uvPdRgV", "title": "Semi-supervised Diffusion Solver for Travelling Salesman Problem", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "We propose a semi-supervised diffusion solver for solving the Travelling Sales- man Problem (TSP). Data-driven combinatorial optimization models recently at- tract an amount of attention, since they have shown promising results in solving various NP-hard problems without too much expert knowledge. However, most of them rely on reinforcement learning (RL) and supervised learning (SL) which face some intractable challenges: RL methods often encounter sparse reward problems and SL methods pose a strict assumption that the optimal solution (label) is always available. To address these challenges in arbitrarily large-scale TSP, this article proposes a novel semi-supervised learning-based diffusion framework towards a more general situation, i.e., we can freely produce instances as many as possible but the acquisition of optimal solution is costly. This semi-supervised paradigm is made viable by modeling the generative process upon a special transition matrix, which facilitates the effective learning of the generative diffusion, compared with learning the heatmap directly like other solvers do. 
Comprehensive experiments validate our method across various scales TSP, showing that our method remarkably outperforms state-of-the-art data-driven solvers on large benchmark datasets for Traveling Salesman Problems, and has an outstanding generalization ability.", "keywords": "Travelling Salesman Problem;Semi-supervised Learning;Diffusion Model", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Ning Ma;Yishun Dou", "authorids": "~Ning_Ma2;~Yishun_Dou1", "gender": "F;M", "homepage": ";", "dblp": ";273/9779", "google_scholar": "https://scholar.google.com.tw/citations?view_op=list_works;https://scholar.google.com/citations?view_op=list_works", "orcid": ";0009-0008-8345-8258", "linkedin": ";", "or_profile": "~Ning_Ma2;~Yishun_Dou1", "aff": ";Huawei Technologies Ltd.", "aff_domain": ";huawei.com", "position": ";Researcher", "bibtex": "@misc{\nma2024semisupervised,\ntitle={Semi-supervised Diffusion Solver for Travelling Salesman Problem},\nauthor={Ning Ma and Yishun Dou},\nyear={2024},\nurl={https://openreview.net/forum?id=0u9uvPdRgV}\n}", "github": "", "project": "", "reviewers": "FvPj;9n2o;JPUZ;r8xE", "site": "https://openreview.net/forum?id=0u9uvPdRgV", "pdf_size": 317157, "rating": "3;3;5;6", "confidence": "3;5;5;3", "soundness": "2;2;2;4", "contribution": "2;2;2;2", "presentation": "3;2;3;2", "wc_summary": "64;45;103;111", "wc_strengths": "35;61;180;152", "wc_weaknesses": "329;312;41;161", "wc_questions": "128;62;90;68", "wc_review": "556;480;414;492", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.25, 1.299038105676658 ], "confidence_avg": [ 4.0, 1.0 ], "soundness_avg": [ 2.5, 0.8660254037844386 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 80.75, 27.24311839712921 ], "wc_strengths_avg": [ 107.0, 60.52685354452187 ], "wc_weaknesses_avg": [ 210.75, 117.81845144118981 ], "wc_questions_avg": [ 87.0, 25.865034312755125 ], "wc_review_avg": [ 485.5, 50.386009963084 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.19245008972987526, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=7016110411812515437&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 0, "aff_unique_index": "0", "aff_unique_norm": "Huawei", "aff_unique_dep": "Huawei Technologies", "aff_unique_url": "https://www.huawei.com", "aff_unique_abbr": "Huawei", "aff_country_unique_index": "0", "aff_country_unique": "China" }, { "title": "Linear attention is (maybe) all you need (to understand Transformer optimization)", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19602", "id": "0uI5415ry7", "author_site": "Kwangjun Ahn, Xiang Cheng, Minhak Song, Chulhee Yun, Ali Jadbabaie, Suvrit Sra", "tldr": "", "abstract": "Transformer training is notoriously difficult, requiring a careful design of optimizers and use of various heuristics. We make progress towards understanding the subtleties of training Transformers by carefully studying a simple yet canonical linearized *shallow* Transformer model. Specifically, we train linear Transformers to solve regression tasks, inspired by J. von Oswald et al. (ICML 2023), and K. Ahn et al. (NeurIPS 2023). 
Most importantly, we observe that our proposed linearized models can reproduce several prominent aspects of Transformer training dynamics. Consequently, the results obtained in this paper suggest that a simple linearized Transformer model could actually be a valuable, realistic abstraction for understanding Transformer optimization.", "keywords": "Transformer;optimization;adam;clipping;heavy-tailed noise;directional smoothness", "primary_area": "optimization", "supplementary_material": "", "author": "Kwangjun Ahn;Xiang Cheng;Minhak Song;Chulhee Yun;Ali Jadbabaie;Suvrit Sra", "authorids": "~Kwangjun_Ahn2;~Xiang_Cheng1;~Minhak_Song1;~Chulhee_Yun1;~Ali_Jadbabaie1;~Suvrit_Sra1", "gender": ";M;M;M;M;", "homepage": "http://kjahn.mit.edu/;https://sites.google.com/berkeley.edu/xiangcheng/home;https://songminhak.github.io;https://chulheeyun.github.io/;http://www.mit.edu/~jadbabai/www;https://optml.mit.edu", "dblp": ";29/1059-6;;138/0148.html;83/3158;90/930", "google_scholar": "z94iNtgAAAAJ;-WJinlEAAAAJ;https://scholar.google.com/citations?hl=en;Ukl64ggAAAAJ;ZBc_WwYAAAAJ;eyCw9goAAAAJ", "orcid": ";;;;;", "linkedin": ";;;;;", "or_profile": "~Kwangjun_Ahn2;~Xiang_Cheng1;~Minhak_Song1;~Chulhee_Yun1;~Ali_Jadbabaie1;~Suvrit_Sra1", "aff": "Massachusetts Institute of Technology;;Korea Advanced Institute of Science & Technology;Korea Advanced Institute of Science & Technology;Massachusetts Institute of Technology;Massachusetts Institute of Technology", "aff_domain": "mit.edu;;kaist.ac.kr;kaist.ac.kr;mit.edu;mit.edu", "position": "PhD student;;Undergrad student;Assistant Professor;Full Professor;Associate Professor", "bibtex": "@inproceedings{\nahn2024linear,\ntitle={Linear attention is (maybe) all you need (to understand Transformer optimization)},\nauthor={Kwangjun Ahn and Xiang Cheng and Minhak Song and Chulhee Yun and Ali Jadbabaie and Suvrit Sra},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=0uI5415ry7}\n}", "github": "", "project": "", "reviewers": "gJVN;bjjH;GNbE;dN4V", "pdf_size": 3520901, "rating": "6;6;6;8", "confidence": "4;3;4;3", "soundness": "3;3;3;3", "contribution": "3;3;3;3", "presentation": "3;3;3;3", "wc_summary": "80;83;134;77", "wc_strengths": "57;78;45;92", "wc_weaknesses": "187;99;49;134", "wc_questions": "24;100;117;48", "wc_review": "348;360;345;351", "wc_reply_reviewers": "21;123;0;0", "wc_reply_authors": "135;697;286;183", "reply_reviewers": "1;1;0;0", "reply_authors": "1;2;1;1", "rating_avg": [ 6.5, 0.8660254037844386 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 93.5, 23.47871376374779 ], "wc_strengths_avg": [ 68.0, 18.207141456033124 ], "wc_weaknesses_avg": [ 117.25, 50.34071413875652 ], "wc_questions_avg": [ 72.25, 37.71190130449538 ], "wc_review_avg": [ 351.0, 5.612486080160912 ], "wc_reply_reviewers_avg": [ 36.0, 50.95586325438909 ], "wc_reply_authors_avg": [ 325.25, 221.4547075589047 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 54, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=13865784961911745848&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=0uI5415ry7", "pdf": "https://openreview.net/pdf?id=0uI5415ry7", "email": 
"mit.edu;;kaist.ac.kr;kaist.ac.kr;mit.edu;mit.edu", "author_num": 6, "aff_unique_index": "0;1;1;0;0", "aff_unique_norm": "Massachusetts Institute of Technology;Korea Advanced Institute of Science and Technology", "aff_unique_dep": ";", "aff_unique_url": "https://web.mit.edu;https://www.kaist.ac.kr", "aff_unique_abbr": "MIT;KAIST", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;1;0;0", "aff_country_unique": "United States;South Korea" }, { "id": "0uUASYeXav", "title": "Graphical Object-Centric Actor-Critic", "track": "main", "status": "Reject", "tldr": "", "abstract": "There have recently been significant advances in the problem of unsupervised object-centric representation learning and its application to downstream tasks. The latest works support the argument that employing disentangled object representations in image-based object-centric reinforcement learning tasks facilitates policy learning. We propose a novel object-centric reinforcement learning algorithm combining actor-critic and model-based approaches to utilize these representations effectively.\nIn our approach, we use a transformer encoder to extract object representations and graph neural networks to approximate the dynamics of an environment. The proposed method fills a research gap in developing efficient object-centric world models for reinforcement learning settings that can be used for environments with discrete or continuous action spaces. Our algorithm performs better in a visually complex 3D robotic environment and a 2D environment with compositional structure than the state-of-the-art model-free actor-critic algorithm built upon transformer architecture and the state-of-the-art monolithic model-based algorithm.", "keywords": "Reinforcement Learning;World Model;Actor-critic;Object-centric Representation;Graph Neural Network", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/f2a25ac4327a0679800f55abd7420aaccb29bc8c.zip", "author": "Leonid Anatolievich Ugadiarov;Vitaliy Vorobyov;Aleksandr Panov", "authorids": "~Leonid_Anatolievich_Ugadiarov1;~Vitaliy_Vorobyov1;~Aleksandr_Panov1", "gender": "M;M;M", "homepage": "https://github.com/ugadiarov-la-phystech-edu;https://v3code.github.io/personal_page;http://grafft.github.io", "dblp": ";;177/9975", "google_scholar": ";;https://scholar.google.ru/citations?hl=ru", "orcid": ";;0000-0002-9747-3837", "linkedin": ";;", "or_profile": "~Leonid_Anatolievich_Ugadiarov1;~Vitaliy_Vorobyov1;~Aleksandr_Panov1", "aff": "Federal Research Center \u00abComputer Science and Control\u00bb of Russian Academy of Sciences;Moscow Institute of Physics and Technology;Federal Research Center \u00abComputer Science and Control\u00bb of Russian Academy of Sciences", "aff_domain": "frccsc.ru;phystech.edu;frccsc.ru", "position": "Researcher;MS student;Principal Researcher", "bibtex": "@misc{\nugadiarov2024graphical,\ntitle={Graphical Object-Centric Actor-Critic},\nauthor={Leonid Anatolievich Ugadiarov and Vitaliy Vorobyov and Aleksandr Panov},\nyear={2024},\nurl={https://openreview.net/forum?id=0uUASYeXav}\n}", "github": "", "project": "", "reviewers": "aEan;rSLu;6gyQ;HvnL", "site": "https://openreview.net/forum?id=0uUASYeXav", "pdf_size": 10261470, "rating": "3;5;5;6", "confidence": "4;4;4;3", "soundness": "2;2;2;2", "contribution": "1;2;2;2", "presentation": "2;2;2;2", "wc_summary": "59;50;75;115", "wc_strengths": "36;18;43;152", "wc_weaknesses": "200;120;111;512", "wc_questions": "128;105;44;11", "wc_review": "423;293;273;790", 
"wc_reply_reviewers": "184;98;26;47", "wc_reply_authors": "1064;641;937;611", "reply_reviewers": "1;1;1;1", "reply_authors": "3;2;3;3", "rating_avg": [ 4.75, 1.0897247358851685 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 2.0, 0.0 ], "wc_summary_avg": [ 74.75, 24.903564001965663 ], "wc_strengths_avg": [ 62.25, 52.613567641816495 ], "wc_weaknesses_avg": [ 235.75, 163.21209360828627 ], "wc_questions_avg": [ 72.0, 46.71723450719231 ], "wc_review_avg": [ 444.75, 207.48298122978665 ], "wc_reply_reviewers_avg": [ 88.75, 60.90720400740786 ], "wc_reply_authors_avg": [ 813.25, 192.85016852468655 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 2.75, 0.4330127018922193 ], "replies_avg": [ 21, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.6622661785325219, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14845202733643043297&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "aff_unique_index": "0;1;0", "aff_unique_norm": "Russian Academy of Sciences;Moscow Institute of Physics and Technology", "aff_unique_dep": "Computer Science and Control;", "aff_unique_url": "https://www.ras.ru;https://www.mipt.ru/en", "aff_unique_abbr": "RAS;MIPT", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "Russian Federation" }, { "id": "0unbjYPmbC", "title": "ChatSearch: a Dataset and a Generative Retrieval Model for General Conversational Image Retrieval", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "In this paper, we investigate the task of general conversational image retrieval on open-domain images.\nThe objective is to search for images based on interactive conversations between humans and computers. To advance this task, we curate a dataset called ChatSearch. This dataset includes a multimodal conversational context query for each target image, thereby requiring the retrieval system to infer the underlying retrieval intention from the multimodal dialogue conducted over multiple rounds. \nSimultaneously, we propose a generative retrieval model named ChatSearcher, which is trained end-to-end to accept and produce interleaved image-text inputs/outputs. ChatSearcher exhibits strong capability in reasoning with multimodal context and can leverage world knowledge to yield more sophisticated retrieval results. It demonstrates superior performance on the ChatSearch dataset and also achieves competitive results on other image retrieval tasks, such as zero-shot text-to-image retrieval and zero-shot composed image retrieval. 
With the availability of the ChatSearch dataset and the effectiveness of the ChatSearcher model, we anticipate that this work will inspire further research on interactive multimodal retrieval systems.", "keywords": "Image Retrieval; Multimodal Learning; Conversational Image Retrieval; Human-computer Interaction", "primary_area": "datasets and benchmarks", "supplementary_material": "", "author": "Zijia Zhao;Longteng Guo;Tongtian Yue;Erdong Hu;Shuai Shao;Zehuan Yuan;Jing Liu", "authorids": "~Zijia_Zhao1;~Longteng_Guo1;~Tongtian_Yue1;~Erdong_Hu2;~Shuai_Shao3;~Zehuan_Yuan1;~Jing_Liu1", "gender": "M;M;M;M;M;F;", "homepage": "https://ltguo19.github.io/;;https://github.com/Hedone00;http://www.sshao.com;https://shallowyuan.github.io/;http://www.nlpr.ia.ac.cn/iva/liujing/;https://blog.csdn.net/JoeCucu?type=blog", "dblp": "207/1905;348/6568;;71/8201-5;227/3298;72/2590-1.html;296/3659", "google_scholar": "OaGRHWYAAAAJ;OrICiVQAAAAJ;https://scholar.google.com/citations?hl=en;uL9iyKgAAAAJ;;sOI-S7oAAAAJ;", "orcid": ";0000-0001-5774-4084;;0000-0001-8560-4572;;;", "linkedin": ";;;shuai-shao-b7a047a2/;;;", "or_profile": "~Longteng_Guo1;~Tongtian_Yue1;~Erdong_Hu2;~Shuai_Shao3;~Zehuan_Yuan1;~Jing_Liu1;~Joe_Z1", "aff": "Institute of Automation, Chinese Academy of Sciences;, Institute of automation, Chinese academy of science;Institute of Automation,Chinese Academy of Sciences;ByteDance Inc.;ByteDance Inc.;Institute of automation, Chinese academy of science;Institute of Automation, Chinese Academy of Sciences", "aff_domain": "ia.ac.cn;nlpr.ia.ac.cn;ia.ac.cn;bytedance.com;bytedance.com;nlpr.ia.ac.cn;ia.ac.cn", "position": "Associate Professor;PhD student;MS student;Researcher;Researcher;Full Professor;PhD student", "bibtex": "@misc{\nzhao2024chatsearch,\ntitle={ChatSearch: a Dataset and a Generative Retrieval Model for General Conversational Image Retrieval},\nauthor={Zijia Zhao and Longteng Guo and Tongtian Yue and Erdong Hu and Shuai Shao and Zehuan Yuan and Jing Liu},\nyear={2024},\nurl={https://openreview.net/forum?id=0unbjYPmbC}\n}", "github": "", "project": "", "reviewers": "nix8;Lx3N;fGPE;DUdh", "site": "https://openreview.net/forum?id=0unbjYPmbC", "pdf_size": 18734609, "rating": "5;5;5;6", "confidence": "3;3;4;3", "soundness": "3;3;3;3", "contribution": "2;2;3;3", "presentation": "1;3;4;2", "wc_summary": "64;52;63;63", "wc_strengths": "30;36;58;102", "wc_weaknesses": "176;168;186;87", "wc_questions": "41;23;135;22", "wc_review": "311;279;442;274", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "546;751;1030;374", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;2;1", "rating_avg": [ 5.25, 0.4330127018922193 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.5, 1.118033988749895 ], "wc_summary_avg": [ 60.5, 4.924428900898052 ], "wc_strengths_avg": [ 56.5, 28.26216552212516 ], "wc_weaknesses_avg": [ 154.25, 39.347013863824536 ], "wc_questions_avg": [ 55.25, 46.66034183329565 ], "wc_review_avg": [ 326.5, 68.17807565486136 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 675.25, 244.45999161416987 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.3333333333333333, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=15039888198124627695&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 5, "aff_unique_index": "0;0;0;1;1;0;0", "aff_unique_norm": "Chinese 
Academy of Sciences;ByteDance", "aff_unique_dep": "Institute of Automation;", "aff_unique_url": "http://www.ia.cas.cn;https://www.bytedance.com", "aff_unique_abbr": "CAS;ByteDance", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0;0", "aff_country_unique": "China" }, { "id": "0upMDCx8AA", "title": "Post-Training Recovery from Injected Bias with Self-Influence", "track": "main", "status": "Reject", "tldr": "", "abstract": "Learning generalized models from biased data with strong spurious correlations to the class label is an important undertaking toward fairness in deep learning. In the absence of any prior knowledge or supervision of bias, recent studies tackle the problem by presuming the bias severity to be sufficiently high and employing a bias-amplified model trained by empirical risk minimization (ERM) to identify and utilize bias-conflicting samples that are free of spurious correlations. However, insufficient preciseness in detecting bias-conflicting samples results in injecting erroneous signals during training; conversely, it leads to learning malignant biases instead of excluding them. In practice, as the presumption about the magnitude of bias often does not hold, it is important for the model to demonstrate robust performance across a wide spectrum of biases. In this paper, we propose SePT (Self-influence-based Post-Training), a fine-tuning framework leveraging the self-influence score to filter bias-conflicting samples, which yields a pivotal subset with significantly diminished spurious correlations. Our method enables the quick recovery of a biased model from learned bias through fine-tuning with minimal friction. In addition, SePT also utilizes the remaining training dataset to adjust the model, thereby maintaining robust performance in situations with weak spurious correlation or even in the absence of it. 
Experiments on diverse benchmark datasets with a wide range of bias strengths show that SePT is capable of boosting the performance of both bias-injected and state-of-the-art debiased models.", "keywords": "Deep learning;dataset bias;debiasing", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/b22796957ae69f570f80da38d113b2742baef045.zip", "author": "Yeonsung Jung;Jaeyun Song;June Yong Yang;Jin-Hwa Kim;Sung-Yub Kim;Eunho Yang", "authorids": "~Yeonsung_Jung1;~Jaeyun_Song2;~June_Yong_Yang1;~Jin-Hwa_Kim1;~Sung-Yub_Kim1;~Eunho_Yang1", "gender": ";M;;Unspecified;M;M", "homepage": "https://yeonsungjung.github.io/;;http://mli.kaist.ac.kr/people/;http://wityworks.com;https://sites.google.com/site/hleehome2/;https://sungyubkim.github.io", "dblp": "264/2809;289/2048;277/5624;48/258;96/2621;236/4532", "google_scholar": "https://scholar.google.com/citations?hl=ko;;nkLNWg0AAAAJ;https://scholar.google.co.kr/citations?user=3f2wPekAAAAJ;;m2rhgrkAAAAJ", "orcid": ";;;0000-0002-0423-0415;;", "linkedin": "yeonsung-jung-a50015213/;jaeyun-song-9a4111213/;;;;", "or_profile": "~Yeonsung_Jung1;~Jaeyun_Song2;~June_Yong_Yang1;~Jin-Hwa_Kim1;~Eunho_Yang1;~SungYub_Kim1", "aff": "Korea Advanced Institute of Science & Technology;Korea Advanced Institute of Science & Technology;Korea Advanced Institute of Science & Technology;NAVER;Korea Advanced Institute of Science & Technology;Korea Advanced Institute of Science & Technology", "aff_domain": "kaist.ac.kr;kaist.ac.kr;kaist.ac.kr;navercorp.com;kaist.ac.kr;kaist.ac.kr", "position": "PhD student;PhD student;PhD student;Research Scientist;Associate Professor;PhD student", "bibtex": "@misc{\njung2024posttraining,\ntitle={Post-Training Recovery from Injected Bias with Self-Influence},\nauthor={Yeonsung Jung and Jaeyun Song and June Yong Yang and Jin-Hwa Kim and Sung-Yub Kim and Eunho Yang},\nyear={2024},\nurl={https://openreview.net/forum?id=0upMDCx8AA}\n}", "github": "", "project": "", "reviewers": "coZv;pbA4;dWNy", "site": "https://openreview.net/forum?id=0upMDCx8AA", "pdf_size": 10904349, "rating": "3;3;5", "confidence": "2;3;4", "soundness": "2;1;2", "contribution": "2;2;3", "presentation": "3;2;2", "wc_summary": "93;96;148", "wc_strengths": "49;69;40", "wc_weaknesses": "85;207;56", "wc_questions": "8;21;363", "wc_review": "235;393;607", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "386;599;618", "reply_reviewers": "0;0;0", "reply_authors": "1;1;1", "rating_avg": [ 3.6666666666666665, 0.9428090415820634 ], "confidence_avg": [ 3.0, 0.816496580927726 ], "soundness_avg": [ 1.6666666666666667, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 112.33333333333333, 25.249862485874168 ], "wc_strengths_avg": [ 52.666666666666664, 12.119772641798562 ], "wc_weaknesses_avg": [ 116.0, 65.42680388546171 ], "wc_questions_avg": [ 130.66666666666666, 164.37017842527138 ], "wc_review_avg": [ 411.6666666666667, 152.44088107270377 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 534.3333333333334, 105.17393001859136 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 9, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.8660254037844387, "gs_citation": 0, "gs_cited_by_link": 
"https://scholar.google.com/scholar?q=related:8X31mcmToDEJ:scholar.google.com/&scioq=Post-Training+Recovery+from+Injected+Bias+with+Self-Influence&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;0;1;0;0", "aff_unique_norm": "Korea Advanced Institute of Science and Technology;NAVER Corporation", "aff_unique_dep": ";", "aff_unique_url": "https://www.kaist.ac.kr;https://www.naver.com", "aff_unique_abbr": "KAIST;NAVER", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "South Korea" }, { "title": "LipSim: A Provably Robust Perceptual Similarity Metric", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19601", "id": "0w42S2Gp70", "author_site": "Sara Ghazanfari, Alexandre Araujo, Prashanth Krishnamurthy, Farshad Khorrami, Siddharth Garg", "tldr": "", "abstract": "Recent years have seen growing interest in developing and applying perceptual similarity metrics. Research has shown the superiority of perceptual metrics over pixel-wise metrics in aligning with human perception and serving as a proxy for the human visual system.\nOn the other hand, as perceptual metrics rely on neural networks, there is a growing concern regarding their resilience, given the established vulnerability of neural networks to adversarial attacks. It is indeed logical to infer that perceptual metrics may inherit both the strengths and shortcomings of neural networks.\nIn this work, we demonstrate the vulnerability of state-of-the-art perceptual similarity metrics based on an ensemble of ViT-based feature extractors to adversarial attacks. We then propose a framework to train a robust perceptual similarity metric called LipSim (Lipschitz Similarity Metric) with provable guarantees. \nBy leveraging 1-Lipschitz neural networks as the backbone, LipSim provides guarded areas around each data point and certificates for all perturbations within an $\\ell_2$ ball. 
Finally, a comprehensive set of experiments shows the performance of LipSim in terms of natural and certified scores and on the image retrieval application.", "keywords": "Perceptual similarity metric;certified defense;deep learning", "primary_area": "metric learning, kernel learning, and sparse coding", "supplementary_material": "/attachment/ac1c68fa813678f31bc42d9bafc10c7a84a43cd6.zip", "author": "Sara Ghazanfari;Alexandre Araujo;Prashanth Krishnamurthy;Farshad Khorrami;Siddharth Garg", "authorids": "~Sara_Ghazanfari1;~Alexandre_Araujo3;~Prashanth_Krishnamurthy1;~Farshad_Khorrami1;~Siddharth_Garg1", "gender": "F;;M;M;M", "homepage": "https://saraghazanfari.github.io/;;https://engineering.nyu.edu/faculty/farshad-khorrami;http://engineering.nyu.edu/people/siddharth-garg/;https://alexandrearaujo.com/", "dblp": "236/6982;24/3420;94/5644;94/3807;228/6599", "google_scholar": "0dMW47QAAAAJ;W-_zgGgAAAAJ;NdOqlPQAAAAJ;https://scholar.google.com.tw/citations?user=Yf8OqQQAAAAJ;https://scholar.google.fr/citations?user=wsu61VYAAAAJ", "orcid": ";;;;", "linkedin": "sara-ghazanfari-1a8b37163/;;;;", "or_profile": "~Sara_Ghazanfari1;~Prashanth_Krishnamurthy1;~Farshad_Khorrami1;~Siddharth_Garg1;~Alexandre_ARAUJO1", "aff": "New York University;New York University;New York University;New York University;New York University", "aff_domain": "nyu.edu;nyu.edu;nyu.edu;nyu.edu;nyu.edu", "position": "PhD student;Research Scientist and Adjunct Faculty;Full Professor;Associate Professor;Postdoc", "bibtex": "@inproceedings{\nghazanfari2024lipsim,\ntitle={LipSim: A Provably Robust Perceptual Similarity Metric},\nauthor={Sara Ghazanfari and Alexandre Araujo and Prashanth Krishnamurthy and Farshad Khorrami and Siddharth Garg},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=0w42S2Gp70}\n}", "github": "", "project": "", "reviewers": "YdcH;KFDY;sTNV", "pdf_size": 36179352, "rating": "5;5;6", "confidence": "2;2;3", "soundness": "3;2;3", "contribution": "3;2;3", "presentation": "3;2;3", "wc_summary": "101;38;67", "wc_strengths": "76;24;60", "wc_weaknesses": "57;65;71", "wc_questions": "1;2;211", "wc_review": "235;129;409", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "376;1105;1711", "reply_reviewers": "0;0;0", "reply_authors": "1;2;3", "rating_avg": [ 5.333333333333333, 0.4714045207910317 ], "confidence_avg": [ 2.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 68.66666666666667, 25.746628689770024 ], "wc_strengths_avg": [ 53.333333333333336, 21.74600857373345 ], "wc_weaknesses_avg": [ 64.33333333333333, 5.734883511361751 ], "wc_questions_avg": [ 71.33333333333333, 98.76009090495795 ], "wc_review_avg": [ 257.6666666666667, 115.42770705318354 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 1064.0, 545.782007765005 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 2.0, 0.816496580927726 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.9999999999999997, "gs_citation": 8, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=13175108423726794276&as_sdt=5,31&sciodt=0,31&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=0w42S2Gp70", "pdf": "https://openreview.net/pdf?id=0w42S2Gp70", "email": "nyu.edu;nyu.edu;nyu.edu;nyu.edu;nyu.edu", "author_num": 5, 
"aff_unique_index": "0;0;0;0;0", "aff_unique_norm": "New York University", "aff_unique_dep": "", "aff_unique_url": "https://www.nyu.edu", "aff_unique_abbr": "NYU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "0xLWPdObG1", "title": "Subject-specific Deep Neural Networks for Count Data with High-cardinality Categorical Features", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "There is a growing interest in subject-specific predictions using deep neural networks (DNNs) because real-world data often exhibit correlations, which has been typically overlooked in traditional DNN frameworks. In this paper, we propose a novel hierarchical likelihood learning framework for introducing gamma random effects into the Poisson DNN, so as to improve the prediction performance by capturing both nonlinear effects of input variables and subject-specific cluster effects. The proposed method simultaneously yields maximum likelihood estimators for fixed parameters and best unbiased predictors for random effects by optimizing a single objective function. This approach enables a fast end-to-end algorithm for handling clustered count data, which often involve high-cardinality categorical features. Furthermore, state-of-the-art network architectures can be easily implemented into the proposed h-likelihood framework. As an example, we introduce multi-head attention layer and a sparsemax function, which allows feature selection in high-dimensional settings. To enhance practical performance and learning efficiency, we present an adjustment procedure for prediction of random parameters and a method-of-moments estimator for pretraining of variance component. Various experiential studies and real data analyses confirm the advantages of our proposed methods.", "keywords": "subject-specific prediction;random effect;high-cardinality categorical feature;count data;clustered data;hierarchical likelihood;deep learning", "primary_area": "learning theory", "supplementary_material": "/attachment/0cd785bb937afe682c53cc975c89f7e8433e7e6b.zip", "author": "Hangbin Lee;IL DO HA;Changha Hwang;Youngjo Lee", "authorids": "~Hangbin_Lee1;~IL_DO_HA1;~Changha_Hwang1;~Youngjo_Lee2", "gender": "M;M;M;M", "homepage": ";https://stat-eng.pknu.ac.kr/stat-eng/2348;https://www.dankook.ac.kr/web/kor/-167?p_p_id=DeptInfo_WAR_empInfoportlet&p_p_lifecycle=0&p_p_state=normal&p_p_mode=view&p_p_col_id=column-2&p_p_col_count=1&_DeptInfo_WAR_empInfoportlet_empId=JIeao4QTeONm1350kqqKBw%3D%3D&_DeptInfo_WAR_empInfoportlet_action=view_message;", "dblp": "321/6052;;;", "google_scholar": "https://scholar.google.co.kr/citations?user=Bow6RRIAAAAJ;;;yEoD89QAAAAJ", "orcid": "0000-0002-3447-4306;;;0000-0001-9820-6434", "linkedin": "hangbin-lee-b415b1172/;;;", "or_profile": "~Hangbin_Lee1;~IL_DO_HA1;~Changha_Hwang1;~Youngjo_Lee2", "aff": "Seoul National University;;;Seoul National University", "aff_domain": "snu.ac.kr;;;snu.ac.kr", "position": "Postdoc;;;Emeritus", "bibtex": "@misc{\nlee2024subjectspecific,\ntitle={Subject-specific Deep Neural Networks for Count Data with High-cardinality Categorical Features},\nauthor={Hangbin Lee and IL DO HA and Changha Hwang and Youngjo Lee},\nyear={2024},\nurl={https://openreview.net/forum?id=0xLWPdObG1}\n}", "github": "", "project": "", "reviewers": "HXxH;ZRFo;z2gb", "site": "https://openreview.net/forum?id=0xLWPdObG1", "pdf_size": 690080, "rating": "3;6;6", "confidence": "3;2;3", "soundness": "2;4;3", 
"contribution": "2;3;3", "presentation": "2;3;2", "wc_summary": "66;53;72", "wc_strengths": "38;51;140", "wc_weaknesses": "574;53;258", "wc_questions": "128;106;119", "wc_review": "806;263;589", "wc_reply_reviewers": "376;47;35", "wc_reply_authors": "2441;903;1101", "reply_reviewers": "2;1;1", "reply_authors": "5;2;2", "rating_avg": [ 5.0, 1.4142135623730951 ], "confidence_avg": [ 2.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 3.0, 0.816496580927726 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 63.666666666666664, 7.93025150224688 ], "wc_strengths_avg": [ 76.33333333333333, 45.330882286680556 ], "wc_weaknesses_avg": [ 295.0, 214.30041219434614 ], "wc_questions_avg": [ 117.66666666666667, 9.030811456096044 ], "wc_review_avg": [ 552.6666666666666, 223.16262132255832 ], "wc_reply_reviewers_avg": [ 152.66666666666666, 157.99648378647194 ], "wc_reply_authors_avg": [ 1481.6666666666667, 683.1502193677627 ], "reply_reviewers_avg": [ 1.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 3.0, 1.4142135623730951 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.5, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=929589920201687781&as_sdt=805&sciodt=0,3&hl=en", "gs_version_total": 4, "aff_unique_index": "0;0", "aff_unique_norm": "Seoul National University", "aff_unique_dep": "", "aff_unique_url": "https://www.snu.ac.kr", "aff_unique_abbr": "SNU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "South Korea" }, { "id": "0xT87opqKV", "title": "ProteinAdapter: Adapting Pre-trained Large Protein Models for Efficient Protein Representation Learning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "The study of proteins is crucial in various scientific disciplines, but understanding their intricate multi-level relationships remains challenging. Recent advancements in Large Protein Models (LPMs) have demonstrated their ability in sequence and structure understanding, suggesting the potential of directly using them for efficient protein representation learning. In this work, we introduce ProteinAdapter, to efficiently transfer the general reference from the multiple Large Protein Models (LPMs), e.g., ESM-1b, to the task-specific knowledge. ProteinAdapter could largely save labor-intensive analysis on the 3D position and the amino acid order. We observe that such a simple yet effective approach works well on multiple downstream tasks. Specifically, (1) with limited extra parameters, ProteinAdapter enables multi-level protein representation learning by integrating both sequence and geometric structure embeddings from LPMs. (2) Based on the learned embedding, we further scale the proposed ProteinAdapter to multiple conventional protein tasks. Considering different task priors, we propose a unified multi-scale predictor to fully take advantage of the learned embeddings via task-specific focus. Extensive experiments on over 20 tasks show that ProteinAdapter outperforms state-of-the-art methods under both single-task and multi-task settings. 
We hope that the proposed method could accelerate the study of protein analysis in the future.", "keywords": "Pretrained Large Models;Parameter-Efficient Fine-tuning;Protein Representation Learning", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Chao Wang;Zhedong Zheng;Yifan Sun;Hehe Fan;Yi Yang", "authorids": "~Chao_Wang31;~Zhedong_Zheng1;~Yifan_Sun2;~Hehe_Fan1;~Yi_Yang22", "gender": "M;M;M;M;M", "homepage": ";http://zdzheng.xyz;https://yifansun-reid.github.io;https://hehefan.github.io;https://person.zju.edu.cn/yiyang", "dblp": ";190/7710;99/10261-3.html;184/5722.html;33/4854-1.html", "google_scholar": "https://scholar.google.com/citations?hl=zh-CN;XT17oUEAAAAJ;uUZEL7UAAAAJ;hVuflMQAAAAJ;RMSuNFwAAAAJ", "orcid": "0000-0003-1297-768X;0000-0002-2434-9050;0000-0003-3532-6521;0000-0001-9572-2345;", "linkedin": ";zhedongzheng;;;", "or_profile": "~Chao_Wang31;~Zhedong_Zheng1;~Yifan_Sun2;~Hehe_Fan1;~Yi_Yang22", "aff": "University of Technology Sydney;University of Macau;Baidu;Zhejiang University;Zhejiang University", "aff_domain": "uts.edu.au;um.edu.mo;baidu.com;zju.edu.cn;zju.edu.cn", "position": "PhD student;Assistant Professor;Senior Expert;Assistant Professor;Full Professor", "bibtex": "@misc{\nwang2024proteinadapter,\ntitle={ProteinAdapter: Adapting Pre-trained Large Protein Models for Efficient Protein Representation Learning},\nauthor={Chao Wang and Zhedong Zheng and Yifan Sun and Hehe Fan and Yi Yang},\nyear={2024},\nurl={https://openreview.net/forum?id=0xT87opqKV}\n}", "github": "", "project": "", "reviewers": "ZPKb;PNTU;XhEm;vd8N", "site": "https://openreview.net/forum?id=0xT87opqKV", "pdf_size": 970157, "rating": "3;3;5;5", "confidence": "3;3;4;5", "soundness": "1;3;3;2", "contribution": "2;2;2;3", "presentation": "1;3;3;3", "wc_summary": "87;47;56;114", "wc_strengths": "72;24;65;26", "wc_weaknesses": "525;60;62;242", "wc_questions": "110;56;28;22", "wc_review": "794;187;211;404", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 3.75, 0.82915619758885 ], "soundness_avg": [ 2.25, 0.82915619758885 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.5, 0.8660254037844386 ], "wc_summary_avg": [ 76.0, 26.485845276298054 ], "wc_strengths_avg": [ 46.75, 21.901769334919038 ], "wc_weaknesses_avg": [ 222.25, 189.77140854196134 ], "wc_questions_avg": [ 54.0, 34.785054261852174 ], "wc_review_avg": [ 399.0, 243.07303429216495 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.9045340337332909, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:NAGG0TncKEAJ:scholar.google.com/&scioq=ProteinAdapter:+Adapting+Pre-trained+Large+Protein+Models+for+Efficient+Protein+Representation+Learning&hl=en&as_sdt=0,5", "gs_version_total": 2, "aff_unique_index": "0;1;2;3;3", "aff_unique_norm": "University of Technology Sydney;University of Macau;Baidu;Zhejiang University", "aff_unique_dep": ";;Baidu, Inc.;", "aff_unique_url": "https://www.uts.edu.au;https://www.um.edu.mo;https://www.baidu.com;https://www.zju.edu.cn", "aff_unique_abbr": "UTS;UM;Baidu;ZJU", "aff_campus_unique_index": "1", "aff_campus_unique": ";Macau SAR", "aff_country_unique_index": "0;1;1;1;1", "aff_country_unique": 
"Australia;China" }, { "id": "0y0yOpI4wx", "title": "General-Purpose In-Context Learning by Meta-Learning Transformers", "track": "main", "status": "Reject", "tldr": "", "abstract": "Modern machine learning requires system designers to specify aspects of the learning pipeline, such as losses, architectures, and optimizers. Meta-learning, or learning-to-learn, instead aims to learn those aspects, and promises to unlock greater capabilities with less manual effort. One particularly ambitious goal of meta-learning is to train general-purpose in-context learning algorithms from scratch, using only black-box models with minimal inductive bias. Such a model takes in training data, and produces test-set predictions across a wide range of problems, without any explicit definition of an inference model, training loss, or optimization algorithm. In this paper we show that Transformers and other black-box models can be meta-trained to act as general-purpose in-context learners. We characterize transitions between algorithms that generalize, algorithms that memorize, and algorithms that fail to meta-train at all, induced by changes in model size, number of tasks, and meta-optimization. We further show that the capabilities of meta-trained algorithms are bottlenecked by the accessible state size (memory) determining the next prediction, unlike standard models which are thought to be bottlenecked by parameter count. Finally, we propose practical interventions such as biasing the training distribution that improve the meta-training and meta-generalization of general-purpose in-context learning algorithms.", "keywords": "general-purpose;in-context;in-context learning;transformers;black-box;generalization", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "", "author": "Louis Kirsch;James Harrison;Jascha Sohl-Dickstein;Luke Metz", "authorids": "~Louis_Kirsch1;~James_Harrison1;~Jascha_Sohl-Dickstein2;~Luke_Metz1", "gender": ";;M;M", "homepage": "http://louiskirsch.com;;http://lukemetz.com;http://sohldickstein.com", "dblp": "202/2379;;;51/7117", "google_scholar": "w8AkOEAAAAAJ;-tEiRFcAAAAJ;jCOmCb4AAAAJ;-3zYIjQAAAAJ", "orcid": ";;;", "linkedin": ";;;", "or_profile": "~Louis_Kirsch1;~James_Harrison1;~Luke_Metz1;~Jascha_Sohl-Dickstein1", "aff": "Scuola universitaria professionale della Svizzera italiana (SUPSI);Google;Google;Google", "aff_domain": "supsi.ch;google.com;google.com;google.com", "position": "PhD student;Researcher;Research Scientist;Research Scientist", "bibtex": "@misc{\nkirsch2024generalpurpose,\ntitle={General-Purpose In-Context Learning by Meta-Learning Transformers},\nauthor={Louis Kirsch and James Harrison and Jascha Sohl-Dickstein and Luke Metz},\nyear={2024},\nurl={https://openreview.net/forum?id=0y0yOpI4wx}\n}", "github": "", "project": "", "reviewers": "9s7H;j4eV;zaZF;ohZB", "site": "https://openreview.net/forum?id=0y0yOpI4wx", "pdf_size": 3489880, "rating": "1;3;5;6", "confidence": "1;4;2;3", "soundness": "1;2;3;3", "contribution": "1;1;2;2", "presentation": "1;1;3;2", "wc_summary": "88;58;223;60", "wc_strengths": "1;32;99;49", "wc_weaknesses": "1;193;130;119", "wc_questions": "1;9;52;9", "wc_review": "91;292;504;237", "wc_reply_reviewers": "10;0;42;0", "wc_reply_authors": "188;1022;792;405", "reply_reviewers": "1;0;1;0", "reply_authors": "1;2;2;1", "rating_avg": [ 3.75, 1.920286436967152 ], "confidence_avg": [ 2.5, 1.118033988749895 ], "soundness_avg": [ 2.25, 0.82915619758885 ], "contribution_avg": [ 1.5, 0.5 ], "presentation_avg": [ 
1.75, 0.82915619758885 ], "wc_summary_avg": [ 107.25, 67.87258282988795 ], "wc_strengths_avg": [ 45.25, 35.48503205578375 ], "wc_weaknesses_avg": [ 110.75, 69.3699322473361 ], "wc_questions_avg": [ 17.75, 20.04214309898021 ], "wc_review_avg": [ 281.0, 148.22786512663535 ], "wc_reply_reviewers_avg": [ 13.0, 17.233687939614086 ], "wc_reply_authors_avg": [ 601.75, 325.07874046144576 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.40755575681770734, "gs_citation": 83, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5000755914310791476&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 4, "aff_unique_index": "0;1;1;1", "aff_unique_norm": "Scuola universitaria professionale della Svizzera italiana;Google", "aff_unique_dep": ";Google", "aff_unique_url": "https://www.supsi.ch;https://www.google.com", "aff_unique_abbr": "SUPSI;Google", "aff_campus_unique_index": "1;1;1", "aff_campus_unique": ";Mountain View", "aff_country_unique_index": "0;1;1;1", "aff_country_unique": "Switzerland;United States" }, { "id": "0ypXhS83Lh", "title": "Robust Reinforcement Learning with Structured Adversarial Ensemble", "track": "main", "status": "Reject", "tldr": "", "abstract": "Although reinforcement learning (RL) is considered the gold standard for policy design, it may not always provide a robust solution in various scenarios. This can result in severe performance degradation when the environment is exposed to potential disturbances. Adversarial training using a two-player max-min game has been proven effective in enhancing the robustness of RL agents. However, we observe two severe problems pertaining to this approach: ($\\textit{i}$) the potential $\\textit{over-optimism}$ caused by the difficulty of the inner optimization problem, and ($\\textit{ii}$) the potential $\\textit{over-pessimism}$ caused by the selection of a candidate adversary set that may include unlikely scenarios. To this end, we extend the two-player game by introducing an adversarial ensemble, which involves a group of adversaries. We theoretically establish that an adversarial ensemble can efficiently and effectively obtain improved solutions to the inner optimization problem, alleviating the over-optimism. Then we address the over-pessimism by replacing the worst-case performance in the inner optimization with the average performance over the worst-$k$ adversaries. Our proposed algorithm significantly outperforms other robust RL algorithms that fail to address these two problems, corroborating the importance of the identified problems. 
Extensive experimental results demonstrate that the proposed algorithm consistently generates policies with enhanced robustness.", "keywords": "Reinforcement Learning;Robustness;Ensemble Methods", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/8a6e2b5cd3b459e26fbb53edb0cfd2a7d8d36d77.zip", "author": "Juncheng Dong;Hao-Lun Hsu;Qitong Gao;Vahid Tarokh;Miroslav Pajic", "authorids": "~Juncheng_Dong1;~Hao-Lun_Hsu1;~Qitong_Gao1;~Vahid_Tarokh1;~Miroslav_Pajic2", "gender": ";M;M;;M", "homepage": ";https://hlhsu.github.io/;http://qitonggao.com;;http://people.duke.edu/~mp275/", "dblp": ";303/0321;238/5422;;74/7446.html", "google_scholar": ";h9qf9vUAAAAJ;Flv4SrsAAAAJ;;Fbn21-8AAAAJ", "orcid": ";;;;", "linkedin": ";hlhsu/;qitong-gao;;", "or_profile": "~Juncheng_Dong1;~Hao-Lun_Hsu1;~Qitong_Gao1;~Vahid_Tarokh1;~Miroslav_Pajic2", "aff": ";Duke University;Duke University;;Duke University", "aff_domain": ";duke.edu;duke.edu;;duke.edu", "position": ";PhD student;PhD student;;Associate Professor", "bibtex": "@misc{\ndong2024robust,\ntitle={Robust Reinforcement Learning with Structured Adversarial Ensemble},\nauthor={Juncheng Dong and Hao-Lun Hsu and Qitong Gao and Vahid Tarokh and Miroslav Pajic},\nyear={2024},\nurl={https://openreview.net/forum?id=0ypXhS83Lh}\n}", "github": "", "project": "", "reviewers": "c2QC;APuc;1Lc9", "site": "https://openreview.net/forum?id=0ypXhS83Lh", "pdf_size": 1058130, "rating": "3;6;6", "confidence": "5;4;4", "soundness": "3;3;3", "contribution": "2;4;3", "presentation": "3;3;3", "wc_summary": "175;49;79", "wc_strengths": "6;64;77", "wc_weaknesses": "185;629;124", "wc_questions": "2;1;4", "wc_review": "368;743;284", "wc_reply_reviewers": "612;40;0", "wc_reply_authors": "2417;1437;453", "reply_reviewers": "2;1;0", "reply_authors": "5;4;2", "rating_avg": [ 5.0, 1.4142135623730951 ], "confidence_avg": [ 4.333333333333333, 0.4714045207910317 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 3.0, 0.816496580927726 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 101.0, 53.74011537017761 ], "wc_strengths_avg": [ 49.0, 30.865298745786774 ], "wc_weaknesses_avg": [ 312.6666666666667, 225.06344784428137 ], "wc_questions_avg": [ 2.3333333333333335, 1.247219128924647 ], "wc_review_avg": [ 465.0, 199.54448125668623 ], "wc_reply_reviewers_avg": [ 217.33333333333334, 279.5488428800154 ], "wc_reply_authors_avg": [ 1435.6666666666667, 801.8001967794443 ], "reply_reviewers_avg": [ 1.0, 0.816496580927726 ], "reply_authors_avg": [ 3.6666666666666665, 1.247219128924647 ], "replies_avg": [ 21, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -1.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:wpNqysSE94QJ:scholar.google.com/&scioq=Robust+Reinforcement+Learning+with+Structured+Adversarial+Ensemble&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;0", "aff_unique_norm": "Duke University", "aff_unique_dep": "", "aff_unique_url": "https://www.duke.edu", "aff_unique_abbr": "Duke", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "0zIKlb0prF", "title": "MPPN: Multi-Resolution Periodic Pattern Network For Long-Term Time Series Forecasting", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Long-term time series forecasting plays an important role in various real-world scenarios. 
Recent deep learning methods for long-term series forecasting tend to capture the intricate patterns of time series by Transformer-based or sampling-based methods. However, most of the extracted patterns are relatively simplistic and may include unpredictable noise. Moreover, the multivariate series forecasting methods usually ignore the individual characteristics of each variate, which may affect the prediction accuracy. To capture the intrinsic patterns of time series, we propose a novel deep learning network architecture, named Multi-resolution Periodic Pattern Network (MPPN), for long-term series forecasting. We first construct context-aware multi-resolution semantic units of time series and employ multi-periodic pattern mining to capture the key patterns of time series. Then, we propose a channel adaptive module to capture the multivariate perceptions towards different patterns. In addition, we adopt an entropy-based method for evaluating the predictability of time series and providing an upper bound on the prediction accuracy before forecasting. Our experimental evaluation on nine real-world benchmarks demonstrated that MPPN significantly outperforms the state-of-the-art Transformer-based, sampling-based and pre-trained methods for long-term series forecasting.", "keywords": "Long-term time series forecasting;Multi-resolution periodic pattern;Channel adaption;Multivariate time series prediction.", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/03b59cd489129bf92c72389d57e0357247186d74.zip", "author": "Xing Wang;Zhendong Wang;Kexin Yang;zhiyan song;Lin Zhu;Chao Deng;Junlan Feng", "authorids": "~Xing_Wang5;~Zhendong_Wang5;~Kexin_Yang4;~zhiyan_song1;~Lin_Zhu6;~Chao_Deng4;~Junlan_Feng3", "gender": "F;M;F;F;F;M;F", "homepage": "https://orcid.org/0000-0003-3148-8291;;;https://scholar.google.com/citations?authuser=1&user=teprBfAAAAAJ;;;", "dblp": "02/3674;153/2385;54/774;302/7504;;;36/3948", "google_scholar": ";;;https://scholar.google.com/citations?authuser=1;;https://scholar.google.com/citations?hl=en;https://scholar.google.es/citations?user=rBjPtmQAAAAJ", "orcid": ";0000-0001-9530-2906;0009-0001-0031-7644;0000-0003-2138-3154;0000-0003-1167-1953;0000-0003-4449-5247;0000-0001-5292-2945", "linkedin": ";;;;;https://www.linkedin.cn/incareer/in/ACoAAB5sppAB_Da2tlvgSyM7NFTWl6d1DhZZe1o;junlan-feng-8968ba11/", "or_profile": "~Xing_Wang5;~Zhendong_Wang5;~Kexin_Yang4;~zhiyan_song1;~Lin_Zhu6;~Chao_Deng4;~Junlan_Feng3", "aff": "China Mobile Research Institute;China Mobile Research Institute;China Mobile Research Institute;China Mobile Research Institute;China Mobile research institute;China Mobile Research Institute;China Mobile", "aff_domain": "chinamobile.com;chinamobile.com;chinamobile.com;chinamobile.com;chinamobile.com;jiutian.10086.cn;ioa.ac.cn", "position": "Researcher;Researcher;Researcher;Employee;Full Professor;Researcher;Principal Researcher", "bibtex": "@misc{\nwang2024mppn,\ntitle={{MPPN}: Multi-Resolution Periodic Pattern Network For Long-Term Time Series Forecasting},\nauthor={Xing Wang and Zhendong Wang and Kexin Yang and zhiyan song and Lin Zhu and Chao Deng and Junlan Feng},\nyear={2024},\nurl={https://openreview.net/forum?id=0zIKlb0prF}\n}", "github": "", "project": "", "reviewers": "saoQ;pRbf;fdFp;FFSt;qZtm", "site": "https://openreview.net/forum?id=0zIKlb0prF", "pdf_size": 693698, "rating": "3;5;5;5;5", "confidence": "4;4;4;3;4", "soundness": "2;2;2;3;3", "contribution": "2;2;2;2;3", 
"presentation": "3;1;2;3;3", "wc_summary": "74;32;69;131;119", "wc_strengths": "118;28;34;249;36", "wc_weaknesses": "349;228;283;288;290", "wc_questions": "5;5;5;265;26", "wc_review": "546;293;391;933;471", "wc_reply_reviewers": "45;71;37;0;163", "wc_reply_authors": "705;697;708;1169;742", "reply_reviewers": "1;1;1;0;1", "reply_authors": "1;1;1;2;1", "rating_avg": [ 4.6, 0.7999999999999999 ], "confidence_avg": [ 3.8, 0.39999999999999997 ], "soundness_avg": [ 2.4, 0.4898979485566356 ], "contribution_avg": [ 2.2, 0.39999999999999997 ], "presentation_avg": [ 2.4, 0.8 ], "wc_summary_avg": [ 85.0, 35.93883693165375 ], "wc_strengths_avg": [ 93.0, 84.75376097849582 ], "wc_weaknesses_avg": [ 287.6, 38.338492406457505 ], "wc_questions_avg": [ 61.2, 102.22406761619301 ], "wc_review_avg": [ 526.8, 219.81119170779272 ], "wc_reply_reviewers_avg": [ 63.2, 54.83210738244519 ], "wc_reply_authors_avg": [ 804.2, 183.04906446087074 ], "reply_reviewers_avg": [ 0.8, 0.4 ], "reply_authors_avg": [ 1.2, 0.4 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.2500000000000001, "gs_citation": 8, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=2119790206527010367&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 3, "aff_unique_index": "0;0;0;0;0;0;0", "aff_unique_norm": "China Mobile", "aff_unique_dep": "Research Institute", "aff_unique_url": "https://www.chinamobile.com/", "aff_unique_abbr": "CMRI", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0;0", "aff_country_unique": "China" }, { "id": "10BTKkFfhl", "title": "Efficient Backdoor Mitigation in Federated Learning with Contrastive Loss", "track": "main", "status": "Reject", "tldr": "", "abstract": "Due to the data-driven nature of deep neural networks and privacy concerns around user data, a backdoor could be easily injected into deep neural networks in federated learning without attracting the attention of users. An affected global model operates normally as a clean model in regular tasks and behaves differently when the trigger is presented. In this paper, we propose a novel reverse engineering approach to detect and mitigate the backdoor attack in federated learning by adopting a self-supervised Contrastive learning loss. In contrast to existing reverse engineering techniques, such as Neural Cleanse, which involve iterating through each class in the dataset, we employ the contrastive loss as a whole to identify triggers in the backdoored model. Our method compares the last-layer feature outputs of a potentially affected model with these from a clean one preserved beforehand to reconstruct the trigger under the guidance of the contrastive loss. The reverse-engineered trigger is then applied to patch the affected global model to remove the backdoor. If the global model is free from backdoors, the Contrastive loss will lead to either a blank trigger or one with random pattern. We evaluated the proposed method on three datasets under two backdoor attacks and compared it against three existing defense methods. Our results showed that while many popular reverse engineering algorithms were successful in centralized learning settings, they had difficulties detecting backdoors in federated learning, including Neural Cleanse, TABOR, and DeepInspect. 
Our method successfully detected backdoors in federated learning and was more time-efficient.", "keywords": "Backdoor Defense; Federated Learning; Contrastive Loss", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Hal Ferguson;Rui Ning;Jiang Li;Hongyi Wu;Chunsheng Xin", "authorids": "~Hal_Ferguson1;~Rui_Ning2;~Jiang_Li3;~Hongyi_Wu1;~Chunsheng_Xin1", "gender": "M;;M;M;M", "homepage": ";https://www.lions.odu.edu/~rning/;https://fs.wp.odu.edu/jli/;http://www.u.arizona.edu/~mhwu/;https://ww1.odu.edu/eng/programs/ccni/people", "dblp": ";211/2892;41/3068-1;78/1033;06/6463", "google_scholar": ";oN4NttEAAAAJ;https://scholar.google.com/citations?hl=en;rFLksrwAAAAJ;TaP2oq8AAAAJ", "orcid": ";;;;", "linkedin": "hal-ferguson;;jiang-li-416b0a6/;hongyi-\u201cmichael\u201d-wu-4b51a715/;", "or_profile": "~Hal_Ferguson1;~Rui_Ning2;~Jiang_Li3;~Hongyi_Wu1;~Chunsheng_Xin1", "aff": "Old Dominion University;Old Dominion University;Old Dominion University;University of Arizona;Old Dominion University", "aff_domain": "odu.edu;odu.edu;odu.edu;arizona.edu;odu.edu", "position": "PhD student;Assistant Professor;Full Professor;Full Professor;Full Professor", "bibtex": "@misc{\nferguson2024efficient,\ntitle={Efficient Backdoor Mitigation in Federated Learning with Contrastive Loss},\nauthor={Hal Ferguson and Rui Ning and Jiang Li and Hongyi Wu and Chunsheng Xin},\nyear={2024},\nurl={https://openreview.net/forum?id=10BTKkFfhl}\n}", "github": "", "project": "", "reviewers": "7bgg;58k3;pCAH;LVhf", "site": "https://openreview.net/forum?id=10BTKkFfhl", "pdf_size": 527904, "rating": "1;3;3;3", "confidence": "4;3;3;5", "soundness": "3;2;2;2", "contribution": "1;2;2;2", "presentation": "1;2;2;2", "wc_summary": "107;103;93;89", "wc_strengths": "98;38;70;6", "wc_weaknesses": "268;148;339;144", "wc_questions": "92;4;21;12", "wc_review": "565;293;523;251", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 2.5, 0.8660254037844386 ], "confidence_avg": [ 3.75, 0.82915619758885 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 1.75, 0.4330127018922193 ], "wc_summary_avg": [ 98.0, 7.280109889280518 ], "wc_strengths_avg": [ 53.0, 34.45286635390443 ], "wc_weaknesses_avg": [ 224.75, 82.66612062991706 ], "wc_questions_avg": [ 32.25, 35.01696017646306 ], "wc_review_avg": [ 408.0, 137.6117727521886 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 6, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.17407765595569782, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:0LzHeHmJ7u0J:scholar.google.com/&scioq=Efficient+Backdoor+Mitigation+in+Federated+Learning+with+Contrastive+Loss&hl=en&as_sdt=0,44", "gs_version_total": 0, "aff_unique_index": "0;0;0;1;0", "aff_unique_norm": "Old Dominion University;University of Arizona", "aff_unique_dep": ";", "aff_unique_url": "https://www.odu.edu;https://www.arizona.edu", "aff_unique_abbr": "ODU;UA", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "10eQ4Cfh8p", "title": "SIMULTANEOUS GENERATION AND IMPROVEMENT: A UNIFIED RL PARADIGM FOR FJSP OPTIMIZATION", "track": "main", "status": "Reject", "tldr": "", "abstract": "We present an end-to-end 
reinforcement learning framework designed to address the Flexible Job Shop Problem (FJSP). Our approach consists of two primary components: a generative model that produces problem solutions stepwise, and a secondary model that continually refines these (partial) solutions. Importantly, we train both models concurrently, enabling each to be cognizant of the other's policy and make informed decisions. Extensive experimentation demonstrates that our model delivers better performance in shorter time on several public datasets comparing to baseline algorithms. Furthermore, we highlight the superior generalizability of our approach, as it maintains strong performance on large-scale instances even when trained on small-scale instances. It is worth noting that this training paradigm can be readily adapted to other combinatorial optimization problems, such as the traveling salesman problemand beyond.", "keywords": "Reinforcement Learning;Flexible Job Shop Schedule Problem;FJSP", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/6f19b6b9b383ac782203728c6d1a9961bcdca867.zip", "author": "Hongyi Zhou;Lei Song", "authorids": "~Hongyi_Zhou2;~Lei_Song3", "gender": "M;M", "homepage": ";", "dblp": ";76/893-1.html", "google_scholar": ";pXDSOocAAAAJ", "orcid": ";", "linkedin": "%E5%BC%98%E6%AF%85-%E5%91%A8-5b0112251/;", "or_profile": "~Hongyi_Zhou2;~Lei_Song3", "aff": "Microsoft Research;Microsoft", "aff_domain": "research.microsoft.com;microsoft.com", "position": "Intern;Principal Researcher", "bibtex": "@misc{\nzhou2024simultaneous,\ntitle={{SIMULTANEOUS} {GENERATION} {AND} {IMPROVEMENT}: A {UNIFIED} {RL} {PARADIGM} {FOR} {FJSP} {OPTIMIZATION}},\nauthor={Hongyi Zhou and Lei Song},\nyear={2024},\nurl={https://openreview.net/forum?id=10eQ4Cfh8p}\n}", "github": "", "project": "", "reviewers": "kC5r;ZW2D;swqB;9qF7", "site": "https://openreview.net/forum?id=10eQ4Cfh8p", "pdf_size": 440085, "rating": "3;3;3;3", "confidence": "4;3;3;3", "soundness": "1;2;2;1", "contribution": "2;2;3;2", "presentation": "1;1;2;1", "wc_summary": "38;167;92;86", "wc_strengths": "29;72;36;77", "wc_weaknesses": "340;389;38;485", "wc_questions": "70;31;82;123", "wc_review": "477;659;248;771", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 3.0, 0.0 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 1.5, 0.5 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 1.25, 0.4330127018922193 ], "wc_summary_avg": [ 95.75, 46.15395432679631 ], "wc_strengths_avg": [ 53.5, 21.219095173922945 ], "wc_weaknesses_avg": [ 313.0, 167.11822162768487 ], "wc_questions_avg": [ 76.5, 32.8062494046485 ], "wc_review_avg": [ 538.75, 197.95753963918625 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 6, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:Mg_4JrTQARgJ:scholar.google.com/&scioq=SIMULTANEOUS+GENERATION+AND+IMPROVEMENT:+A+UNIFIED+RL+PARADIGM+FOR+FJSP+OPTIMIZATION&hl=en&as_sdt=0,47", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "Microsoft", "aff_unique_dep": "Microsoft Research", "aff_unique_url": "https://www.microsoft.com/en-us/research", "aff_unique_abbr": "MSR", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", 
"aff_country_unique": "United States" }, { "id": "10fsmnw6aD", "title": "How Out-of-Distribution important is", "track": "main", "status": "Reject", "tldr": "", "abstract": "Class Incremental Learning (CIL) has gained significant attention in recent years due to its potential to adaptively learn from a non-stationary data distribution. The challenge of CIL primarily revolves around the model's ability to learn new classes without forgetting previously acquired knowledge. Recent research trends has achieved significant milestones, yet the continuity of learning can be further strengthened by integrating the concepts of \"self-training\", \"out-of-distribution\", and \"data drift\". In this paper, we propose a novel approach that integrates \"Continual Learning\", \"Self-Training\", \"Out-of-Distribution recognition\", and \"Data Drift\" concepts to advance the capabilities of class incremental learning systems. Drawing inspiration from works such as \"A Theoretical Study on Solving Continual Learning\", and \"CSI: Novelty Detection via Contrastive Learning on Distributionally Shifted Instances\". We propose a model that satisfies the four concepts mentioned above. Our experimental results demonstrate the efficacy of this method in mitigating catastrophic forgetting and ensuring consistent performance across a diverse range of classes.", "keywords": "continual learning;data drift;out-of-distribution;self training", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "", "author": "Hyowon Park", "authorids": "~Hyowon_Park2", "gender": "", "homepage": "", "dblp": "", "google_scholar": "", "orcid": "", "linkedin": "hyowon-park-6a7173290/", "or_profile": "~Hyowon_Park2", "aff": "Yonsei University", "aff_domain": "yonsei.ac.kr", "position": "MS student", "bibtex": "@misc{\npark2024how,\ntitle={How Out-of-Distribution important is},\nauthor={Hyowon Park},\nyear={2024},\nurl={https://openreview.net/forum?id=10fsmnw6aD}\n}", "github": "", "project": "", "reviewers": "6xad;fB3F;DuXE;SGSA", "site": "https://openreview.net/forum?id=10fsmnw6aD", "pdf_size": 2332277, "rating": "1;3;3;3", "confidence": "3;4;4;3", "soundness": "1;3;2;3", "contribution": "1;2;2;2", "presentation": "1;3;1;1", "wc_summary": "29;32;18;55", "wc_strengths": "3;20;14;8", "wc_weaknesses": "52;25;80;114", "wc_questions": "11;56;7;3", "wc_review": "95;133;119;180", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 2.5, 0.8660254037844386 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.25, 0.82915619758885 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 1.5, 0.8660254037844386 ], "wc_summary_avg": [ 33.5, 13.46291201783626 ], "wc_strengths_avg": [ 11.25, 6.378675411086537 ], "wc_weaknesses_avg": [ 67.75, 33.03312731183652 ], "wc_questions_avg": [ 19.25, 21.405314760591587 ], "wc_review_avg": [ 131.75, 30.994959267597046 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 6, 0 ], "authors#_avg": [ 1, 0 ], "corr_rating_confidence": 0.5773502691896257, "gs_citation": -1, "gs_cited_by_link": "", "gs_version_total": -1, "aff_unique_index": "0", "aff_unique_norm": "Yonsei University", "aff_unique_dep": "", "aff_unique_url": "https://www.yonsei.ac.kr", "aff_unique_abbr": "Yonsei", "aff_country_unique_index": "0", "aff_country_unique": "South Korea" }, { "id": 
"11WAKGH8uv", "title": "FedAIoT: A Federated Learning Benchmark for Artificial Intelligence of Things", "track": "main", "status": "Reject", "tldr": "", "abstract": "There is a significant relevance of federated learning (FL) in the realm of Artificial Intelligence of Things (AIoT). However, most of existing FL works are not conducted on datasets collected from authentic IoT devices that capture unique modalities and inherent challenges of IoT data. In this work, we introduce FedAIoT, a FL benchmark for AIoT to fill this critical gap. FedAIoT includes eight well-chosen datatsets collected from a wide range of IoT devices. These datasets cover unique IoT modalities and target representative applications of AIoT. In addition, FedAIoT includes a unified end-to-end FL framework for AIoT that simplifies benchmarking the performance of the datasets. Our benchmark results shed light on the opportunities and challenges of FL for AIoT. We hope that FedAIoT could serve as an invaluable resource for researchers and practitioners to foster advancements in the important field of FL for AIoT.", "keywords": "AIoT;Federated Learning", "primary_area": "datasets and benchmarks", "supplementary_material": "/attachment/95a9180a3c9425b6d11c888e6b5e0f6dd01cc109.pdf", "author": "Samiul Alam;Tuo Zhang;Tiantian Feng;Hui Shen;Zhichao Cao;Dong Zhao;Jeonggil Ko;Kiran Somasundaram;Shrikanth Narayanan;Salman Avestimehr;Mi Zhang", "authorids": "~Samiul_Alam1;~Tuo_Zhang2;~Tiantian_Feng1;~Hui_Shen2;~Zhichao_Cao1;~Dong_Zhao1;~Jeonggil_Ko1;~Kiran_Somasundaram1;~Shrikanth_Narayanan1;~Salman_Avestimehr1;~Mi_Zhang1", "gender": "M;M;M;M;M;M;;M;M;;M", "homepage": "https://samiul272.github.io;;https://tiantiaf0627.github.io/;https://nastymarcus.github.io/;http://cse.msu.edu/~caozc/;https://hbsl.msu.edu/;http://eis-lab.org;https://www.linkedin.com/in/kiran-somasundaram/;http://sail.usc.edu/people/shri.html;;https://mi-zhang.github.io/", "dblp": "222/1821;;;;;;;;19/3899;;84/2519-2.html", "google_scholar": "2Un1c7QAAAAJ;Rki45F4AAAAJ;p7oF-XIAAAAJ;iblw0zoAAAAJ;;;;https://scholar.google.com/citations?hl=en;8EDHmYkAAAAJ;;https://scholar.google.com.tw/citations?user=r3A90uAAAAAJ", "orcid": "0000-0002-8458-4642;;0000-0002-2053-9068;;;;;;0000-0002-1052-6204;;", "linkedin": "samiul-alam/;tuo-zhang-ultraz/;;hui-shen-8b4a86260/;;;;kiran-somasundaram/;shrikanth-narayanan/;;mizhang/", "or_profile": "~Samiul_Alam1;~Tuo_Zhang2;~Tiantian_Feng1;~Hui_Shen2;~Zhichao_Cao1;~Dong_Zhao1;~Jeonggil_Ko1;~Kiran_Somasundaram1;~Shrikanth_Narayanan1;~Salman_Avestimehr1;~Mi_Zhang1", "aff": "Ohio State University, Columbus;University of Southern California;University of Southern California;Ohio State University, Columbus;Michigan State University;Michigan State University;Yonsei University;Meta Facebook;University of Southern California;;The Ohio State University", "aff_domain": "osu.edu;usc.edu;usc.edu;osu.edu;msu.edu;msu.edu;yonsei.ac.kr;meta.com;usc.edu;;osu.edu", "position": "PhD student;PhD student;Postdoc;Undergrad student;Assistant Professor;Associate Professor;Associate Professor;Researcher;Full Professor;;Associate Professor", "bibtex": "@misc{\nalam2024fedaiot,\ntitle={Fed{AI}oT: A Federated Learning Benchmark for Artificial Intelligence of Things},\nauthor={Samiul Alam and Tuo Zhang and Tiantian Feng and Hui Shen and Zhichao Cao and Dong Zhao and Jeonggil Ko and Kiran Somasundaram and Shrikanth Narayanan and Salman Avestimehr and Mi Zhang},\nyear={2024},\nurl={https://openreview.net/forum?id=11WAKGH8uv}\n}", "github": "", "project": "", "reviewers": 
"N2ym;Vfdi;MJiJ;hEF2", "site": "https://openreview.net/forum?id=11WAKGH8uv", "pdf_size": 835320, "rating": "3;5;5;6", "confidence": "4;4;3;3", "soundness": "2;2;2;2", "contribution": "2;3;2;3", "presentation": "2;3;2;3", "wc_summary": "302;27;54;56", "wc_strengths": "224;25;78;97", "wc_weaknesses": "706;211;111;13", "wc_questions": "248;190;92;73", "wc_review": "1480;453;335;239", "wc_reply_reviewers": "0;86;0;24", "wc_reply_authors": "30;691;1109;593", "reply_reviewers": "0;2;0;1", "reply_authors": "1;7;6;7", "rating_avg": [ 4.75, 1.0897247358851685 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 109.75, 111.58488920996427 ], "wc_strengths_avg": [ 106.0, 73.05819598101229 ], "wc_weaknesses_avg": [ 260.25, 266.7052446053508 ], "wc_questions_avg": [ 150.75, 71.5799378317696 ], "wc_review_avg": [ 626.75, 498.42069329031676 ], "wc_reply_reviewers_avg": [ 27.5, 35.16745654721137 ], "wc_reply_authors_avg": [ 605.75, 384.76575666241405 ], "reply_reviewers_avg": [ 0.75, 0.82915619758885 ], "reply_authors_avg": [ 5.25, 2.48746859276655 ], "replies_avg": [ 31, 0 ], "authors#_avg": [ 11, 0 ], "corr_rating_confidence": -0.6882472016116854, "gs_citation": 12, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14104236724301259853&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 8, "aff_unique_index": "0;1;1;0;2;2;3;4;1;0", "aff_unique_norm": "Ohio State University;University of Southern California;Michigan State University;Yonsei University;Meta", "aff_unique_dep": ";;;;Meta Platforms, Inc.", "aff_unique_url": "https://www.osu.edu;https://www.usc.edu;https://www.msu.edu;https://www.yonsei.ac.kr;https://meta.com", "aff_unique_abbr": "OSU;USC;MSU;Yonsei;Meta", "aff_campus_unique_index": "0;1;1;0;1", "aff_campus_unique": "Columbus;Los Angeles;", "aff_country_unique_index": "0;0;0;0;0;0;1;0;0;0", "aff_country_unique": "United States;South Korea" }, { "id": "11nZWTg0mS", "title": "Moral High Ground: A text-based games benchmark for moral evaluation", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "This paper introduces a benchmark for the evaluation of large language models on moral values and business principles. The main focus of this framework is to evaluate moral and ethical reasoning ability of large language models using text-based games, which can be played by both human player and models. We present these games to the player as an interaction between the player and the environment. Each action in these games is associated with a reward based on the moral and ethical values, i.e., higher reward implies higher moral values and vice versa. We score the game trajectory taken by a player by combining the rewards of the individual action, with highest score corresponding with the most moral or ethical paths possible. This will enable us to compare different models and human players on the moral values. In addition, this framework can be used to teach/tune the large language models using these text-based games on desired moral values and business principles. 
Through this framework, we hope to expand upon the diverse area of alignment techniques to help ensure future models grasp the often nuanced topics of moral and ethical values.", "keywords": "Text-based Games;LLM Evaluation;LLM Tuning", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "/attachment/09e7c11310bcf66c1cd5ac5c23bec7464def7620.zip", "author": "Matthew Pisano;Keerthiram Murugesan;Lamogha Chiazor;Lan Hoang;Karthikeyan Natesan Ramamurthy;Kush R. Varshney", "authorids": "pisanm2@rpi.edu;~Keerthiram_Murugesan1;~Lamogha_Chiazor1;~Lan_Hoang2;~Karthikeyan_Natesan_Ramamurthy1;~Kush_R._Varshney1", "gender": ";M;F;;;M", "homepage": ";https://keerthi166.github.io;;https://researcher.watson.ibm.com/researcher/view.php?person=ibm-Lan.Hoang;https://nrkarthikeyan.github.io/;http://krvarshney.github.io", "dblp": ";178/2877;;;58/7800;", "google_scholar": ";-698GEMAAAAJ;;MtmdB6sAAAAJ;mG8HuhEAAAAJ;hMZMhLoAAAAJ", "orcid": ";0000-0001-6847-522X;;;0000-0002-6021-5930;", "linkedin": ";https://linkedin.com/in/keerthiram;lamogha/;lannhoang/;;kushvarshney", "or_profile": "pisanm2@rpi.edu;~Keerthiram_Murugesan1;~Lamogha_Chiazor1;~Lan_Hoang2;~Karthikeyan_Natesan_Ramamurthy1;~Kush_R._Varshney1", "aff": ";International Business Machines;International Business Machines;International Business Machines;International Business Machines;International Business Machines", "aff_domain": ";ibm.com;ibm.com;ibm.com;ibm.com;ibm.com", "position": ";Researcher;Researcher;Researcher;Research Staff Member;Research Staff Member", "bibtex": "@misc{\npisano2024moral,\ntitle={Moral High Ground: A text-based games benchmark for moral evaluation},\nauthor={Matthew Pisano and Keerthiram Murugesan and Lamogha Chiazor and Lan Hoang and Karthikeyan Natesan Ramamurthy and Kush R. 
Varshney},\nyear={2024},\nurl={https://openreview.net/forum?id=11nZWTg0mS}\n}", "github": "", "project": "", "reviewers": "6LQq;Uvtk;T1SJ;N9dw", "site": "https://openreview.net/forum?id=11nZWTg0mS", "pdf_size": 1999473, "rating": "1;1;5;5", "confidence": "4;4;4;3", "soundness": "1;1;2;3", "contribution": "1;1;2;3", "presentation": "2;1;3;3", "wc_summary": "80;110;45;89", "wc_strengths": "12;50;28;105", "wc_weaknesses": "140;279;266;404", "wc_questions": "291;14;30;68", "wc_review": "523;453;369;666", "wc_reply_reviewers": "29;31;32;0", "wc_reply_authors": "334;245;124;601", "reply_reviewers": "1;1;1;0", "reply_authors": "1;1;1;1", "rating_avg": [ 3.0, 2.0 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 1.75, 0.82915619758885 ], "contribution_avg": [ 1.75, 0.82915619758885 ], "presentation_avg": [ 2.25, 0.82915619758885 ], "wc_summary_avg": [ 81.0, 23.46273641330013 ], "wc_strengths_avg": [ 48.75, 35.16656793035112 ], "wc_weaknesses_avg": [ 272.25, 93.45152486717379 ], "wc_questions_avg": [ 100.75, 111.57816766733535 ], "wc_review_avg": [ 502.75, 108.88612170520172 ], "wc_reply_reviewers_avg": [ 23.0, 13.322912594474229 ], "wc_reply_authors_avg": [ 326.0, 175.3952678951174 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:hZsNKwF6wicJ:scholar.google.com/&scioq=Moral+High+Ground:+A+text-based+games+benchmark+for+moral+evaluation&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;0;0;0", "aff_unique_norm": "International Business Machines Corporation", "aff_unique_dep": "", "aff_unique_url": "https://www.ibm.com", "aff_unique_abbr": "IBM", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "11oqo92x2Z", "title": "Detection and Segmentation of Solar Farms in Satellite Imagery: A Study of Deep Neural Network Architectures", "track": "main", "status": "Reject", "tldr": "", "abstract": "In line with global sustainability goals, such as the Paris Agreement, accurate mapping and monitoring of solar farms are critical for achieving net zero emissions by 2050. However, many solar installations remain undocumented, posing a challenge. This work introduces Solis-seg, a Deep Neural Network optimized for detecting solar farms in satellite imagery. Solis-seg achieves a mean Intersection over Union (IoU) of 96.26% on a European dataset, outperforming existing solutions.\n\nThe study leans heavily on advances in semantic segmentation and NAS for solar farm detection. Semantic segmentation has evolved through technologies like Fully Convolutional Network (FCN) and U-Net, which have shown strong performance on satellite imagery. In NAS, Differentiable Architecture Search (DARTS) and its variants like Auto-DeepLab (ADL) have become efficient ways to automate the creation of architectures. This study also challenges the prevailing method of using transfer learning from classification tasks for semantic segmentation, suggesting new avenues for research.\n\nThus, this work contributes to both the field of earth observation machine learning and the global transition to renewable energy by providing an efficient, scalable solution for tracking solar installations. 
We believe that our research offers valuable insights into the application of advanced machine learning techniques for solar farm detection and also encourages further exploration in earth observation and sustainability.", "keywords": "Solar Farms;Detection;Satellite Images;Image Segmentation;Machine Learning;Deep Learning", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Erling Olweus;Ole Jakob Mengshoel", "authorids": "erlingolweus@gmail.com;~Ole_Jakob_Mengshoel1", "gender": ";", "homepage": ";", "dblp": ";", "google_scholar": ";", "orcid": ";", "linkedin": ";", "or_profile": "erlingolweus@gmail.com;~Ole_Jakob_Mengshoel1", "aff": ";", "aff_domain": ";", "position": ";", "bibtex": "@misc{\nolweus2024detection,\ntitle={Detection and Segmentation of Solar Farms in Satellite Imagery: A Study of Deep Neural Network Architectures},\nauthor={Erling Olweus and Ole Jakob Mengshoel},\nyear={2024},\nurl={https://openreview.net/forum?id=11oqo92x2Z}\n}", "github": "", "project": "", "reviewers": "vhXk;2B7A;Co8H;rV62", "site": "https://openreview.net/forum?id=11oqo92x2Z", "pdf_size": 8031806, "rating": "1;1;3;5", "confidence": "4;4;3;4", "soundness": "1;1;2;3", "contribution": "1;2;1;2", "presentation": "2;1;2;3", "wc_summary": "58;29;72;88", "wc_strengths": "76;17;59;84", "wc_weaknesses": "541;174;64;80", "wc_questions": "3;9;70;402", "wc_review": "678;229;265;654", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "69;0;68;75", "reply_reviewers": "0;0;0;0", "reply_authors": "1;0;1;1", "rating_avg": [ 2.5, 1.6583123951777 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 1.75, 0.82915619758885 ], "contribution_avg": [ 1.5, 0.5 ], "presentation_avg": [ 2.0, 0.7071067811865476 ], "wc_summary_avg": [ 61.75, 21.683807322516035 ], "wc_strengths_avg": [ 59.0, 25.874698065871222 ], "wc_weaknesses_avg": [ 214.75, 192.99141820298644 ], "wc_questions_avg": [ 121.0, 164.33958744015393 ], "wc_review_avg": [ 456.5, 210.05773016006813 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 53.0, 30.71644510681534 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0.75, 0.4330127018922193 ], "replies_avg": [ 9, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.17407765595569782, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=16123498411678315838&as_sdt=40005&sciodt=0,10&hl=en", "gs_version_total": 8 }, { "id": "122IP1hqTY", "title": "KLIP: Keyword-Guided Language-Image Pretraining for Data-Efficient Domain-Specific Image Captioning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Image captioning aims to generate natural language descriptions for a given image. While recent vision-language models have shown promising progress on this task, it is still challenging to finetune such models for particular domains with limited image-caption training data. To enable domain-specific few-shot image captioning, we propose a Keyword-Guided Language-Image Pretraining (KLIP) scheme, which learns entity-oriented keywords for aligning visual and textual modalities in each data domain for pre-training and fine-tuning. While our pre-training objectives enables the above alignment for vision-language models, the identified keywords further serve as prompts for regularizing the model during the fine-tuning stage. As a result, potential overfitting problems can be mitigated. 
Extensive experiments on benchmark datasets show that our KLIP performs favorably against state-of-the-art VLMs with various parameter-efficient fine-tuning techniques for domain-specific yet data-efficient image captioning.", "keywords": "Image Captioning;Vision-Language Pretraining", "primary_area": "generative models", "supplementary_material": "", "author": "Chi-Pin Huang;Kai-Po Chang;Fu-En Yang;Chung-Ting Tsai;Yung-Hsuan Lai;Yu-Chiang Frank Wang", "authorids": "~Chi-Pin_Huang2;~Kai-Po_Chang1;~Fu-En_Yang1;~Chung-Ting_Tsai1;~Yung-Hsuan_Lai1;~Yu-Chiang_Frank_Wang2", "gender": "M;M;M;M;M;M", "homepage": "https://jasper0314-huang.github.io/;;https://fuenyang1127.github.io/;https://github.com/tim901231;https://franklin905.github.io/;http://vllab.ee.ntu.edu.tw/ycwang.html", "dblp": "362/2899;234/8190;218/6244;164/5784-2;348/6382;30/1690", "google_scholar": "https://scholar.google.com.tw/citations?user=s8-yTSwAAAAJ;lXC6HbkAAAAJ;https://scholar.google.com.tw/citations?user=k6Iz9VoAAAAJ;;rU7n-9YAAAAJ;HSGvdtoAAAAJ", "orcid": "0009-0003-7738-3054;;0000-0003-0102-7101;;;0000-0002-2333-157X", "linkedin": "chi-pin-huang-b69704208/;%E5%87%B1%E5%8D%9A-%E5%BC%B5-14051a191/?trk=public_profile_browsemap_profile-result-card_result-card_full-click&originalSubdomain=tw;fu-en-yang-77ba7b175/;chung-ting-tsai-76a74b207/;yung-hsuan-lai-1629a7212/;", "or_profile": "~Chi-Pin_Huang2;~Kai-Po_Chang1;~Fu-En_Yang1;~Chung-Ting_Tsai1;~Yung-Hsuan_Lai1;~Yu-Chiang_Frank_Wang2", "aff": "National Taiwan University;National Taiwan University;NVIDIA;National Technological University;National Taiwan University;National Taiwan University", "aff_domain": "ntu.edu.tw;ntu.edu.tw;nvidia.com;ntu.edu;ntu.edu.tw;ntu.edu.tw", "position": "PhD student;PhD student;Researcher;Undergrad student;Research Assistant;Full Professor", "bibtex": "@misc{\nhuang2024klip,\ntitle={{KLIP}: Keyword-Guided Language-Image Pretraining for Data-Efficient Domain-Specific Image Captioning},\nauthor={Chi-Pin Huang and Kai-Po Chang and Fu-En Yang and Chung-Ting Tsai and Yung-Hsuan Lai and Yu-Chiang Frank Wang},\nyear={2024},\nurl={https://openreview.net/forum?id=122IP1hqTY}\n}", "github": "", "project": "", "reviewers": "NtDh;eL8y;uxeH;g8oh;Qycg", "site": "https://openreview.net/forum?id=122IP1hqTY", "pdf_size": 6661439, "rating": "3;5;5;5;6", "confidence": "4;4;3;4;5", "soundness": "2;2;2;2;4", "contribution": "2;2;3;3;4", "presentation": "3;2;2;3;3", "wc_summary": "33;64;186;72;209", "wc_strengths": "25;26;182;139;71", "wc_weaknesses": "132;384;431;446;269", "wc_questions": "33;67;104;330;4", "wc_review": "223;541;903;987;553", "wc_reply_reviewers": "0;0;0;0;10", "wc_reply_authors": "0;0;0;0;41", "reply_reviewers": "0;0;0;0;1", "reply_authors": "0;0;0;0;1", "rating_avg": [ 4.8, 0.9797958971132712 ], "confidence_avg": [ 4.0, 0.6324555320336759 ], "soundness_avg": [ 2.4, 0.8 ], "contribution_avg": [ 2.8, 0.7483314773547882 ], "presentation_avg": [ 2.6, 0.4898979485566356 ], "wc_summary_avg": [ 112.8, 70.74856889011961 ], "wc_strengths_avg": [ 88.6, 62.50951927506721 ], "wc_weaknesses_avg": [ 332.4, 117.87213411150236 ], "wc_questions_avg": [ 107.6, 116.12166033949049 ], "wc_review_avg": [ 641.4, 275.9808689021759 ], "wc_reply_reviewers_avg": [ 2.0, 4.0 ], "wc_reply_authors_avg": [ 8.2, 16.4 ], "reply_reviewers_avg": [ 0.2, 0.4 ], "reply_authors_avg": [ 0.2, 0.4 ], "replies_avg": [ 7, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.3227486121839514, "gs_citation": 0, "gs_cited_by_link": 
"https://scholar.google.com/scholar?q=related:YZvBVAZEOPQJ:scholar.google.com/&scioq=KLIP:+Keyword-Guided+Language-Image+Pretraining+for+Data-Efficient+Domain-Specific+Image+Captioning&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;1;2;0;0", "aff_unique_norm": "National Taiwan University;NVIDIA;National Technological University", "aff_unique_dep": ";NVIDIA Corporation;", "aff_unique_url": "https://www.ntu.edu.tw;https://www.nvidia.com;https://www.ntu.edu", "aff_unique_abbr": "NTU;NVIDIA;NTU", "aff_campus_unique_index": "0;0;0;0", "aff_campus_unique": "Taiwan;", "aff_country_unique_index": "0;0;1;1;0;0", "aff_country_unique": "China;United States" }, { "id": "12Acp6ZcRa", "title": "Evaluating the Robustness of Text-to-image Diffusion Models against Real-world Attacks", "track": "main", "status": "Reject", "tldr": "", "abstract": "Text-to-image (T2I) diffusion models (DMs) have shown promise in generating high-quality images from textual descriptions. The real-world applications of these models require particular attention to their safety and fidelity, but this has not been sufficiently explored. \nOne fundamental question is whether the existing T2I DMs are robust against variations over input texts. To answer it, this work provides the first robustness evaluation of T2I DMs against real-world perturbations. Unlike malicious attacks that involve apocryphal alterations to the input texts, we consider a perturbation space spanned by realistic errors (e.g., typo, glyph, phonetic) that humans can make and adopt adversarial attacks to generate worst-case perturbations for robustness evaluation. Given the inherent randomness of the generation process, we develop novel distribution-based objectives to mislead T2I DMs. We optimize the objectives by black-box attacks without any knowledge of the model. Extensive experiments demonstrate the effectiveness of our method for attacking popular T2I DMs and simultaneously reveal their non-trivial robustness issues. 
Moreover, we provide an in-depth analysis of our method to show that it is not designed to attack the text encoder in T2I DMs solely.", "keywords": "Diffusion Models;Text to Image Generation;Adversarial Attack;Robustness Evaluation", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/62de1fd0cd0182eca39bfc682c6b52555b45714b.zip", "author": "Hongcheng Gao;Hao Zhang;Yinpeng Dong;Zhijie Deng", "authorids": "~Hongcheng_Gao1;~Hao_Zhang2;~Yinpeng_Dong2;~Zhijie_Deng1", "gender": "M;M;M;M", "homepage": "https://gao-hongcheng.github.io/;https://cseweb.ucsd.edu/~haozhang/;https://dongyp13.github.io;https://thudzj.github.io/", "dblp": "318/1404;55/2270-25;183/0980;209/4959", "google_scholar": "https://scholar.google.com/citations?hl=en;H1d4BS8AAAAJ;6_4ad84AAAAJ;J3dR0sUAAAAJ", "orcid": ";;;0000-0002-0932-1631", "linkedin": ";;;", "or_profile": "~Hongcheng_Gao1;~Hao_Zhang2;~Yinpeng_Dong2;~Zhijie_Deng1", "aff": "University of Chinese Academy of Sciences;Carnegie Mellon University;Tsinghua University;Shanghai Jiaotong University", "aff_domain": "ucas.ac.cn;cmu.edu;tsinghua.edu.cn;sjtu.edu.cn", "position": "MS student;PhD student;Postdoc;Assistant Professor", "bibtex": "@misc{\ngao2024evaluating,\ntitle={Evaluating the Robustness of Text-to-image Diffusion Models against Real-world Attacks},\nauthor={Hongcheng Gao and Hao Zhang and Yinpeng Dong and Zhijie Deng},\nyear={2024},\nurl={https://openreview.net/forum?id=12Acp6ZcRa}\n}", "github": "", "project": "", "reviewers": "BaK3;a3Ko;st1Q;BYdd", "site": "https://openreview.net/forum?id=12Acp6ZcRa", "pdf_size": 14098103, "rating": "3;5;6;8", "confidence": "3;4;4;3", "soundness": "2;3;2;4", "contribution": "2;3;3;3", "presentation": "2;3;3;4", "wc_summary": "91;45;163;63", "wc_strengths": "72;83;125;126", "wc_weaknesses": "306;195;289;82", "wc_questions": "60;10;46;134", "wc_review": "529;333;623;405", "wc_reply_reviewers": "191;0;0;170", "wc_reply_authors": "1291;468;909;780", "reply_reviewers": "1;0;0;2", "reply_authors": "4;2;3;2", "rating_avg": [ 5.5, 1.8027756377319946 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.75, 0.82915619758885 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 90.5, 44.95275297465106 ], "wc_strengths_avg": [ 101.5, 24.315632831575655 ], "wc_weaknesses_avg": [ 218.0, 89.17679070251407 ], "wc_questions_avg": [ 62.5, 45.13036671687922 ], "wc_review_avg": [ 472.5, 111.64564478742554 ], "wc_reply_reviewers_avg": [ 90.25, 90.55488667101295 ], "wc_reply_authors_avg": [ 862.0, 295.0466064878564 ], "reply_reviewers_avg": [ 0.75, 0.82915619758885 ], "reply_authors_avg": [ 2.75, 0.82915619758885 ], "replies_avg": [ 21, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 24, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=4174072518643267646&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "aff_unique_index": "0;1;2;3", "aff_unique_norm": "University of Chinese Academy of Sciences;Carnegie Mellon University;Tsinghua University;Shanghai Jiao Tong University", "aff_unique_dep": ";;;", "aff_unique_url": "http://www.ucas.ac.cn;https://www.cmu.edu;https://www.tsinghua.edu.cn;https://www.sjtu.edu.cn", "aff_unique_abbr": "UCAS;CMU;THU;SJTU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;0;0", "aff_country_unique": "China;United States" }, { "id": "12zKEh2APn", "title": "PROSE: Predicting Operators and Symbolic 
Expressions using Multimodal Transformers", "track": "main", "status": "Reject", "tldr": "", "abstract": "Approximating nonlinear differential equations using a neural network provides a robust and efficient tool for various scientific computing tasks, including real-time predictions, inverse problems, optimal controls, and surrogate modeling. Previous works have focused on embedding dynamical systems into networks through two approaches: learning a single solution operator (i.e., the mapping from input parametrized functions to solutions) or learning the governing system of equations (i.e., the constitutive model relative to the state variables). Both of these approaches yield different representations for the same underlying data or function. Additionally, observing that families of differential equations often share key characteristics which can be leveraged to train one network representation across a wide range of equations. Our method, called Predicting Operators and Symbolic Expressions (PROSE), learns maps from multimodal inputs to multimodal outputs, capable of generating both numerical predictions and mathematical equations. By using a transformer structure and a feature fusion approach, our network can simultaneously embed sets of solution operators for various parametric differential equations using a single trained network. Detailed experiments demonstrate that the network benefits from its multimodal nature, resulting in improved prediction accuracy and better generalization. The network is shown to be able to handle noise in the data and errors in the symbolic representation, including noisy numerical values, model misspecification, and erroneous addition or deletion of terms. PROSE provides a new neural network framework for differential equations which allows for more flexibility and generality in learning operators and governing equations from data.", "keywords": "Neural networks for differential equations;multi-operator learning;learning governing equations;multimodal transformers;symbolic generation", "primary_area": "neurosymbolic & hybrid AI systems (physics-informed, logic & formal reasoning, etc.)", "supplementary_material": "", "author": "Yuxuan Liu;Zecheng Zhang;Hayden Schaeffer", "authorids": "~Yuxuan_Liu12;~Zecheng_Zhang2;~Hayden_Schaeffer2", "gender": "M;;Not Specified", "homepage": "https://felix-lyx.github.io/;https://www.math.fsu.edu/~zhang/;https://www.math.ucla.edu/people/ladder/hayden", "dblp": ";;", "google_scholar": "SbieiN4AAAAJ;;", "orcid": ";;", "linkedin": ";;", "or_profile": "~Yuxuan_Liu12;~Zecheng_Zhang2;~Hayden_Schaeffer2", "aff": "University of California, Los Angeles;Florida State University;University of California, Los Angeles", "aff_domain": "ucla.edu;fsu.edu;ucla.edu", "position": "PhD student;Assistant Professor;Full Professor", "bibtex": "@misc{\nliu2024prose,\ntitle={{PROSE}: Predicting Operators and Symbolic Expressions using Multimodal Transformers},\nauthor={Yuxuan Liu and Zecheng Zhang and Hayden Schaeffer},\nyear={2024},\nurl={https://openreview.net/forum?id=12zKEh2APn}\n}", "github": "", "project": "", "reviewers": "LoCo;62Ac;45hW", "site": "https://openreview.net/forum?id=12zKEh2APn", "pdf_size": 2052077, "rating": "5;5;6", "confidence": "4;4;4", "soundness": "2;2;3", "contribution": "2;2;3", "presentation": "3;2;3", "wc_summary": "166;163;30", "wc_strengths": "83;24;41", "wc_weaknesses": "363;292;43", "wc_questions": "3;406;40", "wc_review": "615;885;154", "wc_reply_reviewers": "0;54;10", "wc_reply_authors": "1475;1349;257", 
"reply_reviewers": "0;1;1", "reply_authors": "2;2;1", "rating_avg": [ 5.333333333333333, 0.4714045207910317 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 119.66666666666667, 63.415735867019286 ], "wc_strengths_avg": [ 49.333333333333336, 24.796953217863056 ], "wc_weaknesses_avg": [ 232.66666666666666, 137.2111106612321 ], "wc_questions_avg": [ 149.66666666666666, 181.88335700540486 ], "wc_review_avg": [ 551.3333333333334, 301.806045149677 ], "wc_reply_reviewers_avg": [ 21.333333333333332, 23.456816114345575 ], "wc_reply_authors_avg": [ 1027.0, 546.8966995694891 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 1.6666666666666667, 0.4714045207910317 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 20, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=1192824799122986362&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 7, "aff_unique_index": "0;1;0", "aff_unique_norm": "University of California, Los Angeles;Florida State University", "aff_unique_dep": ";", "aff_unique_url": "https://www.ucla.edu;https://www.fsu.edu", "aff_unique_abbr": "UCLA;FSU", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Los Angeles;", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "13D1zn0mpd", "title": "Effective and Parameter-Efficient Reusing Fine-Tuned Models", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Many pre-trained large-scale models provided online have become highly effective in transferring to downstream tasks. At the same time, various task-specific models fine-tuned on these pre-trained models are available online for public use. In practice, collecting task-specific data is labor-intensive and fine-tuning the large pre-trained models is computationally expensive, one can reuse task-specific fine-tuned models to deal with downstream tasks. However, using a model per task causes a heavy burden on storage and serving. Recently, many training-free and parameter-efficient methods have been proposed for merging multiple fine-tuned task-specific models into a single multi-task model. However, these methods exhibit a large accuracy gap compared with using a fine-tuned model per task. In this paper, we propose parameter-efficient methods for Reusing fine-tuned models. For reusing fully fine-tuned models, we inject sparse task vectors to a merged model by magnitude pruning. For reusing LoRA fine-tuned models, we use a lower-rank matrix to approximate the LoRA matrix by singular value decomposition. Extensive experiments conducted on computer vision and natural language process tasks demonstrate the effectiveness and parameter-efficiency of the proposed methods. 
The proposed methods outperform existing merging models method by a large margin and achieve comparable performance to using a fine-tuned model per task.", "keywords": "merging models;fine-tune models", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/aeef207d505b1d73898732911fffddda6d0fe873.zip", "author": "Weisen Jiang;Baijiong Lin;Han Shi;Yu Zhang;Zhenguo Li;James Kwok", "authorids": "~Weisen_Jiang1;~Baijiong_Lin1;~Han_Shi1;~Yu_Zhang3;~Zhenguo_Li1;~James_Kwok1", "gender": "M;M;M;M;M;", "homepage": "https://wayson-ust.github.io/;https://baijiong-lin.github.io/;https://han-shi.github.io/;http://cse.sustech.edu.cn/faculty/~zhangy/;http://www.ee.columbia.edu/~zgli/;", "dblp": "302/7625;279/2950;;50/671-6;23/6479;", "google_scholar": "https://scholar.google.com/citations?hl=en;KVdbYTYAAAAJ;https://scholar.google.com.hk/citations?user=Johp_14AAAAJ;https://scholar.google.com.hk/citations?user=jaRS5w4AAAAJ;XboZC1AAAAAJ;", "orcid": ";0000-0002-4257-0226;;;;", "linkedin": ";;;;;", "or_profile": "~Weisen_Jiang1;~Baijiong_Lin1;~Han_Shi1;~Yu_Zhang3;~Zhenguo_Li1;~James_Kwok1", "aff": "Hong Kong University of Science and Technology;The Hong Kong University of Science and Technology (Guangzhou);Huawei Technologies Ltd.;Southern University of Science and Technology;Huawei Noah's Ark Lab;", "aff_domain": "ust.hk;connect.hkust-gz.edu.cn;huawei.com;sustc.edu.cn;huawei.com;", "position": "PhD student;PhD student;Principal Researcher;Associate Professor;Principal Researcher;", "bibtex": "@misc{\njiang2024effective,\ntitle={Effective and Parameter-Efficient Reusing Fine-Tuned Models},\nauthor={Weisen Jiang and Baijiong Lin and Han Shi and Yu Zhang and Zhenguo Li and James Kwok},\nyear={2024},\nurl={https://openreview.net/forum?id=13D1zn0mpd}\n}", "github": "", "project": "", "reviewers": "tpTw;a2T8;wHfz", "site": "https://openreview.net/forum?id=13D1zn0mpd", "pdf_size": 533242, "rating": "5;6;6", "confidence": "4;4;3", "soundness": "2;3;3", "contribution": "2;2;2", "presentation": "3;3;3", "wc_summary": "76;85;78", "wc_strengths": "29;26;26", "wc_weaknesses": "322;33;111", "wc_questions": "6;317;73", "wc_review": "433;461;288", "wc_reply_reviewers": "0;73;0", "wc_reply_authors": "2560;2063;1598", "reply_reviewers": "0;2;0", "reply_authors": "6;6;4", "rating_avg": [ 5.666666666666667, 0.4714045207910317 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 79.66666666666667, 3.858612300930075 ], "wc_strengths_avg": [ 27.0, 1.4142135623730951 ], "wc_weaknesses_avg": [ 155.33333333333334, 122.07738893377794 ], "wc_questions_avg": [ 132.0, 133.64380519375624 ], "wc_review_avg": [ 394.0, 75.81996219114507 ], "wc_reply_reviewers_avg": [ 24.333333333333332, 34.41253001774532 ], "wc_reply_authors_avg": [ 2073.6666666666665, 392.8072753342987 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.9428090415820634 ], "reply_authors_avg": [ 5.333333333333333, 0.9428090415820634 ], "replies_avg": [ 22, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.4999999999999999, "gs_citation": 8, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=414454635213371595&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 0, "aff_unique_index": "0;0;1;2;1", "aff_unique_norm": "Hong Kong University of Science and Technology;Huawei;Southern University of Science and Technology", "aff_unique_dep": ";Huawei 
Technologies;", "aff_unique_url": "https://www.ust.hk;https://www.huawei.com;https://www.sustech.edu.cn", "aff_unique_abbr": "HKUST;Huawei;SUSTech", "aff_campus_unique_index": "0;1", "aff_campus_unique": "Hong Kong SAR;Guangzhou;", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "China" }, { "title": "SALMONN: Towards Generic Hearing Abilities for Large Language Models", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19600", "id": "14rn7HpKVk", "author_site": "Changli Tang, Wenyi Yu, Guangzhi Sun, Xianzhao Chen, Tian Tan, Wei Li, Lu Lu, Zejun MA, Chao Zhang", "tldr": "", "abstract": "Hearing is arguably an essential ability of artificial intelligence (AI) agents in the physical world, which refers to the perception and understanding of general auditory information consisting of at least three types of sounds: speech, audio events, and music. In this paper, we propose SALMONN, a speech audio language music open neural network, built by integrating a pre-trained text-based large language model (LLM) with speech and audio encoders into a single multimodal model. SALMONN enables the LLM to directly process and understand general audio inputs and achieve competitive performances on a number of speech and audio tasks used in training, such as \nautomatic speech recognition and translation, auditory-information-based question answering, emotion recognition, speaker verification, and music and audio captioning etc. SALMONN also has a diverse set of emergent abilities unseen in the training, which includes but is not limited to speech translation to untrained languages, speech-based slot filling, spoken-query-based question answering, audio-based storytelling, and speech audio co-reasoning etc. The presence of cross-modal emergent abilities is studied, and a novel few-shot activation tuning approach is proposed to activate such abilities. To our knowledge, SALMONN is the first model of its type and can be regarded as a step towards AI with generic hearing abilities. 
The source code, model checkpoints and data are available at https://github.com/bytedance/SALMONN.", "keywords": "Multimodal large language models;speech and audio processing;music processing", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Changli Tang;Wenyi Yu;Guangzhi Sun;Xianzhao Chen;Tian Tan;Wei Li;Lu Lu;Zejun MA;Chao Zhang", "authorids": "~Changli_Tang1;~Wenyi_Yu2;~Guangzhi_Sun1;~Xianzhao_Chen1;~Tian_Tan5;~Wei_Li78;~Lu_Lu6;~Zejun_MA1;~Chao_Zhang20", "gender": "M;M;M;;M;M;M;M;M", "homepage": ";https://github.com/Yu-Doit;http://mi.eng.cam.ac.uk/\u223cgs534/;http://chenxianzhao.bytedance.com;;;;;http://mi.eng.cam.ac.uk/~cz277/", "dblp": "331/8719;;236/4543;;;;;;94/3019-31.html", "google_scholar": "RzIjbf0AAAAJ;CGqr-V8AAAAJ;PzPAzf8AAAAJ;;ukL_E5AAAAAJ;q8ZrKVIAAAAJ;IQaR2KoAAAAJ;https://scholar.google.com/citations?hl=zh-CN;https://scholar.google.co.uk/citations?view_op=list_works", "orcid": "0000-0002-2009-3078;;;;;;;;", "linkedin": ";;brian-sun-59746b12b/;;;;;zejun-ma-58614365/;", "or_profile": "~Changli_Tang1;~Wenyi_Yu2;~Guangzhi_Sun1;~Xianzhao_Chen1;~Tian_Tan5;~Wei_Li78;~Lu_Lu6;~Zejun_MA1;~Chao_Zhang20", "aff": "Tsinghua University;Tsinghua University;University of Cambridge;;;Bytedance;;ByteDance Inc.;University College London", "aff_domain": "tsinghua.edu.cn;tsinghua.edu.cn;cam.ac.uk;;;bytedance.com;;bytedance.com;ucl.ac.uk", "position": "Undergrad student;PhD student;Junior Research Fellow;;;Researcher;;Principal Researcher;Associate Professor", "bibtex": "@inproceedings{\ntang2024salmonn,\ntitle={{SALMONN}: Towards Generic Hearing Abilities for Large Language Models},\nauthor={Changli Tang and Wenyi Yu and Guangzhi Sun and Xianzhao Chen and Tian Tan and Wei Li and Lu Lu and Zejun MA and Chao Zhang},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=14rn7HpKVk}\n}", "github": "", "project": "", "reviewers": "bK7i;KyXG;RbXH", "pdf_size": 1377554, "rating": "6;6;8", "confidence": "4;4;3", "soundness": "2;3;3", "contribution": "3;2;3", "presentation": "2;3;2", "wc_summary": "71;89;35", "wc_strengths": "24;263;99", "wc_weaknesses": "155;169;199", "wc_questions": "122;9;11", "wc_review": "372;530;344", "wc_reply_reviewers": "37;122;19", "wc_reply_authors": "897;1357;618", "reply_reviewers": "1;1;1", "reply_authors": "2;2;2", "rating_avg": [ 6.666666666666667, 0.9428090415820634 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 65.0, 22.44994432064365 ], "wc_strengths_avg": [ 128.66666666666666, 99.8009129328095 ], "wc_weaknesses_avg": [ 174.33333333333334, 18.354533197248273 ], "wc_questions_avg": [ 47.333333333333336, 52.803619404565644 ], "wc_review_avg": [ 415.3333333333333, 81.88338591490272 ], "wc_reply_reviewers_avg": [ 59.333333333333336, 44.917207788948275 ], "wc_reply_authors_avg": [ 957.3333333333334, 304.69693503910116 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 2.0, 0.0 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 9, 0 ], "corr_rating_confidence": -0.9999999999999998, "gs_citation": 286, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10631342040411306525&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "openreview": 
"https://openreview.net/forum?id=14rn7HpKVk", "pdf": "https://openreview.net/pdf?id=14rn7HpKVk", "email": "tsinghua.edu.cn;tsinghua.edu.cn;cam.ac.uk;;;bytedance.com;;bytedance.com;ucl.ac.uk", "author_num": 9, "aff_unique_index": "0;0;1;2;2;3", "aff_unique_norm": "Tsinghua University;University of Cambridge;ByteDance;University College London", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.tsinghua.edu.cn;https://www.cam.ac.uk;https://www.bytedance.com;https://www.ucl.ac.uk", "aff_unique_abbr": "THU;Cambridge;Bytedance;UCL", "aff_campus_unique_index": "1", "aff_campus_unique": ";Cambridge", "aff_country_unique_index": "0;0;1;0;0;1", "aff_country_unique": "China;United Kingdom" }, { "id": "16IIkb5wYe", "title": "Fast Unsupervised Deep Outlier Model Selection with Hypernetworks", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Outlier detection (OD) has a large literature as it finds many applications in the real world. Deep neural network based OD (DOD) has seen a recent surge of attention thanks to the many advances in deep learning. In this paper, we consider a critical-yet-understudied challenge with unsupervised DOD, that is, effective hyperparameter (HP) tuning or model selection. While prior work report the sensitivity of OD models to HP choices, it is ever so critical for the modern DOD models that exhibit a long list of HPs. We introduce Hyper for HP-tuning DOD models, tackling two key challenges: (1) validation without supervision (due to lack of labeled outliers), and (2) efficient search of the HP/model space (due to exponential growth in the number of HPs). A key idea is to design and train a novel hypernetwork (HN) that maps HPs onto optimal weights of the main DOD model. In turn, Hyper capitalizes on a single HN that can dynamically generate weights for many DOD models (corresponding to varying HPs), which offers significant speed-up. In addition, it employs meta-learning on historical OD tasks with labels to train a performance estimator function, \nlikewise trained with our proposed HN efficiently. 
\nExtensive experiments on a testbed of 35 benchmark datasets show that \nHyper achieves 7\\% performance improvement and 4.2$\\times$ speed up over the latest baseline, establishing the new state-of-the-art.", "keywords": "outlier detection;model selection;automated ML;hypernetworks", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/fbbca5cc9293990ab981bf01472208de93761f3d.pdf", "author": "Xueying Ding;Yue Zhao;Leman Akoglu", "authorids": "~Xueying_Ding1;~Yue_Zhao13;~Leman_Akoglu3", "gender": "F;M;F", "homepage": ";https://viterbi-web.usc.edu/~yzhao010/;http://www.andrew.cmu.edu/user/lakoglu/", "dblp": ";48/76-16;02/6979.html", "google_scholar": "U9CMsh0AAAAJ;https://scholar.google.ca/citations?user=zoGDYsoAAAAJ;4ITkr_kAAAAJ", "orcid": ";0000-0003-3401-4921;", "linkedin": ";yzhao062/;", "or_profile": "~Xueying_Ding1;~Yue_Zhao13;~Leman_Akoglu3", "aff": "Carnegie Mellon University;University of Southern California;Carnegie Mellon University", "aff_domain": "cmu.edu;usc.edu;cmu.edu", "position": "PhD student;Assistant Professor;Associate Professor", "bibtex": "@misc{\nding2024fast,\ntitle={Fast Unsupervised Deep Outlier Model Selection with Hypernetworks},\nauthor={Xueying Ding and Yue Zhao and Leman Akoglu},\nyear={2024},\nurl={https://openreview.net/forum?id=16IIkb5wYe}\n}", "github": "", "project": "", "reviewers": "LDgS;izNE;Th7t;7fKL;2NEK", "site": "https://openreview.net/forum?id=16IIkb5wYe", "pdf_size": 4765059, "rating": "3;3;5;5;5", "confidence": "3;4;3;3;3", "soundness": "2;2;2;2;2", "contribution": "2;2;2;3;2", "presentation": "1;1;2;2;3", "wc_summary": "68;134;148;30;156", "wc_strengths": "16;33;68;13;125", "wc_weaknesses": "145;279;96;132;159", "wc_questions": "5;56;107;41;90", "wc_review": "234;502;419;216;530", "wc_reply_reviewers": "0;0;0;0;0", "wc_reply_authors": "0;0;0;0;0", "reply_reviewers": "0;0;0;0;0", "reply_authors": "0;0;0;0;0", "rating_avg": [ 4.2, 0.9797958971132712 ], "confidence_avg": [ 3.2, 0.39999999999999997 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 2.2, 0.39999999999999997 ], "presentation_avg": [ 1.8, 0.7483314773547883 ], "wc_summary_avg": [ 107.2, 49.51928917098871 ], "wc_strengths_avg": [ 51.0, 41.85212061532844 ], "wc_weaknesses_avg": [ 162.2, 62.036763294033975 ], "wc_questions_avg": [ 59.8, 36.085454133209964 ], "wc_review_avg": [ 380.2, 131.99757573531417 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.6123724356957947, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12491906036932999309&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 6, "aff_unique_index": "0;1;0", "aff_unique_norm": "Carnegie Mellon University;University of Southern California", "aff_unique_dep": ";", "aff_unique_url": "https://www.cmu.edu;https://www.usc.edu", "aff_unique_abbr": "CMU;USC", "aff_campus_unique_index": "1", "aff_campus_unique": ";Los Angeles", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "16VfAw1fs5", "title": "A Conservative Image Boundary Extraction Method with Application to the ILM Tumor Surgery", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "While infant lymphatic malformation tumors are benign, they are very difficult to remove. The removal process is very delicate and requires the retention of as much healthy tissue as possible. 
Commonly utilized boundary extraction methods aim to extract boundaries covering the vast majority of the target area which remove more healthy tissue than is desirable. This paper presents a conservative image boundary extraction (CIBE) approach with well-designed iterative boundary shrinkage procedures which are applied to computerized tomography (CT) images for use in ILM tumor resection operations. CIBE incorporates three primary concepts: Fuzzy Degree, Pixel Deepness and Boundary Smoothness. The proposed algorithm first converts the marked CT image into a 0-1 image matrix. Then it shrinks the boundary according to the estimated PD and BS indices for the image in an iterative fashion until the boundary smoothness meets the desired level. Empirical analysis demonstrates that the smooth, conservative tumor boundaries are obtained using the CIBE algorithm. The proposed method can also be easily extended to the three dimensional studies.", "keywords": "Conservative Boundary Extraction;Infant Lymphatic Malformations Tumor;Unsupervised Learning", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Zhenguo Gao;Longqin Lai", "authorids": "~Zhenguo_Gao1;~Longqin_Lai1", "gender": "M;M", "homepage": "https://math.sjtu.edu.cn/Default/teachershow/tags/MDAwMDAwMDAwMLJ4nJg;", "dblp": ";", "google_scholar": ";", "orcid": ";0009-0007-5309-429X", "linkedin": ";", "or_profile": "~Zhenguo_Gao1;~Longqin_Lai1", "aff": "Shanghai Jiaotong University;School of Mathematical Sciences, Shanghai Jiao Tong University", "aff_domain": "sjtu.edu.cn;math.sjtu.edu.cn", "position": "Associate Professor;PhD student", "bibtex": "@misc{\ngao2024a,\ntitle={A Conservative Image Boundary Extraction Method with Application to the {ILM} Tumor Surgery},\nauthor={Zhenguo Gao and Longqin Lai},\nyear={2024},\nurl={https://openreview.net/forum?id=16VfAw1fs5}\n}", "github": "", "project": "", "reviewers": "v2GP;bXZY;4CWF", "site": "https://openreview.net/forum?id=16VfAw1fs5", "pdf_size": 6971717, "rating": "1;3;3", "confidence": "4;4;4", "soundness": "1;1;2", "contribution": "1;1;1", "presentation": "2;2;2", "wc_summary": "56;81;54", "wc_strengths": "24;24;9", "wc_weaknesses": "101;145;41", "wc_questions": "60;1;40", "wc_review": "241;251;144", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 2.3333333333333335, 0.9428090415820634 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 1.3333333333333333, 0.4714045207910317 ], "contribution_avg": [ 1.0, 0.0 ], "presentation_avg": [ 2.0, 0.0 ], "wc_summary_avg": [ 63.666666666666664, 12.283683848458853 ], "wc_strengths_avg": [ 19.0, 7.0710678118654755 ], "wc_weaknesses_avg": [ 95.66666666666667, 42.62497963505541 ], "wc_questions_avg": [ 33.666666666666664, 24.499433100017278 ], "wc_review_avg": [ 212.0, 48.25626038833372 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 3, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:486a-LKhKJkJ:scholar.google.com/&scioq=A+Conservative+Image+Boundary+Extraction+Method+with+Application+to+the+ILM+Tumor+Surgery&hl=en&as_sdt=0,44", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "Shanghai Jiao Tong University", "aff_unique_dep": "", "aff_unique_url": 
"https://www.sjtu.edu.cn", "aff_unique_abbr": "SJTU", "aff_campus_unique_index": "1", "aff_campus_unique": ";Shanghai", "aff_country_unique_index": "0;0", "aff_country_unique": "China" }, { "id": "17BA0Tl2Id", "title": "Meta-Referential Games to Learn Compositional Learning Behaviours", "track": "main", "status": "Reject", "tldr": "", "abstract": "Human beings use compositionality to generalise from past experiences to novel experiences. We assume a separation of our experiences into fundamental atomic components that can be recombined in novel ways to support our ability to engage with novel experiences. We frame this as the ability to learn to generalise compositionally, and we will refer to behaviours making use of this ability as compositional learning behaviours (CLBs).\n\nA central problem to learning CLBs is the resolution of a binding problem (BP). While it is another feat of intelligence that human beings perform with ease, it is not the case for state-of-the-art artificial agents. Thus, in order to build artificial agents able to collaborate with human beings, we propose to develop a novel benchmark to investigate agents\u2019 abilities to exhibit CLBs by solving a domain-agnostic version of the BP.\n\nWe take inspiration from the language emergence and grounding framework of referential games and propose a meta-learning extension of referential games, entitled Meta-Referential Games, and use this framework to build our benchmark, that we name Symbolic Behaviour Benchmark (S2B). We provide baseline results and error analysis showing that our benchmark is a compelling challenge that we hope will spur the research community towards developing more capable artificial agents.", "keywords": "referential game;language grounding;compositionality;systematicity;few-shot learning;meta-learning;reinforcement learning;language emergence", "primary_area": "datasets and benchmarks", "supplementary_material": "/attachment/0131a7b6feeecb88078bab93dc5c0fce351c17a4.zip", "author": "Kevin Yandoka Denamganai;Sondess Missaoui;James Alfred Walker", "authorids": "~Kevin_Yandoka_Denamganai1;~Sondess_Missaoui1;~James_Alfred_Walker1", "gender": "M;F;M", "homepage": "https://kevindenamganai.netlify.app/;https://digitalcreativity.ac.uk/people/dr-sondess-missaoui;", "dblp": "249/7680;143/1419.html;35/3889", "google_scholar": "PPdQb4QAAAAJ;K2yUNQIAAAAJ;https://scholar.google.co.uk/citations?user=Yl5OycsAAAAJ", "orcid": "0000-0002-8776-4331;;", "linkedin": ";sondess-missaoui-03583531/;", "or_profile": "~Kevin_Yandoka_Denamganai1;~Sondess_Missaoui1;~James_Alfred_Walker1", "aff": "University of York;University of York;University of York", "aff_domain": "york.ac.uk;york.ac.uk;york.ac.uk", "position": "PhD student;Researcher;Associate Professor", "bibtex": "@misc{\ndenamganai2024metareferential,\ntitle={Meta-Referential Games to Learn Compositional Learning Behaviours},\nauthor={Kevin Yandoka Denamganai and Sondess Missaoui and James Alfred Walker},\nyear={2024},\nurl={https://openreview.net/forum?id=17BA0Tl2Id}\n}", "github": "", "project": "", "reviewers": "qdfE;3drE;CPjL;Hoy7", "site": "https://openreview.net/forum?id=17BA0Tl2Id", "pdf_size": 1553270, "rating": "5;5;6;6", "confidence": "2;2;3;3", "soundness": "3;2;3;2", "contribution": "2;3;3;3", "presentation": "3;2;2;2", "wc_summary": "62;23;80;94", "wc_strengths": "45;36;64;80", "wc_weaknesses": "180;189;729;265", "wc_questions": "40;4;648;516", "wc_review": "327;252;1521;955", "wc_reply_reviewers": "262;96;62;222", "wc_reply_authors": "1906;1740;2370;1823", 
"reply_reviewers": "1;1;1;1", "reply_authors": "5;4;4;5", "rating_avg": [ 5.5, 0.5 ], "confidence_avg": [ 2.5, 0.5 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 64.75, 26.639960585556427 ], "wc_strengths_avg": [ 56.25, 17.03489066592445 ], "wc_weaknesses_avg": [ 340.75, 226.57490483281683 ], "wc_questions_avg": [ 302.0, 284.147848839297 ], "wc_review_avg": [ 763.75, 515.422823999869 ], "wc_reply_reviewers_avg": [ 160.5, 83.58678125158308 ], "wc_reply_authors_avg": [ 1959.75, 244.02087513161655 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 4.5, 0.5 ], "replies_avg": [ 28, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 1.0, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=3952989524077152401&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 6, "aff_unique_index": "0;0;0", "aff_unique_norm": "University of York", "aff_unique_dep": "", "aff_unique_url": "https://www.york.ac.uk", "aff_unique_abbr": "York", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United Kingdom" }, { "id": "17ZbByq95E", "title": "Memory-Efficient Backpropagation through Large Linear Layers", "track": "main", "status": "Reject", "tldr": "", "abstract": "In modern neural networks like Transformers, linear layers require significant memory to store activations during backward pass. This study proposes a memory reduction approach to perform backpropagation through linear layers. Since the gradients of linear layers are computed by matrix multiplications, we consider methods for randomized matrix multiplications and demonstrate that they require less memory with a moderate decrease of the test accuracy. Also, we investigate the variance of the gradient estimate induced by the randomized matrix multiplication. We compare this variance with the variance coming from gradient estimation based on the batch of samples. 
We demonstrate the benefits of the proposed method on the fine-tuning of the pretrained RoBERTa model on GLUE tasks.", "keywords": "transformers;large language models;randomized matmul;approximate matmul;memory-efficient training", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/9dbbb74c329dd95f11ba34177f2216105b5b7795.pdf", "author": "Daniel Bershatsky;Aleksandr Mikhalev;Aleksandr Katrutsa;Julia Gusak;Daniil Merkulov;Ivan Oseledets", "authorids": "~Daniel_Bershatsky1;~Aleksandr_Mikhalev1;~Aleksandr_Katrutsa1;~Julia_Gusak1;~Daniil_Merkulov1;~Ivan_Oseledets1", "gender": "M;;;F;;M", "homepage": "https://github.com/daskol;https://faculty.skoltech.ru/people/almikhalev;;https://juliagusak.github.io/about/;;http://oseledets.github.io", "dblp": ";;;179/6722;;56/7175", "google_scholar": "XthC2z8AAAAJ;https://scholar.google.com/citations?hl=ru;;QriHoq4AAAAJ;;https://scholar.google.ru/citations?user=5kMqBQEAAAAJ", "orcid": "0000-0001-8917-8187;0000-0002-9274-7237;;;;", "linkedin": ";;;julia-gusak-0b265688/;;", "or_profile": "~Daniel_Bershatsky1;~Aleksandr_Mikhalev1;~Aleksandr_Katrutsa1;~Julia_Gusak1;~Daniil_Merkulov1;~Ivan_Oseledets1", "aff": "Skolkovo Institute of Science and Technology;Skolkovo Institute of Science and Technology;;INRIA;;Institute of Numerical Mathematics", "aff_domain": "skoltech.ru;skoltech.ru;;inria.fr;;inm.ras.ru", "position": "PhD student;Assistant Professor;;Researcher;;Researcher", "bibtex": "@misc{\nbershatsky2024memoryefficient,\ntitle={Memory-Efficient Backpropagation through Large Linear Layers},\nauthor={Daniel Bershatsky and Aleksandr Mikhalev and Aleksandr Katrutsa and Julia Gusak and Daniil Merkulov and Ivan Oseledets},\nyear={2024},\nurl={https://openreview.net/forum?id=17ZbByq95E}\n}", "github": "", "project": "", "reviewers": "JVog;k3XT;aWYY;fccg", "site": "https://openreview.net/forum?id=17ZbByq95E", "pdf_size": 474137, "rating": "3;3;3;6", "confidence": "5;3;4;4", "soundness": "3;2;2;3", "contribution": "2;1;2;2", "presentation": "2;2;3;3", "wc_summary": "24;20;144;114", "wc_strengths": "30;42;34;40", "wc_weaknesses": "163;279;272;129", "wc_questions": "253;201;33;97", "wc_review": "470;542;483;380", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "333;283;187;215", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 3.75, 1.299038105676658 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 75.5, 54.559600438419636 ], "wc_strengths_avg": [ 36.5, 4.769696007084728 ], "wc_weaknesses_avg": [ 210.75, 65.902864125924 ], "wc_questions_avg": [ 146.0, 86.08716512930368 ], "wc_review_avg": [ 468.75, 57.98006122797733 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 254.5, 57.207953992430106 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 10, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 6, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=4859682723757387504&as_sdt=5,31&sciodt=0,31&hl=en", "gs_version_total": 4, "aff_unique_index": "0;0;1;2", "aff_unique_norm": "Skolkovo Institute of Science and Technology;INRIA;Institute of Numerical Mathematics", "aff_unique_dep": ";;", "aff_unique_url": "https://www.skoltech.ru;https://www.inria.fr;", "aff_unique_abbr": "Skoltech;INRIA;", "aff_campus_unique_index": "", "aff_campus_unique": "", 
"aff_country_unique_index": "0;0;1", "aff_country_unique": "Russian Federation;France;" }, { "title": "Tensor Programs VI: Feature Learning in Infinite Depth Neural Networks", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19599", "id": "17pVDnpwwl", "author_site": "Greg Yang, Dingli Yu, Chen Zhu, Soufiane Hayou", "tldr": "", "abstract": "Empirical studies have consistently demonstrated that increasing the size of neural networks often yields superior performance in practical applications. However, there is a lack of consensus regarding the appropriate scaling strategy, particularly when it comes to increasing the depth of neural networks. In practice, excessively large depths can lead to model performance degradation. In this paper, we introduce Depth-$\\mu$P, a principled approach for depth scaling, allowing for the training of arbitrarily deep architectures while maximizing feature learning and diversity among nearby layers. Our method involves dividing the contribution of each residual block and the parameter update by the square root of the depth. Through the use of Tensor Programs, we rigorously establish the existence of a limit for infinitely deep neural networks under the proposed scaling scheme. This scaling strategy ensures more stable training for deep neural networks and guarantees the transferability of hyperparameters from shallow to deep models. To substantiate the efficacy of our scaling method, we conduct empirical validation on neural networks with depths up to $2^{10}$.", "keywords": "Tensor Programs;mup;deep learning;optimization;optimal hyperparameter transfer", "primary_area": "optimization", "supplementary_material": "", "author": "Greg Yang;Dingli Yu;Chen Zhu;Soufiane Hayou", "authorids": "~Greg_Yang1;~Dingli_Yu1;~Chen_Zhu2;~Soufiane_Hayou1", "gender": "M;;M;M", "homepage": ";https://dingliyu.net/;http://www.cs.umd.edu/~chenzhu/;https://www.soufianehayou.com/", "dblp": "153/2097;39/578;59/10522-1.html;220/5617", "google_scholar": "Xz4RAJkAAAAJ;KJLJstYAAAAJ;m-om5O8AAAAJ;https://scholar.google.com/citations?hl=en", "orcid": ";0000-0002-8824-8611;;", "linkedin": ";;;", "or_profile": "~Greg_Yang1;~Dingli_Yu1;~Chen_Zhu2;~Soufiane_Hayou1", "aff": ";Princeton University;NVIDIA;National University of Singapore", "aff_domain": ";princeton.edu;nvidia.com;nus.edu.sg", "position": ";PhD student;Research Scientist;Assistant Professor", "bibtex": "@inproceedings{\nyang2024tensor,\ntitle={Tensor Programs {VI}: Feature Learning in Infinite Depth Neural Networks},\nauthor={Greg Yang and Dingli Yu and Chen Zhu and Soufiane Hayou},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=17pVDnpwwl}\n}", "github": "", "project": "", "reviewers": "f9Ax;Mvpr;5jxB;TGji;AGJB", "pdf_size": 2831781, "rating": "5;6;8;8;8", "confidence": "3;4;4;4;4", "soundness": "2;4;2;4;3", "contribution": "2;3;4;3;4", "presentation": "3;3;3;4;3", "wc_summary": "80;113;164;37;103", "wc_strengths": "80;72;194;30;65", "wc_weaknesses": "150;227;440;96;2", "wc_questions": "74;669;188;2;397", "wc_review": "384;1081;986;165;567", "wc_reply_reviewers": "0;300;298;0;0", "wc_reply_authors": "564;1106;1065;327;747", "reply_reviewers": "0;1;2;0;0", "reply_authors": "2;4;2;1;1", "rating_avg": [ 7.0, 1.2649110640673518 ], "confidence_avg": [ 3.8, 0.39999999999999997 ], "soundness_avg": [ 3.0, 0.8944271909999159 ], "contribution_avg": [ 3.2, 0.7483314773547882 ], "presentation_avg": [ 3.2, 0.39999999999999997 ], 
"wc_summary_avg": [ 99.4, 41.572106032771536 ], "wc_strengths_avg": [ 88.2, 55.58560964854123 ], "wc_weaknesses_avg": [ 183.0, 147.92160085667 ], "wc_questions_avg": [ 266.0, 241.7494570831546 ], "wc_review_avg": [ 636.6, 349.4650769390269 ], "wc_reply_reviewers_avg": [ 119.6, 146.48085199096843 ], "wc_reply_authors_avg": [ 761.8, 296.242738307625 ], "reply_reviewers_avg": [ 0.6, 0.7999999999999999 ], "reply_authors_avg": [ 2.0, 1.0954451150103321 ], "replies_avg": [ 21, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.7905694150420949, "gs_citation": 45, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6365974675006259933&as_sdt=80000005&sciodt=0,23&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=17pVDnpwwl", "pdf": "https://openreview.net/pdf?id=17pVDnpwwl", "email": ";princeton.edu;nvidia.com;nus.edu.sg", "author_num": 4, "aff_unique_index": "0;1;2", "aff_unique_norm": "Princeton University;NVIDIA;National University of Singapore", "aff_unique_dep": ";NVIDIA Corporation;", "aff_unique_url": "https://www.princeton.edu;https://www.nvidia.com;https://www.nus.edu.sg", "aff_unique_abbr": "Princeton;NVIDIA;NUS", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;1", "aff_country_unique": "United States;Singapore" }, { "id": "18TezdB9nk", "title": "Deep Neural Room Acoustics Primitive", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Modeling room acoustics encompasses characterizing the sound propagation dynamics in enclosed 3D spaces and is useful in a variety of settings, including audio-visual simulations, embodied sound source localization, etc. Such dynamics are usually represented using one-dimensional room impulse responses (RIR). However, accurately estimating an RIR is often challenging as sound waves undergo reflections, diffraction, absorption, and scattering along the propagation path. In this paper, we propose a deep learning framework to learn a continuous room acoustic field, dubbed Deep Neural Room Acoustic Primitive (DeepNeRAP), capturing all sound propagation properties in a self-supervised manner; our framework allows the characterization of sound propagation from any source position to any receiver position. Our key idea is to allow two cooperative audio agents to actively probe the 3D space, one emitting and the other receiving sounds at varied positions -- analyzing these emitted and received sounds within our neural framework enables inversely characterizing the room scene acoustically. Our learning formulation is grounded in the physical principles of sound wave propagation, including the properties of globality, reciprocity, superposition, and independence. 
We present experiments on both synthetic and real-world datasets, demonstrating superior quality of our RIR estimation against closely related methods.", "keywords": "audio rendering;neural room impulse response;spatial audio;neural audio rendering", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/b8ab1fd7eedba45527e94b894d00d8721e207342.pdf", "author": "Yuhang He;Anoop Cherian;Gordon Wichern;Andrew Markham", "authorids": "~Yuhang_He3;~Anoop_Cherian1;~Gordon_Wichern1;~Andrew_Markham2", "gender": "M;;M;M", "homepage": "https://yuhanghe01.github.io/;;;http://users.cecs.anu.edu.au/~cherian/", "dblp": ";72/6049;83/7169;44/7734", "google_scholar": "H1p3ve8AAAAJ;;https://scholar.google.co.uk/citations?user=g3JTO9EAAAAJ;https://scholar.google.com.au/citations?hl=en", "orcid": ";;;0000-0002-5566-0351", "linkedin": ";;;anoop-cherian-4678a04/", "or_profile": "~Yuhang_He3;~Gordon_Wichern1;~Andrew_Markham2;~Anoop_Cherian2", "aff": "University of Oxford;Mitsubishi Electric Research Labs;University of Oxford;Mitsubishi Electric Research Labs", "aff_domain": "ox.ac.uk;merl.com;ox.ac.uk;merl.com", "position": "PhD student;Principal Research Scientist;Associate Professor;Principal Researcher", "bibtex": "@misc{\nhe2024deep,\ntitle={Deep Neural Room Acoustics Primitive},\nauthor={Yuhang He and Anoop Cherian and Gordon Wichern and Andrew Markham},\nyear={2024},\nurl={https://openreview.net/forum?id=18TezdB9nk}\n}", "github": "", "project": "", "reviewers": "CGe5;MG9M;EjEe;HBj4", "site": "https://openreview.net/forum?id=18TezdB9nk", "pdf_size": 13375, "rating": "3;3;5;6", "confidence": "5;3;3;5", "soundness": "2;1;4;3", "contribution": "3;1;2;2", "presentation": "4;1;4;3", "wc_summary": "69;28;70;132", "wc_strengths": "100;21;117;69", "wc_weaknesses": "390;216;305;116", "wc_questions": "47;147;33;11", "wc_review": "606;412;525;328", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.25, 1.299038105676658 ], "confidence_avg": [ 4.0, 1.0 ], "soundness_avg": [ 2.5, 1.118033988749895 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 3.0, 1.224744871391589 ], "wc_summary_avg": [ 74.75, 37.14414489525907 ], "wc_strengths_avg": [ 76.75, 36.49914382557487 ], "wc_weaknesses_avg": [ 256.75, 101.9249110865445 ], "wc_questions_avg": [ 59.5, 52.12245197609184 ], "wc_review_avg": [ 467.75, 106.09989396790178 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.19245008972987526, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10633725098285414080&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 9, "aff_unique_index": "0;1;0;1", "aff_unique_norm": "University of Oxford;Mitsubishi Electric Research Laboratories", "aff_unique_dep": ";", "aff_unique_url": "https://www.ox.ac.uk;https://www.merl.com", "aff_unique_abbr": "Oxford;MERL", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;0;1", "aff_country_unique": "United Kingdom;United States" }, { "id": "18TfucMNTr", "title": "Accelerated Deep Learning by Gaussian Continuation", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Prior work has shown that incorporating noise into the process of training deep neural networks reduces 
the risks of getting stuck in local minima, overfitting to the training data, and being limited by poor initialization. In this work we consider noisy training as a special case of optimization by continuation, also known as graduated non-convexity, where a convex version of the objective function is solved first and slowly morphed into the original non-convex function. When using continuation in machine learning problems, we show that saddle points require special consideration, as they may get the optimizer stuck in local minima. With a form of regularization applied to the continuation optimizer, we show on several test problems that this approach reduces the risk of being trapped in local minima, leading to better training for very deep architectures and non-convex loss functions.", "keywords": "homotopy;continuation;optimization;deep learning", "primary_area": "optimization", "supplementary_material": "/attachment/c01b7419ade3037ce34017820a01661f89c07dab.zip", "author": "Andrew Francesco Ilersich;Prasanth B. Nair", "authorids": "~Andrew_Francesco_Ilersich1;~Prasanth_B._Nair1", "gender": ";M", "homepage": ";http://arrow.utias.utoronto.ca/~pbn/index.html", "dblp": ";n/PrasanthBNair", "google_scholar": "C3T92DQAAAAJ;6MXRhVIAAAAJ", "orcid": "0009-0004-5369-5464;", "linkedin": "andrewilersich/;", "or_profile": "~Andrew_Francesco_Ilersich1;~Prasanth_B._Nair1", "aff": "University of Toronto;Toronto University", "aff_domain": "utoronto.ca;utoronto.ca", "position": "PhD student;Full Professor", "bibtex": "@misc{\nilersich2024accelerated,\ntitle={Accelerated Deep Learning by Gaussian Continuation},\nauthor={Andrew Francesco Ilersich and Prasanth B. Nair},\nyear={2024},\nurl={https://openreview.net/forum?id=18TfucMNTr}\n}", "github": "", "project": "", "reviewers": "MQoK;xWFa;jwZM;EAjK", "site": "https://openreview.net/forum?id=18TfucMNTr", "pdf_size": 3873401, "rating": "3;3;3;5", "confidence": "3;4;4;3", "soundness": "1;3;3;2", "contribution": "2;1;1;3", "presentation": "3;1;3;2", "wc_summary": "218;25;110;26", "wc_strengths": "22;30;34;68", "wc_weaknesses": "145;1326;331;875", "wc_questions": "165;4;35;12", "wc_review": "550;1385;510;981", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 3.5, 0.8660254037844386 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.25, 0.82915619758885 ], "contribution_avg": [ 1.75, 0.82915619758885 ], "presentation_avg": [ 2.25, 0.82915619758885 ], "wc_summary_avg": [ 94.75, 79.08025986300247 ], "wc_strengths_avg": [ 38.5, 17.57128339080558 ], "wc_weaknesses_avg": [ 669.25, 464.46333278311647 ], "wc_questions_avg": [ 54.0, 65.08840142452416 ], "wc_review_avg": [ 856.5, 356.6570481569094 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:wkLL2HyBaz8J:scholar.google.com/&scioq=Accelerated+Deep+Learning+by+Gaussian+Continuation&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "University of Toronto", "aff_unique_dep": "", "aff_unique_url": "https://www.utoronto.ca", "aff_unique_abbr": "U of T", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "Canada" }, { "id": "1AXvGjfF0V", "title": "Evaluating 
Hallucinations in Chinese Large Language Models", "track": "main", "status": "Reject", "tldr": "", "abstract": "In this paper, we establish a benchmark named HalluQA (Chinese Hallucination Question-Answering) to measure the hallucination phenomenon in Chinese large language models. \nHalluQA contains 450 meticulously designed adversarial questions, spanning multiple domains, and takes into account Chinese historical culture, customs, and social phenomena. \nDuring the construction of HalluQA, we consider two types of hallucinations: imitative falsehoods and factual errors, and we construct adversarial samples based on GLM-130B and ChatGPT.\nFor evaluation, we design an automated evaluation method using GPT-4 to judge whether a model output is hallucinated.\nWe conduct extensive experiments on 24 large language models, including ERNIE-Bot, Baichuan2, ChatGLM, Qwen, SparkDesk and etc. \nOut of the 24 models, 18 achieved non-hallucination rates lower than 50\\%. \nThis indicates that HalluQA is highly challenging.\nWe analyze the primary types of hallucinations in different types of models and their causes. Additionally, we discuss which types of hallucinations should be prioritized for different types of models.", "keywords": "Hallucinations evaluation;Chinese;Large Language Models;Dataset & Benchmark", "primary_area": "datasets and benchmarks", "supplementary_material": "", "author": "Qinyuan Cheng;Tianxiang Sun;Wenwei Zhang;Siyin Wang;Xiangyang Liu;Mozhi Zhang;Junliang He;Mianqiu Huang;Zhangyue Yin;Kai Chen;Xipeng Qiu", "authorids": "~Qinyuan_Cheng1;~Tianxiang_Sun1;~Wenwei_Zhang1;~Siyin_Wang1;~Xiangyang_Liu3;~Mozhi_Zhang2;~Junliang_He2;~Mianqiu_Huang1;~Zhangyue_Yin1;~Kai_Chen4;~Xipeng_Qiu1", "gender": "M;M;M;M;M;M;M;M;M;M;M", "homepage": "https://xiami2019.github.io/;https://txsun1997.github.io/;https://zhangwenwei.cn;https://sinwang20.github.io/;;https://github.com/Zhang-Mozhi;https://luther-sparks.github.io/;https://yinzhangyue.github.io/;https://chenkai.site/;https://xpqiu.github.io/;https://jlhe.github.io", "dblp": "331/9838;254/1189;;326/8437;;;;314/5418;181/2839-26;69/1395;", "google_scholar": "nu_iPXAAAAAJ;puHFkM0AAAAJ;QDXADSEAAAAJ;wllp6o0AAAAJ;https://scholar.google.com.hk/citations?user=U8QD9mwAAAAJ;TPR5JREAAAAJ;;9gRQqSkAAAAJ;https://scholar.google.com.hk/citations?user=eGD0b7IAAAAJ;Pq4Yp_kAAAAJ;KhHpD54AAAAJ", "orcid": ";;0000-0002-2748-4514;;;;;;0000-0002-6820-2325;0000-0001-7163-5247;", "linkedin": "https://www.linkedin.cn/injobs/in/qinyuan-cheng-5168951ab;;wenweizhang-b9769a124/;;;;;zhangyue-yin-083286288/;;;", "or_profile": "~Qinyuan_Cheng1;~Tianxiang_Sun1;~Wenwei_Zhang1;~Siyin_Wang1;~Xiangyang_Liu3;~Mozhi_Zhang2;~Mianqiu_Huang1;~Zhangyue_Yin1;~Kai_Chen4;~Xipeng_Qiu1;~JunLiang_He1", "aff": "Fudan University;Fudan University;Shanghai AI Laboratory;Fudan University;Fudan University;Fudan University;Fudan University;Fudan University;Shanghai AI Laboratory;Fudan University;Fudan University", "aff_domain": "fudan.edu.cn;fudan.edu;pjlab.org.cn;fudan.edu.cn;fudan.edu.cn;fudan.edu.cn;fudan.edu.cn;fudan.edu.cn;pjlab.org.cn;fudan.edu.cn;fudan.edu.cn", "position": "PhD student;PhD student;Researcher;Undergrad student;PhD student;MS student;MS student;PhD student;Researcher;Full Professor;MS student", "bibtex": "@misc{\ncheng2024evaluating,\ntitle={Evaluating Hallucinations in Chinese Large Language Models},\nauthor={Qinyuan Cheng and Tianxiang Sun and Wenwei Zhang and Siyin Wang and Xiangyang Liu and Mozhi Zhang and Junliang He and Mianqiu Huang and Zhangyue Yin and Kai Chen and Xipeng 
Qiu},\nyear={2024},\nurl={https://openreview.net/forum?id=1AXvGjfF0V}\n}", "github": "", "project": "", "reviewers": "svpT;DCpV;fQ9L", "site": "https://openreview.net/forum?id=1AXvGjfF0V", "pdf_size": 1157443, "rating": "5;5;6", "confidence": "4;3;3", "soundness": "2;2;3", "contribution": "3;2;3", "presentation": "3;3;3", "wc_summary": "72;76;81", "wc_strengths": "68;12;45", "wc_weaknesses": "168;50;17", "wc_questions": "13;61;29", "wc_review": "321;199;172", "wc_reply_reviewers": "65;0;0", "wc_reply_authors": "1038;858;421", "reply_reviewers": "1;0;0", "reply_authors": "3;3;1", "rating_avg": [ 5.333333333333333, 0.4714045207910317 ], "confidence_avg": [ 3.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 76.33333333333333, 3.681787005729087 ], "wc_strengths_avg": [ 41.666666666666664, 22.983085567917602 ], "wc_weaknesses_avg": [ 78.33333333333333, 64.81940724470994 ], "wc_questions_avg": [ 34.333333333333336, 19.955506062794353 ], "wc_review_avg": [ 230.66666666666666, 64.81940724470994 ], "wc_reply_reviewers_avg": [ 21.666666666666668, 30.641293851417057 ], "wc_reply_authors_avg": [ 772.3333333333334, 259.0705609588931 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 2.3333333333333335, 0.9428090415820634 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 11, 0 ], "corr_rating_confidence": -0.4999999999999999, "gs_citation": 54, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10748152223918110433&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "aff_unique_index": "0;0;1;0;0;0;0;0;1;0;0", "aff_unique_norm": "Fudan University;Shanghai AI Laboratory", "aff_unique_dep": ";", "aff_unique_url": "https://www.fudan.edu.cn;https://www.shanghai-ai-lab.com", "aff_unique_abbr": "Fudan;SAIL", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0;0;0;0;0;0", "aff_country_unique": "China" }, { "id": "1Akd36hG9z", "title": "Enhancing Offline Reinforcement Learning with an Optimal Supported Dataset", "track": "main", "status": "Reject", "tldr": "", "abstract": "Offline Reinforcement Learning (Offline RL) is challenged by distributional shift and value overestimation, which often leads to poor performance. To address this issue, a popular class of methods use behavior regularization to constrain the learned policy to stay close to the behavior policy. However, this approach can be too limiting when the behavior policy is suboptimal. To overcome this limitation, we propose to conduct behavior regularization directly on an optimal supported dataset, which can both ensure that the learned policy is not too far removed from the dataset, and reduce any potential bias towards the optimization objective. We introduce \\textit{\\textbf{O}ptimal \\textbf{S}upported \\textbf{D}ataset generation via Stationary \\textbf{DI}stribution \\textbf{C}orrection \\textbf{E}stimation} (OSD-DICE) to generate such a dataset. OSD-DICE is based on the primal-dual formulation of linear programming for RL. It uses a single minimization objective to avoid poor convergence issues often associated with this formulation, and incorporates two key designs to ensure polynomial sample complexity under general function approximation and single-policy concentrability. 
After generating the near-optimal supported dataset, we instantiate our framework by two representative behavior regularization-based methods and show safe policy improvement over the near-optimal supported policy. Empirical results validate the efficacy of OSD-DICE on tabular tasks and demonstrate remarkable performance gains of the proposed framework on D4RL benchmarks.", "keywords": "Offline reinforcement learning", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/db826e1f0ef94b970fc5330553b55cdd2b084aec.zip", "author": "Chen Chen;Zhaoyi Xu;Yixiu Mao;Hongchang Zhang;Xiangyang Ji", "authorids": "~Chen_Chen3;~Zhaoyi_Xu1;~Yixiu_Mao2;~Hongchang_Zhang1;~Xiangyang_Ji1", "gender": "F;M;M;M;", "homepage": ";https://github.com/XuZhaoyi;;;", "dblp": ";;280/1045;https://dblp.uni-trier.de/pid/36/9348;", "google_scholar": "l8_g4oAAAAAJ;;;;", "orcid": ";;0009-0000-7302-5039;;", "linkedin": ";;;;", "or_profile": "~Chen_Chen3;~Zhaoyi_Xu1;~Yixiu_Mao2;~Hongchang_Zhang1;~Xiangyang_Ji1", "aff": "Qiyuan Lab;Tsinghua University;Tsinghua University;Tsinghua University;", "aff_domain": "qiyuanlab.com;tsinghua.edu.cn;mails.tsinghua.edu.cn;tsinghua.edu.cn;", "position": "Researcher;PhD student;PhD student;PhD student;", "bibtex": "@misc{\nchen2024enhancing,\ntitle={Enhancing Offline Reinforcement Learning with an Optimal Supported Dataset},\nauthor={Chen Chen and Zhaoyi Xu and Yixiu Mao and Hongchang Zhang and Xiangyang Ji},\nyear={2024},\nurl={https://openreview.net/forum?id=1Akd36hG9z}\n}", "github": "", "project": "", "reviewers": "ZUfb;MfcJ;NpVF;v4Ur;yzkc;tQGo", "site": "https://openreview.net/forum?id=1Akd36hG9z", "pdf_size": 7062385, "rating": "3;5;5;5;6;8", "confidence": "2;4;3;3;4;2", "soundness": "2;2;3;2;3;3", "contribution": "2;3;2;2;2;3", "presentation": "2;1;3;3;2;2", "wc_summary": "32;170;80;102;76;146", "wc_strengths": "25;44;27;20;36;68", "wc_weaknesses": "181;172;83;345;113;35", "wc_questions": "2;64;105;65;119;1", "wc_review": "240;450;295;532;344;250", "wc_reply_reviewers": "0;21;0;36;0;0", "wc_reply_authors": "635;366;899;695;706;78", "reply_reviewers": "0;1;0;1;0;0", "reply_authors": "1;1;2;1;1;1", "rating_avg": [ 5.333333333333333, 1.4907119849998596 ], "confidence_avg": [ 3.0, 0.816496580927726 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.1666666666666665, 0.6871842709362768 ], "wc_summary_avg": [ 101.0, 45.85120863546929 ], "wc_strengths_avg": [ 36.666666666666664, 16.038148964959213 ], "wc_weaknesses_avg": [ 154.83333333333334, 98.66849660465199 ], "wc_questions_avg": [ 59.333333333333336, 45.441048501205266 ], "wc_review_avg": [ 351.8333333333333, 106.66523436538367 ], "wc_reply_reviewers_avg": [ 9.5, 14.115594213493104 ], "wc_reply_authors_avg": [ 563.1666666666666, 267.70220810113284 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 1.1666666666666667, 0.3726779962499649 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:jC-jyYAVqRIJ:scholar.google.com/&scioq=Enhancing+Offline+Reinforcement+Learning+with+an+Optimal+Supported+Dataset&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1;1;1", "aff_unique_norm": "Qiyuan Lab;Tsinghua University", "aff_unique_dep": ";", "aff_unique_url": ";https://www.tsinghua.edu.cn", "aff_unique_abbr": ";THU", "aff_campus_unique_index": "", "aff_campus_unique": "", 
"aff_country_unique_index": "1;1;1", "aff_country_unique": ";China" }, { "id": "1B4juHRAgt", "title": "Amortized Bayesian Inference with Hybrid Expert-in-the-Loop and Learnable Summary Statistics", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Amortized Bayesian inference (ABI), a subset of simulation-based inference (SBI) fueled by neural networks, has rapidly grown in popularity across diverse scientific fields. Summary statistics are an essential dimensionality reduction component of ABI workflows and most methods to-date rely either on hand-crafted (i.e., based on domain expertise) or end-to-end learned summary statistics. In this work, we explore three hybrid methods to harness the complementary strengths of both sources. The first method directly conditions a neural approximator on both summary types, thereby extending traditional end-to-end approaches in a straightforward way. The second method embeds both expert and learned summaries into a joint representation space which is explicitly optimized to encode decorrelated features. The third method employs an auxiliary generative model to learn a latent summary representation that is statistically independent from the expert summaries. We explore various aspects of our hybrid methodology across different experiments and model instances, including perfect domain expertise and imperfect artificial experts represented by pre-trained neural networks. Our empirical results suggest that hybrid representations can improve parameter estimation and model comparison in settings of scientific interest, warranting the viability of an \"expert-in-the-loop\" approach. The performance gains are especially promising in scenarios with low to medium simulation budgets.", "keywords": "Bayesian inference;summary statistics;generative models;amortized inference;expert-in-the-loop", "primary_area": "probabilistic methods (Bayesian methods, variational inference, sampling, UQ, etc.)", "supplementary_material": "/attachment/bd6de384e65fc9013629b29000874c9f76f07908.zip", "author": "Stefan T. Radev;Lukas Schumacher", "authorids": "~Stefan_T._Radev1;lukas.schumacher@psychologie.uni-heidelberg.de", "gender": "M;", "homepage": "https://faculty.rpi.edu/stefan-radev;", "dblp": ";", "google_scholar": "JbDfkRkAAAAJ;", "orcid": "0000-0002-6702-9559;", "linkedin": "stefan-radev-21b713187/;", "or_profile": "~Stefan_T._Radev1;lukas.schumacher@psychologie.uni-heidelberg.de", "aff": "Rensselaer Polytechnic Institute;", "aff_domain": "epi.edu;", "position": "Assistant Professor;", "bibtex": "@misc{\nradev2024amortized,\ntitle={Amortized Bayesian Inference with Hybrid Expert-in-the-Loop and Learnable Summary Statistics},\nauthor={Stefan T. 
Radev and Lukas Schumacher},\nyear={2024},\nurl={https://openreview.net/forum?id=1B4juHRAgt}\n}", "github": "", "project": "", "reviewers": "QZwH;727i;mwUj;u538;qzC3", "site": "https://openreview.net/forum?id=1B4juHRAgt", "pdf_size": 16273364, "rating": "3;3;5;6;6", "confidence": "4;4;4;2;3", "soundness": "3;2;3;3;2", "contribution": "2;1;2;3;3", "presentation": "3;3;3;3;3", "wc_summary": "156;98;32;138;107", "wc_strengths": "48;34;38;79;41", "wc_weaknesses": "450;325;229;71;26", "wc_questions": "138;26;146;29;92", "wc_review": "792;483;445;317;266", "wc_reply_reviewers": "0;0;0;0;0", "wc_reply_authors": "0;0;0;0;0", "reply_reviewers": "0;0;0;0;0", "reply_authors": "0;0;0;0;0", "rating_avg": [ 4.6, 1.3564659966250536 ], "confidence_avg": [ 3.4, 0.8 ], "soundness_avg": [ 2.6, 0.4898979485566356 ], "contribution_avg": [ 2.2, 0.7483314773547882 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 106.2, 42.57886799810441 ], "wc_strengths_avg": [ 48.0, 16.161683080669537 ], "wc_weaknesses_avg": [ 220.2, 157.38030372317877 ], "wc_questions_avg": [ 86.2, 51.35912771844942 ], "wc_review_avg": [ 460.6, 183.8810485069084 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.7740702698132101, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:haZcZb1ef58J:scholar.google.com/&scioq=Amortized+Bayesian+Inference+with+Hybrid+Expert-in-the-Loop+and+Learnable+Summary+Statistics&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0", "aff_unique_norm": "Rensselaer Polytechnic Institute", "aff_unique_dep": "", "aff_unique_url": "https://www.rpi.edu", "aff_unique_abbr": "RPI", "aff_country_unique_index": "0", "aff_country_unique": "United States" }, { "title": "Rethinking Complex Queries on Knowledge Graphs with Neural Link Predictors", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19598", "id": "1BmveEMNbG", "author_site": "Hang Yin, Zihao Wang, Yangqiu Song", "tldr": "", "abstract": "Reasoning on knowledge graphs is a challenging task because it utilizes observed information to predict the missing one. Particularly, answering complex queries based on first-order logic is one of the crucial tasks to verify learning to reason abilities for generalization and composition.\nRecently, the prevailing method is query embedding which learns the embedding of a set of entities and treats logic operations as set operations and has shown great empirical success. Though there has been much research following the same formulation, many of its claims lack a formal and systematic inspection. In this paper, we rethink this formulation and justify many of the previous claims by characterizing the scope of queries investigated previously and precisely identifying the gap between its formulation and its goal, as well as providing complexity analysis for the currently investigated queries. Moreover, we develop a new dataset containing ten new types of queries with features that have never been considered and therefore can provide a thorough investigation of complex queries. Finally, we propose a new neural-symbolic method, Fuzzy Inference with Truth value (FIT), where we equip the neural link predictors with fuzzy logic theory to support end-to-end learning using complex queries with provable reasoning capability. 
Empirical results show that our method outperforms previous methods significantly in the new dataset and also surpasses previous methods in the existing dataset at the same time.", "keywords": "complex query answering;knowledge graph;link prediction", "primary_area": "neurosymbolic & hybrid AI systems (physics-informed, logic & formal reasoning, etc.)", "supplementary_material": "", "author": "Hang Yin;Zihao Wang;Yangqiu Song", "authorids": "~Hang_Yin3;~Zihao_Wang11;~Yangqiu_Song1", "gender": ";;M", "homepage": ";https://zihao-wang.github.io;https://www.cse.ust.hk/~yqsong/", "dblp": ";148/9655-1;86/2159", "google_scholar": ";T28rR00AAAAJ;MdQZ-q8AAAAJ", "orcid": ";0000-0002-3919-0396;0000-0002-7818-6090", "linkedin": ";zihao-wang-6a0a3286/;yqsong/", "or_profile": "~Hang_Yin3;~Zihao_Wang11;~Yangqiu_Song1", "aff": ";Hong Kong University of Science and Technology;Hong Kong University of Science and Technology", "aff_domain": ";cse.ust.hk;ust.hk", "position": ";PhD student;Associate Professor", "bibtex": "@inproceedings{\nyin2024rethinking,\ntitle={Rethinking Complex Queries on Knowledge Graphs with Neural Link Predictors},\nauthor={Hang Yin and Zihao Wang and Yangqiu Song},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=1BmveEMNbG}\n}", "github": "", "project": "", "reviewers": "TtwJ;sXg1;QmUh;Z6xA", "pdf_size": 650596, "rating": "6;6;8;8", "confidence": "4;3;4;3", "soundness": "2;3;4;3", "contribution": "4;2;4;3", "presentation": "3;2;4;3", "wc_summary": "225;98;138;102", "wc_strengths": "107;95;209;40", "wc_weaknesses": "177;181;47;62", "wc_questions": "102;3;19;39", "wc_review": "611;377;413;243", "wc_reply_reviewers": "0;102;0;9", "wc_reply_authors": "553;779;155;316", "reply_reviewers": "0;2;0;1", "reply_authors": "2;2;1;1", "rating_avg": [ 7.0, 1.0 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 3.25, 0.82915619758885 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 140.75, 51.07531204016281 ], "wc_strengths_avg": [ 112.75, 61.042505682516015 ], "wc_weaknesses_avg": [ 116.75, 62.491499421921375 ], "wc_questions_avg": [ 40.75, 37.59238619720754 ], "wc_review_avg": [ 411.0, 131.70421405558744 ], "wc_reply_reviewers_avg": [ 27.75, 43.0254285277904 ], "wc_reply_authors_avg": [ 450.75, 236.5527161120751 ], "reply_reviewers_avg": [ 0.75, 0.82915619758885 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 19, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5020512622307914988&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=1BmveEMNbG", "pdf": "https://openreview.net/pdf?id=1BmveEMNbG", "email": ";cse.ust.hk;ust.hk", "author_num": 3, "aff_unique_index": "0;0", "aff_unique_norm": "Hong Kong University of Science and Technology", "aff_unique_dep": "", "aff_unique_url": "https://www.ust.hk", "aff_unique_abbr": "HKUST", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Hong Kong SAR", "aff_country_unique_index": "0;0", "aff_country_unique": "China" }, { "title": "Enhancing Transferable Adversarial Attacks on Vision Transformers through Gradient Normalization Scaling and High-Frequency Adaptation", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19597", "id": "1BuWv9poWz", "author_site": "Zhiyu Zhu, Xinyi Wang, Zhibo Jin, Jiayu Zhang, Huaming Chen", 
"tldr": "", "abstract": "Vision Transformers (ViTs) have been widely used in various domains. Similar to Convolutional Neural Networks (CNNs), ViTs are prone to the impacts of adversarial samples, raising security concerns in real-world applications. As one of the most effective black-box attack methods, transferable attacks can generate adversarial samples on surrogate models to directly attack the target model without accessing the parameters. However, due to the distinct internal structures of ViTs and CNNs, adversarial samples constructed by traditional transferable attack methods may not be applicable to ViTs. Therefore, it is imperative to propose more effective transferability attack methods to unveil latent vulnerabilities in ViTs. Existing methods have found that applying gradient regularization to extreme gradients across different functional regions in the transformer structure can enhance sample transferability. However, in practice, substantial gradient disparities exist even within the same functional region across different layers. Furthermore, we find that mild gradients therein are the main culprits behind reduced transferability. In this paper, we introduce a novel Gradient Normalization Scaling method for fine-grained gradient editing to enhance the transferability of adversarial attacks on ViTs. More importantly, we highlight that ViTs, unlike traditional CNNs, exhibit distinct attention regions in the frequency domain. Leveraging this insight, we delve into exploring the frequency domain to further enhance the algorithm's transferability. Through extensive experimentation on various ViT variants and traditional CNN models, we substantiate that the new approach achieves state-of-the-art performance, with an average performance improvement of 33.54\\% and 42.05\\% on ViT and CNN models, respectively. 
Our code is available at: https://github.com/LMBTough/GNS-HFA.", "keywords": "Adversarial attack;transferability;Vit;transformer", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/c0069439cc0a5771415da7f84ab0e26da2dbf333.pdf", "author": "Zhiyu Zhu;Xinyi Wang;Zhibo Jin;Jiayu Zhang;Huaming Chen", "authorids": "~Zhiyu_Zhu2;~Xinyi_Wang9;~Zhibo_Jin1;~Jiayu_Zhang1;~Huaming_Chen1", "gender": ";M;M;M;", "homepage": ";https://github.com/noctisluna;https://github.com/Davidjinzb;https://github.com/KxPlaug;", "dblp": ";;;;", "google_scholar": ";;;;", "orcid": ";;;;", "linkedin": ";;;;", "or_profile": "~Zhiyu_Zhu2;~Xinyi_Wang9;~Zhibo_Jin1;~Jiayu_Zhang1;~Huaming_Chen1", "aff": ";Universiti Malaya;University of Sydney;Suzhou Yierqi;", "aff_domain": ";um.edu.my;usyd.edu.au;szyierqi.com;", "position": ";MS student;MS student;Researcher;", "bibtex": "@inproceedings{\nzhu2024enhancing,\ntitle={Enhancing Transferable Adversarial Attacks on Vision Transformers through Gradient Normalization Scaling and High-Frequency Adaptation},\nauthor={Zhiyu Zhu and Xinyi Wang and Zhibo Jin and Jiayu Zhang and Huaming Chen},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=1BuWv9poWz}\n}", "github": "", "project": "", "reviewers": "6tAt;98px;Qpbi", "pdf_size": 1520325, "rating": "5;5;6", "confidence": "3;4;4", "soundness": "3;3;2", "contribution": "2;2;2", "presentation": "2;3;1", "wc_summary": "133;64;45", "wc_strengths": "26;15;35", "wc_weaknesses": "67;50;106", "wc_questions": "151;17;158", "wc_review": "377;146;344", "wc_reply_reviewers": "0;0;9", "wc_reply_authors": "1278;735;1479", "reply_reviewers": "0;0;1", "reply_authors": "3;3;4", "rating_avg": [ 5.333333333333333, 0.4714045207910317 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.0, 0.816496580927726 ], "wc_summary_avg": [ 80.66666666666667, 37.80946383586463 ], "wc_strengths_avg": [ 25.333333333333332, 8.178562764256865 ], "wc_weaknesses_avg": [ 74.33333333333333, 23.442601296689656 ], "wc_questions_avg": [ 108.66666666666667, 64.88108781112996 ], "wc_review_avg": [ 289.0, 102.00980345045274 ], "wc_reply_reviewers_avg": [ 3.0, 4.242640687119285 ], "wc_reply_authors_avg": [ 1164.0, 314.25149164323784 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 3.3333333333333335, 0.4714045207910317 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.4999999999999999, "gs_citation": 4, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=13904993439380467359&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 0, "openreview": "https://openreview.net/forum?id=1BuWv9poWz", "pdf": "https://openreview.net/pdf?id=1BuWv9poWz", "email": ";um.edu.my;usyd.edu.au;szyierqi.com;", "author_num": 5, "aff_unique_index": "0;1;2", "aff_unique_norm": "Universiti Malaya;University of Sydney;Suzhou Yierqi", "aff_unique_dep": ";;", "aff_unique_url": "https://www.malaya.edu.my;https://www.sydney.edu.au;", "aff_unique_abbr": "UM;USYD;", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;2", "aff_country_unique": "Malaysia;Australia;China" }, { "title": "Unsupervised Order Learning", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19596", "id": "1CK45cqkEh", 
"author_site": "Seon-Ho Lee, Nyeong-Ho Shin, Chang-Su Kim", "tldr": "", "abstract": "A novel clustering algorithm for orderable data, called unsupervised order learning (UOL), is proposed in this paper. First, we develop the ordered $k$-means to group objects into ordered clusters by reducing the deviation of an object from consecutive clusters. Then, we train a network to construct an embedding space, in which objects are sorted compactly along a chain of line segments, determined by the cluster centroids. We alternate the clustering and the network training until convergence. Moreover, we perform unsupervised rank estimation via a simple nearest neighbor search in the embedding space. Extensive experiments on various orderable datasets demonstrate that UOL provides reliable ordered clustering results and decent rank estimation performances with no supervision. The source codes are available at https://github.com/seon92/UOL.", "keywords": "order learning;unsupervised clustering", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/91e282263e10efbd272cdb690a3478d7219965c2.zip", "author": "Seon-Ho Lee;Nyeong-Ho Shin;Chang-Su Kim", "authorids": "~Seon-Ho_Lee1;~Nyeong-Ho_Shin1;~Chang-Su_Kim4", "gender": "M;M;M", "homepage": "https://uhseon.github.io/;http://mcl.korea.ac.kr/people/professor/;", "dblp": "125/9915;;264/2601", "google_scholar": "https://scholar.google.co.kr/citations?user=_LtQ4TcAAAAJ;https://scholar.google.co.kr/citations?user=KOdKwNsAAAAJ;dLCMcXMAAAAJ", "orcid": ";;", "linkedin": "seonho-lee-604679198/;;nyeongho-shin-48529932b/", "or_profile": "~Seon-Ho_Lee1;~Chang-su_Kim2;~Nyeong_Ho_Shin1", "aff": "Korea University;Korea University;Korea University", "aff_domain": "korea.ac.kr;korea.ac.kr;korea.ac.kr", "position": "PhD student;Full Professor;PhD student", "bibtex": "@inproceedings{\nlee2024unsupervised,\ntitle={Unsupervised Order Learning},\nauthor={Seon-Ho Lee and Nyeong-Ho Shin and Chang-Su Kim},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=1CK45cqkEh}\n}", "github": "", "project": "", "reviewers": "rbKP;kD3Z;T1Ca;cgay", "pdf_size": 15013245, "rating": "5;5;6;6", "confidence": "5;3;5;4", "soundness": "3;3;3;3", "contribution": "2;2;3;2", "presentation": "3;3;3;3", "wc_summary": "78;62;29;86", "wc_strengths": "14;24;58;98", "wc_weaknesses": "156;123;2;158", "wc_questions": "1;106;194;76", "wc_review": "249;315;283;418", "wc_reply_reviewers": "0;19;17;24", "wc_reply_authors": "534;272;509;437", "reply_reviewers": "0;1;1;1", "reply_authors": "1;2;2;3", "rating_avg": [ 5.5, 0.5 ], "confidence_avg": [ 4.25, 0.82915619758885 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 63.75, 21.84462176372024 ], "wc_strengths_avg": [ 48.5, 32.90516676754579 ], "wc_weaknesses_avg": [ 109.75, 63.743136885471834 ], "wc_questions_avg": [ 94.25, 69.13166785200542 ], "wc_review_avg": [ 316.25, 63.21145070317561 ], "wc_reply_reviewers_avg": [ 15.0, 9.027735042633894 ], "wc_reply_authors_avg": [ 438.0, 102.24235912771184 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 2.0, 0.7071067811865476 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.30151134457776363, "gs_citation": 2, "gs_cited_by_link": 
"https://scholar.google.com/scholar?cites=15681772120320207191&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 2, "openreview": "https://openreview.net/forum?id=1CK45cqkEh", "pdf": "https://openreview.net/pdf?id=1CK45cqkEh", "email": "korea.ac.kr;korea.ac.kr;korea.ac.kr", "author_num": 3, "aff_unique_index": "0;0;0", "aff_unique_norm": "Korea University", "aff_unique_dep": "", "aff_unique_url": "https://www.korea.ac.kr", "aff_unique_abbr": "KU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "South Korea" }, { "title": "Adaptive Retrieval and Scalable Indexing for k-NN Search with Cross-Encoders", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19595", "id": "1CPta0bfN2", "author_site": "Nishant Yadav, Nicholas Monath, Manzil Zaheer, Rob Fergus, Andrew McCallum", "tldr": "", "abstract": "Cross-encoder (CE) models which compute similarity by jointly encoding a query-item pair perform better than using dot-product with embedding-based models (dual-encoders) at estimating query-item relevance. Existing approaches perform k-NN search with cross-encoders by approximating the CE similarity with a vector embedding space fit either with dual-encoders (DE) or CUR matrix factorization. DE-based retrieve-and-rerank approaches suffer from poor recall as DE generalizes poorly to new domains and the test-time retrieval with DE is decoupled from the CE. While CUR-based approaches can be more accurate than the DE-based retrieve-and-rerank approach, such approaches require a prohibitively large number of CE calls to compute item embeddings, thus making it impractical for deployment at scale. In this paper, we address these shortcomings with our proposed sparse-matrix factorization based method that efficiently computes latent query and item representations to approximate CE scores and performs k-NN search with the approximate CE similarity. In an offline indexing stage, we compute item embeddings by factorizing a sparse matrix containing query-item CE scores for a set of train queries. Our method produces a high-quality approximation while requiring only a fraction of CE similarity calls as compared to CUR-based methods, and allows for leveraging DE models to initialize the embedding space while avoiding compute- and resource-intensive finetuning of DE via distillation. At test time, we keep item embeddings fixed and perform retrieval over multiple rounds, alternating between a) estimating the test query embedding by minimizing error in approximating CE scores of items retrieved thus far, and b) using the updated test query embedding for retrieving more items in the next round. Our proposed k-NN search method can achieve up to 5 and 54 improvement in k-NN recall for k=1 and 100 respectively over the widely-used DE-based retrieve-and-rerank approach. 
Furthermore, our proposed approach to index the items by aligning item embeddings with the CE achieves up to 100x and 5x speedup over CUR-based and dual-encoder distillation based approaches respectively while matching or improving k-NN search recall over baselines.", "keywords": "cross-encoder;kNN;retrieval;nearest-neighbor search", "primary_area": "metric learning, kernel learning, and sparse coding", "supplementary_material": "", "author": "Nishant Yadav;Nicholas Monath;Manzil Zaheer;Rob Fergus;Andrew McCallum", "authorids": "~Nishant_Yadav1;~Nicholas_Monath1;~Manzil_Zaheer1;~Rob_Fergus1;~Andrew_McCallum1", "gender": "M;M;M;M;M", "homepage": "https://people.cs.umass.edu/~nishantyadav/;https://nmonath.github.io/;https://www.aclweb.org/anthology/people/m/manzil-zaheer/;http://cs.nyu.edu/fergus/;http://www.cs.umass.edu/~mccallum", "dblp": "230/4155;131/4309;40/10701;77/3763;m/AndrewMcCallum", "google_scholar": "Korn2JAAAAAJ;PTfhfCQAAAAJ;A33FhJMAAAAJ;https://scholar.google.com.tw/citations?user=GgQ9GEkAAAAJ;yILa1y0AAAAJ", "orcid": ";0000-0002-5135-2423;;;0009-0004-5487-2848", "linkedin": ";nicholas-monath-8627581aa/;;;andrew-mccallum-a412", "or_profile": "~Nishant_Yadav1;~Nicholas_Monath1;~Manzil_Zaheer1;~Rob_Fergus1;~Andrew_McCallum1", "aff": "Department of Computer Science, University of Massachusetts, Amherst;Google;Google DeepMind;Google;University of Massachusetts Amherst", "aff_domain": "cs.umass.edu;google.com;deepmind.com;google.com;cs.umass.edu", "position": "PhD student;Researcher;Researcher;Research scientist;Distinguished Professor", "bibtex": "@inproceedings{\nyadav2024adaptive,\ntitle={Adaptive Retrieval and Scalable Indexing for k-{NN} Search with Cross-Encoders},\nauthor={Nishant Yadav and Nicholas Monath and Manzil Zaheer and Rob Fergus and Andrew McCallum},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=1CPta0bfN2}\n}", "github": "", "project": "", "reviewers": "hzee;ujET;fa41;ja98", "pdf_size": 2418271, "rating": "5;6;6;8", "confidence": "4;3;3;3", "soundness": "3;3;3;4", "contribution": "2;3;3;3", "presentation": "2;4;2;3", "wc_summary": "39;118;197;78", "wc_strengths": "35;38;35;55", "wc_weaknesses": "232;33;78;24", "wc_questions": "23;107;62;55", "wc_review": "329;296;372;212", "wc_reply_reviewers": "96;20;0;10", "wc_reply_authors": "1931;787;1051;292", "reply_reviewers": "1;1;0;1", "reply_authors": "4;1;2;1", "rating_avg": [ 6.25, 1.0897247358851685 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.82915619758885 ], "wc_summary_avg": [ 108.0, 58.48504082241885 ], "wc_strengths_avg": [ 40.75, 8.317902379807062 ], "wc_weaknesses_avg": [ 91.75, 83.5175879680442 ], "wc_questions_avg": [ 61.75, 29.978117018918983 ], "wc_review_avg": [ 302.25, 58.66163567443376 ], "wc_reply_reviewers_avg": [ 31.5, 37.90448522272793 ], "wc_reply_authors_avg": [ 1015.25, 594.7824707403539 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 2.0, 1.224744871391589 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.6622661785325219, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:ZT2vxG-gQ2EJ:scholar.google.com/&scioq=Adaptive+Retrieval+and+Scalable+Indexing+for+k-NN+Search+with+Cross-Encoders&hl=en&as_sdt=0,44", "gs_version_total": 4, "openreview": 
"https://openreview.net/forum?id=1CPta0bfN2", "pdf": "https://openreview.net/pdf?id=1CPta0bfN2", "email": "cs.umass.edu;google.com;deepmind.com;google.com;cs.umass.edu", "author_num": 5, "aff_unique_index": "0;1;1;1;0", "aff_unique_norm": "University of Massachusetts Amherst;Google", "aff_unique_dep": "Department of Computer Science;Google", "aff_unique_url": "https://www.umass.edu;https://www.google.com", "aff_unique_abbr": "UMass Amherst;Google", "aff_campus_unique_index": "0;1;1;0", "aff_campus_unique": "Amherst;Mountain View;", "aff_country_unique_index": "0;0;1;0;0", "aff_country_unique": "United States;United Kingdom" }, { "id": "1EyS6udrLa", "title": "Towards Bringing Advanced Restoration Networks into Self-Supervised Image Denoising", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Self-supervised image denoising (SSID) has witnessed significant progress in recent years. Therein, most methods focus on exploring blind-spot techniques while only employing a simple network architecture (\\eg, plain CNN or U-Net) as a denoising backbone. However, with the ongoing advancements in image restoration networks, these architectures have become somewhat outdated. In this work, we aim to migrate the advanced restoration network designs (\\eg, SwinIR, Restormer, NAFNet, and HAT) into SSID methods. We begin by conducting an analysis of the fundamental concepts in existing typical blind-spot networks (BSN). Subsequently, we introduce a series of approaches to adapt restoration networks into various blind-spot ones. In particular, we suggest effective adjustment for window attention to mimic the convolution layers in BSN. And we discourage the adoption of channel attention, as it can potentially lead to the leakage of blind-spot information, consequently impeding performance. Experiments on both synthetic and real-world RGB noisy images demonstrate our methods substantially enhance SSID performance. Furthermore, we hope this study could enable SIDD methods to keep pace with the progress in restoration networks, and serve as benchmarks for future works. 
The code and pre-trained models will be publicly available.", "keywords": "Self-Supervised Denoising; Restoration Networks", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Junyi Li;Zhilu Zhang;Dongsheng Jiang;XIAOPENG ZHANG;Wangmeng Zuo;Qi Tian", "authorids": "~Junyi_Li5;~Zhilu_Zhang2;~Dongsheng_Jiang2;~XIAOPENG_ZHANG7;~Wangmeng_Zuo3;~Qi_Tian3", "gender": "M;M;M;M;M;M", "homepage": ";https://github.com/cszhilu1998;https://sites.google.com/site/zxphistory/;;https://www.qitian1987.com/index.html;https://sites.google.com/site/dongshengjiangbme/", "dblp": ";;;93/2671;78/1467-1.html;85/8729", "google_scholar": "77mdLl8AAAAJ;8pIq2N0AAAAJ;Ud6aBAcAAAAJ;rUOpCEYAAAAJ;https://scholar.google.com/citations?hl=en;-eGIgsoAAAAJ", "orcid": ";0000-0002-5758-5949;;0000-0002-3330-783X;0000-0002-7252-5047;", "linkedin": ";;;;;", "or_profile": "~Junyi_Li5;~Zhilu_Zhang2;~XIAOPENG_ZHANG7;~Wangmeng_Zuo3;~Qi_Tian3;~Dongsheng_Jiang1", "aff": "Harbin Institute of Technology;Harbin Institute of Technology;Huawei Technologies Ltd.;Harbin Institute of Technology;Huawei Technologies Ltd.;Huawei Technologies Ltd.", "aff_domain": "hit.edu.cn;hit.edu.cn;huawei.com;hit.edu.cn;huawei.com;huawei.com", "position": "PhD student;PhD student;Principal Researcher;Full Professor;Principal Researcher;Principal Researcher", "bibtex": "@misc{\nli2024towards,\ntitle={Towards Bringing Advanced Restoration Networks into Self-Supervised Image Denoising},\nauthor={Junyi Li and Zhilu Zhang and Dongsheng Jiang and XIAOPENG ZHANG and Wangmeng Zuo and Qi Tian},\nyear={2024},\nurl={https://openreview.net/forum?id=1EyS6udrLa}\n}", "github": "", "project": "", "reviewers": "iVws;uBSH;jHRD;xn1Q", "site": "https://openreview.net/forum?id=1EyS6udrLa", "pdf_size": 3948107, "rating": "3;3;5;5", "confidence": "4;5;3;5", "soundness": "3;2;2;3", "contribution": "1;1;2;3", "presentation": "3;3;2;3", "wc_summary": "97;46;80;56", "wc_strengths": "63;20;43;81", "wc_weaknesses": "120;69;124;130", "wc_questions": "33;347;2;3", "wc_review": "313;482;249;270", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 4.25, 0.82915619758885 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 1.75, 0.82915619758885 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 69.75, 20.004686950812303 ], "wc_strengths_avg": [ 51.75, 22.730761095924613 ], "wc_weaknesses_avg": [ 110.75, 24.365703355331238 ], "wc_questions_avg": [ 96.25, 145.30549714308816 ], "wc_review_avg": [ 328.5, 91.57647077715978 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.30151134457776363, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:bD4cpC_HtesJ:scholar.google.com/&scioq=Towards+Bringing+Advanced+Restoration+Networks+into+Self-Supervised+Image+Denoising&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;1;0;1;1", "aff_unique_norm": "Harbin Institute of Technology;Huawei", "aff_unique_dep": ";Huawei Technologies", "aff_unique_url": "http://www.hit.edu.cn/;https://www.huawei.com", "aff_unique_abbr": "HIT;Huawei", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Harbin;", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "China" 
}, { "id": "1FWDEIGm33", "title": "Large Language Models as superpositions of cultural perspectives", "track": "main", "status": "Reject", "tldr": "", "abstract": "Large language models (LLMs) are sometimes viewed as if they were individuals, with given values, personality, knowledge and abilities. We argue that this \u201dLLM as an individual\u201d metaphor misrepresents their nature. As opposed to humans, they exhibit highly context-dependent values and personality traits. We propose a new metaphor, \u201dLLM as a superposition of perspectives\u201d : LLMs simulate a multiplicity of behaviors, e.g. expressing values, which can be triggered by a given context. As a case study, we conduct experiments on how values vary as a function of context using psychology questionnaires. Crucially, we demonstrate that changes in the context that are unrelated to the topic of questionnaires - varying articles, simulated conversations on other topics, and textual formats - all result in significant unwanted, hard-to-predict changes in the expressed values. We refer to this as the unexpected perspective shift effect. We discuss how this questions the interpretations of studies using psychology questionnaires (and more generally benchmarks) to draw general conclusions about LLMs\u2019 values, knowledge and abilities. Indeed, expressing some values on a questionnaire says little about which values a model would express in other contexts. Instead, models should be studied in terms of how the expressed values change over contexts in both expected and unexpected ways. Following this insight, we introduce the concept of perspective controllability - a model\u2019s affordance to adopt various perspectives. We conduct a systematic comparison of the controllability of 16 different models over three questionnaires (PVQ, VSM, IPIP) and different methods for inducing perspectives. 
We conclude by examining the broader implications of our work and outline a variety of associated scientific questions.", "keywords": "Large Language Models;context-dependence;controllability;cultural values;personal values;personality traits;societal considerations;Shalom H Schwartz;Geert Hofstede;Big Five", "primary_area": "generative models", "supplementary_material": "/attachment/8b6e4447a0a20dc4db890536b580aba32afc8767.zip", "author": "Grgur Kova\u010d;Masataka Sawayama;R\u00e9my Portelas;C\u00e9dric Colas;Peter Ford Dominey;Pierre-Yves Oudeyer", "authorids": "~Grgur_Kova\u010d1;~Masataka_Sawayama1;~R\u00e9my_Portelas1;~C\u00e9dric_Colas1;~Peter_Ford_Dominey1;~Pierre-Yves_Oudeyer1", "gender": "M;M;M;;M;M", "homepage": "https://www.mswym.com/;;https://cedriccolas.com;;http://www.pyoudeyer.com;", "dblp": "165/9982;;215/3872;76/218;33/5513;272/4188", "google_scholar": "https://scholar.google.co.jp/citations?user=AagXxCYAAAAJ;8xxuvpoAAAAJ;https://scholar.google.fr/citations?user=VBz8gZ4AAAAJ;;https://scholar.google.fr/citations?user=gCqGj4sAAAAJ;ZLA7iioAAAAJ", "orcid": ";;0000-0003-0212-427X;0000-0002-9318-179X;;0000-0001-8974-6228", "linkedin": ";;;;pierreyvesoudeyer/;", "or_profile": "~Masataka_Sawayama1;~R\u00e9my_Portelas1;~C\u00e9dric_Colas1;~Peter_Ford_Dominey1;~Pierre-Yves_Oudeyer1;~Grgur_Kovac1", "aff": "The University of Tokyo;Ubisoft;Massachusetts Institute of Technology;CNRS;Inria;INRIA", "aff_domain": "g.ecc.u-tokyo.ac.jp;ubisoft.com;mit.edu;cnrs.fr;inria.fr;inria.fr", "position": "Lecturer;Researcher;Postdoc;Full Professor;Research director;PhD student", "bibtex": "@misc{\nkova{\\v{c}}2024large,\ntitle={Large Language Models as superpositions of cultural perspectives},\nauthor={Grgur Kova{\\v{c}} and Masataka Sawayama and R{\\'e}my Portelas and C{\\'e}dric Colas and Peter Ford Dominey and Pierre-Yves Oudeyer},\nyear={2024},\nurl={https://openreview.net/forum?id=1FWDEIGm33}\n}", "github": "", "project": "", "reviewers": "Fkgw;7GoP;P79N;B9Pb", "site": "https://openreview.net/forum?id=1FWDEIGm33", "pdf_size": 676158, "rating": "3;3;3;5", "confidence": "4;4;4;3", "soundness": "1;2;2;2", "contribution": "2;2;2;2", "presentation": "2;2;2;2", "wc_summary": "114;75;123;89", "wc_strengths": "17;31;25;57", "wc_weaknesses": "720;223;318;71", "wc_questions": "78;211;1;49", "wc_review": "929;540;467;266", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "1052;722;934;403", "reply_reviewers": "0;0;0;0", "reply_authors": "2;1;2;1", "rating_avg": [ 3.5, 0.8660254037844386 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 1.75, 0.4330127018922193 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.0, 0.0 ], "wc_summary_avg": [ 100.25, 19.17517926904466 ], "wc_strengths_avg": [ 32.5, 14.99166435056495 ], "wc_weaknesses_avg": [ 333.0, 240.17597715008884 ], "wc_questions_avg": [ 84.75, 77.90499021243761 ], "wc_review_avg": [ 550.5, 240.4604957160323 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 777.75, 246.56274556388277 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -1.0, "gs_citation": 47, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=2800038415228220148&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 8, "aff_unique_index": "0;1;2;3;4;4", "aff_unique_norm": "University of Tokyo;Ubisoft;Massachusetts Institute of Technology;Centre National de la Recherche Scientifique;INRIA", "aff_unique_dep": ";;;;", "aff_unique_url": 
"https://www.u-tokyo.ac.jp;https://www.ubisoft.com;https://web.mit.edu;https://www.cnrs.fr;https://www.inria.fr", "aff_unique_abbr": "UTokyo;Ubisoft;MIT;CNRS;Inria", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;2;1;1;1", "aff_country_unique": "Japan;France;United States" }, { "id": "1GUTzm2a4v", "title": "Greedy PIG: Adaptive Integrated Gradients", "track": "main", "status": "Reject", "tldr": "", "abstract": "Deep learning has become the standard approach for most machine learning tasks. Although its great success is undeniable, interpreting the predictions of deep learning models from a human perspective remains a challenge. In contrast to model training, model interpretability is harder to quantify or pose as an explicit optimization problem. Inspired by the AUC softmax information curve (AUC SIC) metric for evaluating feature attribution methods, we propose a unified discrete optimization framework for feature attribution and feature selection based on subset selection. This leads to a natural adaptive generalization of the path integrated gradients (PIG) method for feature attribution, which we call Greedy PIG. We show that Greedy PIG achieves an extremely high AUC SIC for feature attribution tasks on images, which could also hint at the limitations of this metric for multi-class classification, and we propose a more robust metric. We demonstrate the success of Greedy PIG on a variety of tasks, including image feature attribution, graph compression/explanation, and post-hoc feature selection on tabular data. Our results show that introducing adaptivity is a versatile method for making attribution methods more powerful.", "keywords": "feature saliency;feature attribution;feature selection;graph neural networks", "primary_area": "optimization", "supplementary_material": "/attachment/95496e31c4258efe031be9a87e9606f86477d0ff.pdf", "author": "Kyriakos Axiotis;Sami Abu-El-Haija;Lin Chen;Matthew Fahrbach;Gang Fu", "authorids": "~Kyriakos_Axiotis1;~Sami_Abu-El-Haija1;~Lin_Chen14;~Matthew_Fahrbach1;~Gang_Fu3", "gender": ";M;;;", "homepage": ";http://www.haija.org;;;", "dblp": "176/5139;127/6620;;;", "google_scholar": "Xhv2tkcAAAAJ;t80qlTcAAAAJ;;;", "orcid": ";;;;", "linkedin": ";samihaija/;;;", "or_profile": "~Kyriakos_Axiotis1;~Sami_Abu-El-Haija1;~Lin_Chen14;~Matthew_Fahrbach1;~Gang_Fu3", "aff": "Google;Research, Google;;;", "aff_domain": "google.com;research.google.com;;;", "position": "Researcher;Research Scientist;;;", "bibtex": "@misc{\naxiotis2024greedy,\ntitle={Greedy {PIG}: Adaptive Integrated Gradients},\nauthor={Kyriakos Axiotis and Sami Abu-El-Haija and Lin Chen and Matthew Fahrbach and Gang Fu},\nyear={2024},\nurl={https://openreview.net/forum?id=1GUTzm2a4v}\n}", "github": "", "project": "", "reviewers": "mYhW;dYDX;yEX4;WqYq", "site": "https://openreview.net/forum?id=1GUTzm2a4v", "pdf_size": 1037202, "rating": "3;3;5;6", "confidence": "4;3;3;3", "soundness": "2;2;2;3", "contribution": "3;2;2;2", "presentation": "2;1;2;4", "wc_summary": "54;130;97;66", "wc_strengths": "75;60;48;40", "wc_weaknesses": "467;214;174;104", "wc_questions": "5;28;38;46", "wc_review": "601;432;357;256", "wc_reply_reviewers": "0;277;37;0", "wc_reply_authors": "1048;1370;287;317", "reply_reviewers": "0;1;1;0", "reply_authors": "2;3;1;2", "rating_avg": [ 4.25, 1.299038105676658 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.25, 
1.0897247358851685 ], "wc_summary_avg": [ 86.75, 29.49046456059992 ], "wc_strengths_avg": [ 55.75, 13.198011213815512 ], "wc_weaknesses_avg": [ 239.75, 136.98243500536847 ], "wc_questions_avg": [ 29.25, 15.384651442265437 ], "wc_review_avg": [ 411.5, 125.97718047329047 ], "wc_reply_reviewers_avg": [ 78.5, 115.59519886223649 ], "wc_reply_authors_avg": [ 755.5, 467.6914046676505 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 2.0, 0.7071067811865476 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.5555555555555555, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:-s22YlOF9TEJ:scholar.google.com/&scioq=Greedy+PIG:+Adaptive+Integrated+Gradients&hl=en&as_sdt=0,5", "gs_version_total": 4, "aff_unique_index": "0;0", "aff_unique_norm": "Google", "aff_unique_dep": "Google", "aff_unique_url": "https://www.google.com", "aff_unique_abbr": "Google", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Mountain View", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "id": "1GdAJ3GsOw", "title": "DISTPAR:TENSOR PARTITIONING FOR DISTRIBUTED NEURAL NETWORK COMPUTING", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Existing distributed training systems suffer from the difficulties of adapting to diverse model architectures and balancing the trade-off between computational and communication costs. We introduce Distributed Partitioning (DistPar), a framework that allows users to develop parallel models with the ease of writing single-device programs. We establish the basic properties of tensor partitioning, which significantly expand the search space for optimal parallel strategies. The process of distributing global tensors from a single-device perspective is driven by the innovative use of collective communication primitives and their extensions which represent conversions between arbitrary tensor distribution properties. To further address the challenge of parallel scheme optimization, we carry out a cost function that considers both computational and communication costs. Guided by the cost function, the best-performing parallel scheme is automatically selected with configurable parameters, thus simplifying the process of developing parallel models. We demonstrate state-of-the-art results on extensive experiments. Moreover, DistPar reaches 50% higher throughput in large-scale face recognition tasks and a 20% improvement in language modeling tasks compared to data parallelism provided by PyTorch. This performance improvement aligns with the expected speedup and is particularly notable as the number of computing devices increases. 
The code will be released at https://github.com/DistPar.", "keywords": "Deep Learning Framework;Tensor Partitioning;Parallel Computation", "primary_area": "infrastructure, software libraries, hardware, etc.", "supplementary_material": "/attachment/574b80ab752a77ec57748ad95395c9cdaf008599.pdf", "author": "Hongsheng Wang;Jinhui Yuan;Shun Liu;Weijie Xia;Xinyi Zhou;Shengyu Zhang;Fei Wu;Mohamed Jaward Bah;Feng Lin", "authorids": "~Hongsheng_Wang1;~Jinhui_Yuan1;~Shun_Liu1;~Weijie_Xia1;~Xinyi_Zhou5;~Shengyu_Zhang2;~Fei_Wu1;~Mohamed_Jaward_Bah1;~Feng_Lin10", "gender": "M;M;M;M;;M;M;M;M", "homepage": "https://wanghongsheng01.github.io/;;https://shunliu01.github.io;https://github.com/xiaweijiexox;;https://shengyuzhang.github.io/;https://person.zju.edu.cn/wufei;;http://www.zhejianglab.com", "dblp": ";58/3397;;;;47/3459-1;84/3254-1;https://dblp.org/search?q=Mohamed+Jaward+Bah;75/2611", "google_scholar": ";HtfAR1IAAAAJ;https://scholar.google.com/citations?hl=en;;;l4Dyt7EAAAAJ;XJLn4MYAAAAJ;WRRMPzMAAAAJ;https://scholar.google.com/citations?hl=zh-CN", "orcid": ";;0009-0007-5240-9114;;;0000-0002-0030-8289;;;", "linkedin": ";jinhui-yuan-291aa847/;shun-liu-5285492a2/;;;;;;", "or_profile": "~Hongsheng_Wang1;~Jinhui_Yuan1;~Shun_Liu1;~Weijie_Xia1;~Xinyi_Zhou5;~Shengyu_Zhang2;~Fei_Wu1;~Mohamed_Jaward_Bah1;~Feng_Lin10", "aff": "Zhejiang University;;Dartmouth College;Hangzhou Dianzi University;;Zhejiang University;Zhejiang University;Zhejiang Lab;Zhejiang Lab", "aff_domain": "zju.edu.cn;;cs.dartmouth.edu;hdu.edu.cn;;zju.edu.cn;zju.edu.cn;zhejianglab.com;zhejianglab.com", "position": "PhD student;;Intern;Undergrad student;;ZJU100 Young Professor;Full Professor;Researcher;Principal Researcher", "bibtex": "@misc{\nwang2024distpartensor,\ntitle={{DISTPAR}:{TENSOR} {PARTITIONING} {FOR} {DISTRIBUTED} {NEURAL} {NETWORK} {COMPUTING}},\nauthor={Hongsheng Wang and Jinhui Yuan and Shun Liu and Weijie Xia and Xinyi Zhou and Shengyu Zhang and Fei Wu and Mohamed Jaward Bah and Feng Lin},\nyear={2024},\nurl={https://openreview.net/forum?id=1GdAJ3GsOw}\n}", "github": "", "project": "", "reviewers": "Q7ud;ovib;pTBS", "site": "https://openreview.net/forum?id=1GdAJ3GsOw", "pdf_size": 1109568, "rating": "1;1;3", "confidence": "4;5;4", "soundness": "1;3;1", "contribution": "2;1;1", "presentation": "2;2;2", "wc_summary": "107;64;28", "wc_strengths": "93;19;5", "wc_weaknesses": "353;180;322", "wc_questions": "109;75;3", "wc_review": "662;338;358", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 1.6666666666666667, 0.9428090415820634 ], "confidence_avg": [ 4.333333333333333, 0.4714045207910317 ], "soundness_avg": [ 1.6666666666666667, 0.9428090415820634 ], "contribution_avg": [ 1.3333333333333333, 0.4714045207910317 ], "presentation_avg": [ 2.0, 0.0 ], "wc_summary_avg": [ 66.33333333333333, 32.293790252754306 ], "wc_strengths_avg": [ 39.0, 38.60915262818736 ], "wc_weaknesses_avg": [ 285.0, 75.31710739710246 ], "wc_questions_avg": [ 62.333333333333336, 44.19150245113747 ], "wc_review_avg": [ 452.6666666666667, 148.24604173093084 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 3, 0 ], "authors#_avg": [ 9, 0 ], "corr_rating_confidence": -0.4999999999999999, "gs_citation": 0, "gs_cited_by_link": 
"https://scholar.google.com/scholar?q=related:OrQtgl86lfQJ:scholar.google.com/&scioq=DISTPAR:TENSOR+PARTITIONING+FOR+DISTRIBUTED+NEURAL+NETWORK+COMPUTING&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;1;2;0;0;3;3", "aff_unique_norm": "Zhejiang University;Dartmouth College;Hangzhou Dianzi University;Zhejiang Lab", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.zju.edu.cn;https://www.dartmouth.edu;http://www.hdu.edu.cn/;http://www.zhejianglab.com", "aff_unique_abbr": "ZJU;Dartmouth;HGHDU;", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;0;0;0;0;0", "aff_country_unique": "China;United States" }, { "id": "1HgJZl3HgT", "title": "Learning to Stylize Soundscapes from In-the-Wild Videos", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Speech recordings convey a great deal of information about the scenes, resulting in a variety of effects ranging from reverberation to additional ambient sounds. In this paper, we learn to restyle input speech to sound as though it was recorded within a different scene, given an audio (or audio-visual) example recorded from that scene. Our model learns through self-supervision, taking advantage of the fact that natural video contains recurring sound events and textures. We extract an audio clip from a video and apply speech enhancement. We then train a latent diffusion model to recover the original sound, using another audio-visual clip taken from elsewhere in the video as a conditional hint. Through this process, the model learns to transfer the conditional example's sound properties to the input sound. We show that our model can be successfully trained using unlabeled, in-the-wild videos, and that an additional visual signal can improve its sound prediction abilities.", "keywords": "Audio Generation and Stylization;Audio-visual Learning;Multimodal Learning", "primary_area": "generative models", "supplementary_material": "/attachment/23a9bbe0d8b2ff2dc55be33292112a8c6e0a18e4.zip", "author": "Tingle Li;Renhao Wang;Po-Yao Huang;Andrew Owens;Gopala Anumanchipalli", "authorids": "~Tingle_Li1;~Renhao_Wang1;~Po-Yao_Huang2;~Andrew_Owens1;~Gopala_Anumanchipalli1", "gender": "M;;M;M;M", "homepage": "https://tinglok.netlify.app/;;http://andrewowens.com;http://people.eecs.berkeley.edu/~gopala/;https://berniebear.github.io/", "dblp": "248/9136;243/7150;85/2697;54/7824;154/3943-1", "google_scholar": "UGpC1zgAAAAJ;q4RlE2oAAAAJ;9hX-JksAAAAJ;VecEj6kAAAAJ;E8K25LIAAAAJ", "orcid": ";;;0000-0002-9714-7740;", "linkedin": ";;;;", "or_profile": "~Tingle_Li1;~Renhao_Wang1;~Andrew_Owens1;~Gopala_Anumanchipalli1;~Po-Yao_Huang1", "aff": "University of California, Berkeley;University of California, Berkeley;University of Michigan;University of California, Berkeley;Meta", "aff_domain": "eecs.berkeley.edu;berkeley.edu;umich.edu;berkeley.edu;meta.com", "position": "PhD student;PhD student;Assistant Professor;Assistant Professor;Researcher", "bibtex": "@misc{\nli2024learning,\ntitle={Learning to Stylize Soundscapes from In-the-Wild Videos},\nauthor={Tingle Li and Renhao Wang and Po-Yao Huang and Andrew Owens and Gopala Anumanchipalli},\nyear={2024},\nurl={https://openreview.net/forum?id=1HgJZl3HgT}\n}", "github": "", "project": "", "reviewers": "UAzL;HkqM;V8de;tbtJ", "site": "https://openreview.net/forum?id=1HgJZl3HgT", "pdf_size": 1481535, "rating": "3;3;5;5", "confidence": "3;4;3;3", "soundness": "2;2;2;2", "contribution": "1;1;3;3", "presentation": "2;2;3;4", "wc_summary": "102;57;108;38", "wc_strengths": 
"31;51;64;38", "wc_weaknesses": "151;315;408;157", "wc_questions": "2;94;25;313", "wc_review": "286;517;605;546", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 2.0, 1.0 ], "presentation_avg": [ 2.75, 0.82915619758885 ], "wc_summary_avg": [ 76.25, 29.600464523382062 ], "wc_strengths_avg": [ 46.0, 12.62933094031509 ], "wc_weaknesses_avg": [ 257.75, 108.85626991588495 ], "wc_questions_avg": [ 108.5, 122.82609657560563 ], "wc_review_avg": [ 488.5, 121.13731877501664 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:ubQRJShe0ooJ:scholar.google.com/&scioq=Learning+to+Stylize+Soundscapes+from+In-the-Wild+Videos&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;0;1;0;2", "aff_unique_norm": "University of California, Berkeley;University of Michigan;Meta", "aff_unique_dep": ";;Meta Platforms, Inc.", "aff_unique_url": "https://www.berkeley.edu;https://www.umich.edu;https://meta.com", "aff_unique_abbr": "UC Berkeley;UM;Meta", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Berkeley;", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "1Htbe2fiQU", "title": "Learning with Counterfactual Explanations for Radiology Report Generation", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Due to the common content of anatomy, radiology images with their corresponding reports exhibit highly similarity. Such inherent data bias can predispose automatic report generation models to learn entangled and spurious representations resulting in misdiagnostic reports. Moreover, the lack of explainability hinders the acceptance by radiologists in clinical practice.\nTo tackle these, we propose a novel \\textbf{Co}unter\\textbf{F}actual \\textbf{E}xplanations-based framework (CoFE) for radiology report generation. Counterfactual explanations serve as a potent tool for understanding how decisions made by algorithms can be changed by asking ``what if'' scenarios. By leveraging this concept, CoFE can learn non-spurious visual representations by contrasting the representations between factual and counterfactual images. Specifically, we derive counterfactual images by swapping a patch between positive and negative samples until a predicted diagnosis shift occurs. Here, positive and negative samples are the most semantically similar but have different diagnosis labels. Additionally, CoFE employs a learnable prompt to efficiently fine-tune the pretrained large language model, encapsulating both factual and counterfactual content to provide a more generalizable prompt representation. 
Extensive experiments on two benchmarks demonstrate that leveraging the counterfactual explanations enables CoFE to generate semantically coherent and factually complete reports and outperform in terms of language generation and clinical efficacy metrics.", "keywords": "Counterfactual Explanations;Radiology Report Generation;Contrastive Learning", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Mingjie Li;Haokun Lin;Xiaodan Liang;Ling Chen;Abdulmotaleb El Saddik;Xiaojun Chang", "authorids": "~Mingjie_Li2;~Haokun_Lin3;~Xiaodan_Liang2;~Ling_Chen5;~Abdulmotaleb_El_Saddik1;~Xiaojun_Chang4", "gender": "M;M;F;F;;", "homepage": "http://www.mmvg.org/member/mingjie_li/;https://blog.csdn.net/qq_46192381;https://www.sysu-hcp.net/;https://profiles.uts.edu.au/Ling.Chen;;", "dblp": "48/10103-6;;;17/1237-6;;", "google_scholar": "ag0m3aoAAAAJ;https://scholar.google.com/citations?hl=zh-CN;voxznZAAAAAJ;https://scholar.google.com.au/citations?user=L5aYWQcAAAAJ;;", "orcid": ";0009-0008-6831-2859;;0000-0002-6468-5729;;", "linkedin": ";;;;;", "or_profile": "~Mingjie_Li2;~Haokun_Lin3;~Xiaodan_Liang2;~Ling_Chen5;~Abdulmotaleb_El_Saddik1;~Xiaojun_Chang4", "aff": "Stanford University;Mohamed bin Zayed University of Artificial Intelligence;SUN YAT-SEN UNIVERSITY;University of Technology Sydney;;", "aff_domain": "stanford.edu;mbzuai.ac.ae;sysu.edu.cn;uts.edu.au;;", "position": "Postdoc;MS student;Associate Professor;Full Professor;;", "bibtex": "@misc{\nli2024learning,\ntitle={Learning with Counterfactual Explanations for Radiology Report Generation},\nauthor={Mingjie Li and Haokun Lin and Xiaodan Liang and Ling Chen and Abdulmotaleb El Saddik and Xiaojun Chang},\nyear={2024},\nurl={https://openreview.net/forum?id=1Htbe2fiQU}\n}", "github": "", "project": "", "reviewers": "sgJL;nNsA;QvNC;u7dz", "site": "https://openreview.net/forum?id=1Htbe2fiQU", "pdf_size": 5155127, "rating": "3;5;5;5", "confidence": "4;5;3;4", "soundness": "2;2;3;3", "contribution": "1;2;2;3", "presentation": "2;3;3;2", "wc_summary": "108;32;53;87", "wc_strengths": "9;12;39;85", "wc_weaknesses": "131;138;172;234", "wc_questions": "56;4;47;71", "wc_review": "304;186;311;477", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.5, 0.8660254037844386 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 70.0, 29.436372059070052 ], "wc_strengths_avg": [ 36.25, 30.474374480865066 ], "wc_weaknesses_avg": [ 168.75, 40.739262389002576 ], "wc_questions_avg": [ 44.5, 24.904818810824544 ], "wc_review_avg": [ 319.5, 103.6110515340907 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:_kwaKu5AFXAJ:scholar.google.com/&scioq=Learning+with+Counterfactual+Explanations+for+Radiology+Report+Generation&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1;2;3", "aff_unique_norm": "Stanford University;Mohamed bin Zayed University of Artificial Intelligence;Sun Yat-sen University;University of Technology Sydney", "aff_unique_dep": ";;;", "aff_unique_url": 
"https://www.stanford.edu;https://mbzuai.ac.ae;http://www.sysu.edu.cn;https://www.uts.edu.au", "aff_unique_abbr": "Stanford;MBZUAI;SYSU;UTS", "aff_campus_unique_index": "0", "aff_campus_unique": "Stanford;", "aff_country_unique_index": "0;1;2;3", "aff_country_unique": "United States;United Arab Emirates;China;Australia" }, { "id": "1IIiQnLRe8", "title": "Diversity Modeling for Semantic Shift Detection", "track": "main", "status": "Reject", "tldr": "", "abstract": "Semantic shift detection faces a big challenge of modeling non-semantic feature diversity while suppressing generalization to unseen semantic shifts. Existing reconstruction-based approaches are either not constrained well to avoid over-generalization or not general enough to model diversity-agnostic in-distribution samples. Both may lead to feature confusion near the decision boundary and fail to identify various semantic shifts. In this work, we propose Bi-directional Regularized Diversity Modulation (BiRDM) to model restricted feature diversity for semantic shift detection so as to address the challenging issues in reconstruction-based detection methods. BiDRM modulates feature diversity by controlling spatial transformation with learnable dynamic modulation parameters in latent space. Smoothness Regularization (SmoReg) is introduced to avoid undesired generalization to semantic shift samples. Furthermore, Batch Normalization Simulation (BNSim) coordinating with auxiliary data is leveraged to separately transform different semantic distributions and push potential semantic shift samples away implicitly, making the feature more discriminative. Compared with previous works, BiRDM can successfully model diversity-agnostic non-semantic pattern while alleviating feature confusion in latent space. 
Experimental results demonstrate the effectiveness of our method.", "keywords": "semantic shift detection;diversity modeling", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Wenrui Liu;Hong Chang;Bingpeng Ma;Shiguang Shan;Xilin CHEN", "authorids": "~Wenrui_Liu1;~Hong_Chang1;~Bingpeng_Ma1;~Shiguang_Shan2;~Xilin_CHEN2", "gender": ";F;M;M;M", "homepage": "http://vipl.ict.ac.cn/edu/student/master/202205/t20220518_36050.html;;http://people.ucas.edu.cn/~bpma;http://vipl.ict.ac.cn/people/sgshan/;http://vipl.ict.ac.cn/people/_xlchen/", "dblp": "156/8975-4;;62/1822;s/ShiguangShan;c/XilinChen", "google_scholar": ";LX6MnNsAAAAJ;;https://scholar.google.com.tw/citations?user=Vkzd7MIAAAAJ;vVx2v20AAAAJ", "orcid": ";;0000-0001-8984-205X;0000-0002-8348-392X;0000-0003-3024-4404", "linkedin": ";;;;", "or_profile": "~Wenrui_Liu1;~Hong_Chang1;~Bingpeng_Ma1;~Shiguang_Shan2;~Xilin_Chen4", "aff": "Chinese Academy of Sciences;Institute of Computing Technology, Chinese Academy of Sciences;University of Chinese Academy of Sciences;Institute of Computing Technology, Chinese Academy of Sciences;Institute of Computing Technology", "aff_domain": "ict.ac.cn;ict.ac.cn;ucas.ac.cn;ict.ac.cn;ict.ac.cn", "position": "MS student;Full Professor;Full Professor;Full Professor;Full Professor", "bibtex": "@misc{\nliu2024diversity,\ntitle={Diversity Modeling for Semantic Shift Detection},\nauthor={Wenrui Liu and Hong Chang and Bingpeng Ma and Shiguang Shan and Xilin CHEN},\nyear={2024},\nurl={https://openreview.net/forum?id=1IIiQnLRe8}\n}", "github": "", "project": "", "reviewers": "k7Jp;BvVD;CShN;d4iz;oBBb", "site": "https://openreview.net/forum?id=1IIiQnLRe8", "pdf_size": 12798916, "rating": "3;3;5;6;6", "confidence": "3;4;4;3;4", "soundness": "2;3;2;3;3", "contribution": "2;2;2;3;4", "presentation": "2;2;3;2;3", "wc_summary": "223;85;54;40;59", "wc_strengths": "40;65;52;42;49", "wc_weaknesses": "640;176;244;151;38", "wc_questions": "11;3;27;2;44", "wc_review": "914;329;377;235;190", "wc_reply_reviewers": "0;0;211;105;30", "wc_reply_authors": "733;457;555;543;504", "reply_reviewers": "0;0;2;1;1", "reply_authors": "2;2;3;2;2", "rating_avg": [ 4.6, 1.3564659966250536 ], "confidence_avg": [ 3.6, 0.4898979485566356 ], "soundness_avg": [ 2.6, 0.4898979485566356 ], "contribution_avg": [ 2.6, 0.8 ], "presentation_avg": [ 2.4, 0.4898979485566356 ], "wc_summary_avg": [ 92.2, 67.00268651330335 ], "wc_strengths_avg": [ 49.6, 8.867919710958146 ], "wc_weaknesses_avg": [ 249.8, 206.08580737158977 ], "wc_questions_avg": [ 17.4, 16.032467059064864 ], "wc_review_avg": [ 409.0, 261.03103263788387 ], "wc_reply_reviewers_avg": [ 69.2, 80.62605038075473 ], "wc_reply_authors_avg": [ 558.4, 93.78187458139232 ], "reply_reviewers_avg": [ 0.8, 0.7483314773547883 ], "reply_authors_avg": [ 2.2, 0.39999999999999997 ], "replies_avg": [ 24, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.06019292654288467, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:ij_hPtLp8ZoJ:scholar.google.com/&scioq=Diversity+Modeling+for+Semantic+Shift+Detection&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;1;0;2", "aff_unique_norm": "Chinese Academy of Sciences;University of Chinese Academy of Sciences;Institute of Computing Technology", "aff_unique_dep": ";;", "aff_unique_url": "https://www.cas.cn;http://www.ucas.ac.cn;http://www.ict.ac.cn", "aff_unique_abbr": "CAS;UCAS;", "aff_campus_unique_index": "", 
"aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "China" }, { "id": "1IaoWBqB6K", "title": "DiffDock-Pocket: Diffusion for Pocket-Level Docking with Sidechain Flexibility", "track": "main", "status": "Reject", "tldr": "", "abstract": "When a small molecule binds to a protein, the 3D structure of the protein and its function change. Understanding this process, called molecular docking, can be crucial in areas such as drug design. Recent learning-based attempts have shown promising results at this task, yet lack features that traditional approaches support. In this work, we close this gap by proposing DiffDock-Pocket, a diffusion-based docking algorithm that is conditioned on a binding target to predict ligand poses only in a specific binding pocket. On top of this, our model supports receptor flexibility and predicts the position of sidechains close to the binding site. Empirically, we improve the state-of-the-art in site-specific-docking on the PDBBind benchmark. Especially when using in-silico generated structures, we achieve more than twice the performance of current methods while being more than 20 times faster than other flexible approaches. Although the model was not trained for cross-docking to different structures, it yields competitive results in this task.", "keywords": "diffusion;diffusion models;docking;generative model", "primary_area": "applications to physical sciences (physics, chemistry, biology, etc.)", "supplementary_material": "", "author": "Michael Plainer;Marcella Toth;Simon Dobers;Hannes Stark;Gabriele Corso;C\u00e9line Marquet;Regina Barzilay", "authorids": "~Michael_Plainer1;~Marcella_Toth1;~Simon_Dobers1;~Hannes_Stark1;~Gabriele_Corso1;~C\u00e9line_Marquet1;~Regina_Barzilay1", "gender": "M;;M;;female;;M", "homepage": "https://plainer.dev;;http://linkedin.com/in/simon-dobers;https://gcorso.github.io/;https://www.regina.csail.mit.edu/;;https://hannes-stark.com/", "dblp": "364/7250.html;;;262/6499;b/ReginaBarzilay;;300/4627", "google_scholar": "7Bnt9kUAAAAJ;;;LUrAYgEAAAAJ;;;bnXfJdEAAAAJ", "orcid": ";0009-0002-0685-8852;;;;0000-0002-8691-5791;0000-0002-4463-326X", "linkedin": "https://linkedin.com/in/plainer/;;;gcorso/;;;hannes-stark/", "or_profile": "~Michael_Plainer1;~Marcella_Toth1;~Simon_Dobers1;~Gabriele_Corso1;~Regina_Barzilay1;~C_Marquet1;~Hannes_St\u00e4rk1", "aff": "Freie Universit\u00e4t Berlin;Technische Universit\u00e4t M\u00fcnchen;;Massachusetts Institute of Technology;Massachusetts Institute of Technology;Technical University Munich;Massachusetts Institute of Technology", "aff_domain": "fu-berlin.de;tum.de;;mit.edu;mit.edu;tum.de;mit.edu", "position": "PhD student;MS student;;PhD student;Professor;PhD student;PhD student", "bibtex": "@misc{\nplainer2024diffdockpocket,\ntitle={DiffDock-Pocket: Diffusion for Pocket-Level Docking with Sidechain Flexibility},\nauthor={Michael Plainer and Marcella Toth and Simon Dobers and Hannes Stark and Gabriele Corso and C{\\'e}line Marquet and Regina Barzilay},\nyear={2024},\nurl={https://openreview.net/forum?id=1IaoWBqB6K}\n}", "github": "", "project": "", "reviewers": "rxhe;Mo9h;TENj;XNuQ", "site": "https://openreview.net/forum?id=1IaoWBqB6K", "pdf_size": 4902112, "rating": "3;5;6;6", "confidence": "4;4;3;3", "soundness": "3;2;3;3", "contribution": "2;2;2;2", "presentation": "3;4;3;3", "wc_summary": "25;52;87;67", "wc_strengths": "46;69;124;40", "wc_weaknesses": "98;285;166;75", "wc_questions": "191;48;145;198", "wc_review": "360;454;522;380", "wc_reply_reviewers": "0;51;122;0", 
"wc_reply_authors": "1333;929;1370;1798", "reply_reviewers": "0;1;1;0", "reply_authors": "3;2;2;3", "rating_avg": [ 5.0, 1.224744871391589 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 57.75, 22.620510604316607 ], "wc_strengths_avg": [ 69.75, 33.138912172852024 ], "wc_weaknesses_avg": [ 156.0, 81.64863746566749 ], "wc_questions_avg": [ 145.5, 59.860253925288355 ], "wc_review_avg": [ 429.0, 64.10148204214939 ], "wc_reply_reviewers_avg": [ 43.25, 50.006874527408726 ], "wc_reply_authors_avg": [ 1357.5, 307.5747876533446 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 2.5, 0.5 ], "replies_avg": [ 22, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.8164965809277259, "gs_citation": 11, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=1742131594736248720&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 3, "aff_unique_index": "0;1;2;2;3;2", "aff_unique_norm": "Freie Universit\u00e4t Berlin;Technische Universit\u00e4t M\u00fcnchen;Massachusetts Institute of Technology;Technical University of Munich", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.fu-berlin.de;https://www.tum.de;https://web.mit.edu;https://www.tum.de", "aff_unique_abbr": "FU Berlin;TUM;MIT;TUM", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;1;1;0;1", "aff_country_unique": "Germany;United States" }, { "id": "1JPfHljXL4", "title": "When, Why and How Much? Adaptive Learning Rate Scheduling by Refinement", "track": "main", "status": "Reject", "tldr": "", "abstract": "In this paper, we present a refined study of learning rate schedules for stochastic gradient descent (SGD). In contrast to most prior works that study the convergence of the average iterate, we study the last iterate, which is what most people use in practice. Furthermore, we break away from the tradition of replacing the gradients with crude upper bounds, which allows us to obtain a \\emph{problem-adaptive} learning rate schedule. Our method is the first systematic approach to \\emph{automatically} yield learning rate warm-up and rapid learning rate annealing near the end of training. In cases where gradient norm information is not available, our theory predicts that the best choice is the linear-decay schedule that sets the stepsize proportionally to $1 - t/T$, where $t$ is the current iteration and $T$ is the total number of steps. Our final theoretical result is an extension of our methodology to coordinate-wise methods. We perform the most comprehensive evaluation of learning rate schedules to date, evaluating across 10 diverse deep learning problems, a series of LLMs, and a suite of logistic regression problems. 
We validate that overall, the linear-decay schedule outperforms all commonly used default schedules including cosine annealing, and that our schedule refinement method gives further improvements.", "keywords": "learning rates; linear decay; deep learning; online learning", "primary_area": "optimization", "supplementary_material": "", "author": "Aaron Defazio;Ashok Cutkosky;Harsh Mehta;Konstantin Mishchenko", "authorids": "~Aaron_Defazio1;~Ashok_Cutkosky1;~Harsh_Mehta1;~Konstantin_Mishchenko1", "gender": "M;;M;", "homepage": "https://www.aarondefazio.com/;http://www.cs.stanford.edu/~ashokc;;https://konstmish.com/", "dblp": "116/2969;191/6725;122/1475;222/9853", "google_scholar": "KEzJsdkAAAAJ;h4AbGp0AAAAJ;murJPNoAAAAJ;Z8Y8nhQAAAAJ", "orcid": ";;;", "linkedin": ";;;", "or_profile": "~Aaron_Defazio1;~Ashok_Cutkosky1;~Harsh_Mehta1;~Konstantin_Mishchenko1", "aff": "Meta;Boston University;Google Research;Samsung", "aff_domain": "meta.com;bu.edu;google.com;samsung.com", "position": "Research Scientist;Assistant Professor;Software Engineer;Researcher", "bibtex": "@misc{\ndefazio2024when,\ntitle={When, Why and How Much? Adaptive Learning Rate Scheduling by Refinement},\nauthor={Aaron Defazio and Ashok Cutkosky and Harsh Mehta and Konstantin Mishchenko},\nyear={2024},\nurl={https://openreview.net/forum?id=1JPfHljXL4}\n}", "github": "", "project": "", "reviewers": "CaT7;NM9Z;BqWo;HeFS;eGse", "site": "https://openreview.net/forum?id=1JPfHljXL4", "pdf_size": 1740080, "rating": "5;5;5;6;8", "confidence": "3;4;3;2;4", "soundness": "2;3;4;3;4", "contribution": "2;2;3;3;4", "presentation": "3;3;3;3;3", "wc_summary": "51;44;55;67;81", "wc_strengths": "62;59;53;64;47", "wc_weaknesses": "20;79;62;109;43", "wc_questions": "153;3;170;26;89", "wc_review": "286;185;340;266;260", "wc_reply_reviewers": "0;0;0;0;0", "wc_reply_authors": "508;451;647;352;210", "reply_reviewers": "0;0;0;0;0", "reply_authors": "1;1;1;1;1", "rating_avg": [ 5.8, 1.16619037896906 ], "confidence_avg": [ 3.2, 0.7483314773547882 ], "soundness_avg": [ 3.2, 0.7483314773547882 ], "contribution_avg": [ 2.8, 0.7483314773547882 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 59.6, 13.047605144240073 ], "wc_strengths_avg": [ 57.0, 6.2289646009589745 ], "wc_weaknesses_avg": [ 62.6, 30.40131576099956 ], "wc_questions_avg": [ 88.2, 66.36083182118801 ], "wc_review_avg": [ 267.4, 49.926345750515324 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 433.6, 146.99197256993324 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.2750095491084634, "gs_citation": 14, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10553505582998704311&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 0, "aff_unique_index": "0;1;2;3", "aff_unique_norm": "Meta;Boston University;Google;Samsung", "aff_unique_dep": "Meta Platforms, Inc.;;Google Research;Samsung", "aff_unique_url": "https://meta.com;https://www.bu.edu;https://research.google;https://www.samsung.com", "aff_unique_abbr": "Meta;BU;Google Research;Samsung", "aff_campus_unique_index": "1", "aff_campus_unique": ";Mountain View", "aff_country_unique_index": "0;0;0;1", "aff_country_unique": "United States;South Korea" }, { "id": "1JR20YOE0H", "title": "On Feature Diversity in Energy-based Models", "track": "main", "status": "Reject", "tldr": "", "abstract": "Energy-based learning is a powerful learning paradigm that encapsulates various discriminative and generative approaches. 
An energy-based model (EBM) is typically formed of inner-model(s) that learn a combination of the different features to generate an energy mapping for each input configuration. In this paper, we focus on the diversity of the produced feature set. We extend the probably approximately correct (PAC) theory of EBMs and analyze the effect of redundancy reduction on the performance of EBMs. We derive novel generalization bounds for various learning contexts, i.e., regression, classification, and implicit regression, with different energy functions and we show that indeed reducing redundancy of the feature set can consistently decrease the gap between the true and empirical expectation of the energy and boosts the performance of the model.", "keywords": "energy-based models;continual learning;redundancy reduction;feature diversity", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/5756c93f3c3852ed2c699584b082a052cdf6601f.zip", "author": "Firas Laakom;Jenni Raitoharju;Alexandros Iosifidis;Moncef Gabbouj", "authorids": "~Firas_Laakom1;~Jenni_Raitoharju1;~Alexandros_Iosifidis2;~Moncef_Gabbouj1", "gender": "M;;M;M", "homepage": ";;https://www.tuni.fi/en/people/alexandros-iosifidis;https://www.tuni.fi/en/moncef-gabbouj", "dblp": "242/8179;;01/9539;08/6597", "google_scholar": "VPWIyx8AAAAJ;;KjsL0KEAAAAJ;cHukfSUAAAAJ", "orcid": "0000-0001-7436-5692;;0000-0003-4807-1345;0000-0002-9788-2323", "linkedin": ";;;moncef-gabbouj-2186282/?originalSubdomain=fi", "or_profile": "~Firas_Laakom1;~Jenni_Raitoharju1;~Alexandros_Iosifidis2;~Moncef_Gabbouj1", "aff": "Tampere University;;Aarhus University;Tampere University", "aff_domain": "tuni.fi;;au.dk;tuni.fi", "position": "PhD student;;Full Professor;Full Professor", "bibtex": "@misc{\nlaakom2024on,\ntitle={On Feature Diversity in Energy-based Models},\nauthor={Firas Laakom and Jenni Raitoharju and Alexandros Iosifidis and Moncef Gabbouj},\nyear={2024},\nurl={https://openreview.net/forum?id=1JR20YOE0H}\n}", "github": "", "project": "", "reviewers": "ZAxa;oMAe;M7of;qchL;UTkN", "site": "https://openreview.net/forum?id=1JR20YOE0H", "pdf_size": 839403, "rating": "5;6;6;6;6", "confidence": "4;2;3;2;3", "soundness": "2;3;3;3;3", "contribution": "2;3;2;2;3", "presentation": "1;3;3;2;2", "wc_summary": "80;78;103;52;137", "wc_strengths": "28;53;36;123;109", "wc_weaknesses": "90;42;167;146;63", "wc_questions": "260;94;132;97;1", "wc_review": "458;267;438;418;310", "wc_reply_reviewers": "158;0;0;30;0", "wc_reply_authors": "304;366;778;697;180", "reply_reviewers": "2;0;0;1;0", "reply_authors": "1;1;1;1;1", "rating_avg": [ 5.8, 0.39999999999999997 ], "confidence_avg": [ 2.8, 0.7483314773547882 ], "soundness_avg": [ 2.8, 0.39999999999999997 ], "contribution_avg": [ 2.4, 0.4898979485566356 ], "presentation_avg": [ 2.2, 0.7483314773547882 ], "wc_summary_avg": [ 90.0, 28.51666179622012 ], "wc_strengths_avg": [ 69.8, 38.82988539771911 ], "wc_weaknesses_avg": [ 101.6, 47.8020920044301 ], "wc_questions_avg": [ 116.8, 83.73625260303926 ], "wc_review_avg": [ 378.2, 75.55766010140864 ], "wc_reply_reviewers_avg": [ 37.6, 61.31101043042758 ], "wc_reply_authors_avg": [ 465.0, 231.8361490363399 ], "reply_reviewers_avg": [ 0.6, 0.7999999999999999 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.8017837257372734, "gs_citation": 8, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=7411738941659034268&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, 
"aff_unique_index": "0;1;0", "aff_unique_norm": "Tampere University;Aarhus University", "aff_unique_dep": ";", "aff_unique_url": "https://www.tuni.fi;https://au.dk", "aff_unique_abbr": "Tuni;AU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;0", "aff_country_unique": "Finland;Denmark" }, { "title": "Denoising Diffusion via Image-Based Rendering", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19594", "id": "1JbsdayvhO", "author_site": "Titas Anciukevi\u010dius, Fabian Manhardt, Federico Tombari, Paul Henderson", "tldr": "", "abstract": "Generating 3D scenes is a challenging open problem, which requires synthesizing plausible content that is fully consistent in 3D space. While recent methods such as neural radiance fields excel at view synthesis and 3D reconstruction, they cannot synthesize plausible details in unobserved regions since they lack a generative capability. Conversely, existing generative methods are typically not capable of reconstructing detailed, large-scale scenes in the wild, as they use limited-capacity 3D scene representations, require aligned camera poses, or rely on additional regularizers. In this work, we introduce the first diffusion model able to perform fast, detailed reconstruction and generation of real-world 3D scenes. To achieve this, we make three contributions. First, we introduce a new neural scene representation, IB-planes, that can efficiently and accurately represent large 3D scenes, dynamically allocating more capacity as needed to capture details visible in each image. Second, we propose a denoising-diffusion framework to learn a prior over this novel 3D scene representation, using only 2D images without the need for any additional supervision signal such as masks or depths. This supports 3D reconstruction and generation in a unified architecture. Third, we develop a principled approach to avoid trivial 3D solutions when integrating the image-based rendering with the diffusion model, by dropping out representations of some images. 
We evaluate the model on several challenging datasets of real and synthetic images, and demonstrate superior results on generation, novel view synthesis and 3D reconstruction.", "keywords": "Neural Scene Representations;Generative Models;Denoising Diffusion;3D Reconstruction", "primary_area": "generative models", "supplementary_material": "/attachment/13f97cec1247b17971e7bab7e4dd3526c4b1a2ea.zip", "author": "Titas Anciukevi\u010dius;Fabian Manhardt;Federico Tombari;Paul Henderson", "authorids": "~Titas_Anciukevi\u010dius1;~Fabian_Manhardt1;~Federico_Tombari1;~Paul_Henderson1", "gender": "M;M;M;", "homepage": "https://www.anciukevicius.com/;http://campar.in.tum.de/Main/FabianManhardt;https://federicotombari.github.io/;http://www.pmh47.net", "dblp": "262/3972;173/9271;16/3539;172/1394", "google_scholar": "N8xNl8kAAAAJ;https://scholar.google.de/citations?user=bERItx8AAAAJ;TFsE4BIAAAAJ;https://scholar.google.co.uk/citations?user=HN7fd4MAAAAJ", "orcid": ";0000-0002-4577-4590;0000-0001-5598-5212;", "linkedin": "titas-anciukevicius/;;fedet/;", "or_profile": "~Titas_Anciukevi\u010dius1;~Fabian_Manhardt1;~Federico_Tombari1;~Paul_Henderson1", "aff": "University of Edinburgh;Google;Technical University Munich (TUM);Institute of Science and Technology Austria", "aff_domain": "ed.ac.uk;google.com;in.tum.de;ist.ac.at", "position": "PhD student;Researcher;Lecturer;Postdoc", "bibtex": "@inproceedings{\nanciukevi{\\v{c}}ius2024denoising,\ntitle={Denoising Diffusion via Image-Based Rendering},\nauthor={Titas Anciukevi{\\v{c}}ius and Fabian Manhardt and Federico Tombari and Paul Henderson},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=1JbsdayvhO}\n}", "github": "", "project": "", "reviewers": "a83P;C6XK;MQQ6;Wz4z", "pdf_size": 19513544, "rating": "6;6;6;8", "confidence": "5;3;4;3", "soundness": "3;3;2;3", "contribution": "2;3;2;3", "presentation": "3;2;3;3", "wc_summary": "83;81;61;82", "wc_strengths": "40;34;73;77", "wc_weaknesses": "249;131;116;188", "wc_questions": "215;69;64;213", "wc_review": "587;315;314;560", "wc_reply_reviewers": "941;80;0;44", "wc_reply_authors": "2099;423;266;1492", "reply_reviewers": "3;2;0;1", "reply_authors": "4;2;1;3", "rating_avg": [ 6.5, 0.8660254037844386 ], "confidence_avg": [ 3.75, 0.82915619758885 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 76.75, 9.12071817347735 ], "wc_strengths_avg": [ 56.0, 19.170289512680814 ], "wc_weaknesses_avg": [ 171.0, 52.4356748788456 ], "wc_questions_avg": [ 140.25, 73.77457217768192 ], "wc_review_avg": [ 444.0, 129.8518386469749 ], "wc_reply_reviewers_avg": [ 266.25, 390.59593891898055 ], "wc_reply_authors_avg": [ 1070.0, 758.6089242818067 ], "reply_reviewers_avg": [ 1.5, 1.118033988749895 ], "reply_authors_avg": [ 2.5, 1.118033988749895 ], "replies_avg": [ 23, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.5222329678670935, "gs_citation": 11, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=16540492762930564730&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=1JbsdayvhO", "pdf": "https://openreview.net/pdf?id=1JbsdayvhO", "email": "ed.ac.uk;google.com;in.tum.de;ist.ac.at", "author_num": 4, "aff_unique_index": "0;1;2;3", "aff_unique_norm": "University of Edinburgh;Google;Technical University Munich;Institute of Science and Technology Austria", "aff_unique_dep": ";Google;;", 
"aff_unique_url": "https://www.ed.ac.uk;https://www.google.com;https://www.tum.de;https://www.ist.ac.at", "aff_unique_abbr": "Edinburgh;Google;TUM;IST Austria", "aff_campus_unique_index": "1", "aff_campus_unique": ";Mountain View", "aff_country_unique_index": "0;1;2;3", "aff_country_unique": "United Kingdom;United States;Germany;Austria" }, { "id": "1JiIKjcwrr", "title": "Robust Self-supervised Learning in Heterogeneous Graph Based on Feature-Topology Balancing", "track": "main", "status": "Reject", "tldr": "", "abstract": "In recent years, graph neural network (GNN) based self-supervised learning in heterogeneous information networks (HINs) has gathered considerable attention. Most of the past studies followed a message passing approach where the features of a central node are updated based on the features of its neighboring nodes. Since these methods depend on informative graph topology and node features, their performance significantly deteriorates when there is an issue in one factor. Moreover, since real-world HINs are highly noisy and validating the importance of attributes is challenging, it is rare to find cases where both the graph topology and node features are of good quality. To address this problem, we make the first model that can explicitly separate the graph topology and features in the heterogeneous graph by proposing the novel framework BFTNet (robust self-supervised heterogeneous graph learning using the Balance between node Features and graph Topology). BFTNet employs a knowledge graph embedding module focusing on global graph topology and a contrastive learning module dedicated to learning node features. Thanks to the novel structure that handles graph topology and node features separately, BFTNet can assign higher importance to one factor, thereby allowing it to effectively respond to skewed datasets in real-world situations. Moreover, BFTNet can improve performance by designing the optimal module suited for learning the topology and features, without sacrificing the performance of one modality to reflect the characteristics of the other modality. Lastly, BFTNet implemented a novel graph conversion scheme and representation fusion method to ensure that the representation of topology and features are effectively learned and integrated. The self-supervised learning performance of BFTNet is verified by extensive experiments on four real-world benchmark datasets, and the robustness of BFTNet is demonstrated with the experiments on noisy datasets. 
The source code of BFTNet will be available in the final version.", "keywords": "Heterogeneous Graph;Knowledge graph;Self-supervised learning", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/a8e6c444cea675e439d445a1845569e0dfd43c0e.zip", "author": "Junyong Ahn;Bong Gyun Kang;Hyeongrok Han;Sungroh Yoon", "authorids": "~Junyong_Ahn2;~Bong_Gyun_Kang1;~Hyeongrok_Han1;~Sungroh_Yoon1", "gender": "M;M;M;", "homepage": "https://github.com/jyahn215;https://github.com/Pusheen-cat;;http://ailab.snu.ac.kr", "dblp": ";369/7132;285/5845;99/1474", "google_scholar": ";iuMRdnIAAAAJ;VpV7QEkAAAAJ;Bphl_fIAAAAJ", "orcid": ";0000-0002-2287-4564;;0000-0002-2367-197X", "linkedin": ";;;", "or_profile": "~Junyong_Ahn2;~Bong_Gyun_Kang1;~Hyeongrok_Han1;~Sungroh_Yoon1", "aff": "Seoul National University;Seoul National University;Seoul National University;Seoul National University", "aff_domain": "snu.ac.kr;snu.ac.kr;snu.ac.kr;snu.ac.kr", "position": "MS student;PhD student;PhD student;Full Professor", "bibtex": "@misc{\nahn2024robust,\ntitle={Robust Self-supervised Learning in Heterogeneous Graph Based on Feature-Topology Balancing},\nauthor={Junyong Ahn and Bong Gyun Kang and Hyeongrok Han and Sungroh Yoon},\nyear={2024},\nurl={https://openreview.net/forum?id=1JiIKjcwrr}\n}", "github": "", "project": "", "reviewers": "jyGu;69NY;KdXi", "site": "https://openreview.net/forum?id=1JiIKjcwrr", "pdf_size": 508664, "rating": "3;3;6", "confidence": "4;5;3", "soundness": "2;3;4", "contribution": "2;3;3", "presentation": "2;3;4", "wc_summary": "90;56;55", "wc_strengths": "37;40;127", "wc_weaknesses": "214;184;265", "wc_questions": "2;2;62", "wc_review": "343;282;509", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "228;118;269", "reply_reviewers": "0;0;0", "reply_authors": "1;1;1", "rating_avg": [ 4.0, 1.4142135623730951 ], "confidence_avg": [ 4.0, 0.816496580927726 ], "soundness_avg": [ 3.0, 0.816496580927726 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 3.0, 0.816496580927726 ], "wc_summary_avg": [ 67.0, 16.268579122549905 ], "wc_strengths_avg": [ 68.0, 41.737273509418415 ], "wc_weaknesses_avg": [ 221.0, 33.436506994600975 ], "wc_questions_avg": [ 22.0, 28.284271247461902 ], "wc_review_avg": [ 378.0, 95.9201056435337 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 205.0, 63.75473838599502 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 8, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.8660254037844387, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:eM5Lv-gU-UwJ:scholar.google.com/&scioq=Robust+Self-supervised+Learning+in+Heterogeneous+Graph+Based+on+Feature-Topology+Balancing&hl=en&as_sdt=0,44", "gs_version_total": 0, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "Seoul National University", "aff_unique_dep": "", "aff_unique_url": "https://www.snu.ac.kr", "aff_unique_abbr": "SNU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "South Korea" }, { "title": "Neural Architecture Retrieval", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19593", "id": "1JtTPYBKqt", "author_site": "Xiaohuan Pei, Yanxi Li, Minjing Dong, Chang Xu", "tldr": "", "abstract": "With the increasing number of new neural architecture designs and substantial existing neural architectures, it becomes 
difficult for the researchers to situate their contributions compared with existing neural architectures or establish the connections between their designs and other relevant ones. To discover similar neural architectures in an efficient and automatic manner, we define a new problem Neural Architecture Retrieval which retrieves a set of existing neural architectures which have similar designs to the query neural architecture. Existing graph pre-training strategies cannot address the computational graph in neural architectures due to the graph size and motifs. To fulfill this potential, we propose to divide the graph into motifs which are used to rebuild the macro graph to tackle these issues, and introduce multi-level contrastive learning to achieve accurate graph representation learning. Extensive evaluations on both human-designed and synthesized neural architectures demonstrate the superiority of our algorithm. Such a dataset which contains 12k real-world network architectures, as well as their embedding, is built for neural architecture retrieval.", "keywords": "Information Retrieval;Vector Database;Neural Architecture Search", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/cca9b9f3c82ab4d835a6c262d56f627308c858d8.zip", "author": "Xiaohuan Pei;Yanxi Li;Minjing Dong;Chang Xu", "authorids": "~Xiaohuan_Pei1;~Yanxi_Li1;~Minjing_Dong1;~Chang_Xu4", "gender": ";M;M;", "homepage": ";;https://www.cs.cityu.edu.hk/~minjdong/;", "dblp": ";24/5261-1;246/2900.html;", "google_scholar": ";;https://scholar.google.com.au/citations?user=gJJRqlsAAAAJ;", "orcid": ";;0009-0003-1717-818X;", "linkedin": ";yanxi-li-3245a511a/;;", "or_profile": "~Xiaohuan_Pei1;~Yanxi_Li1;~Minjing_Dong1;~Chang_Xu4", "aff": ";University of Sydney;City University of Hong Kong;", "aff_domain": ";uni.sydney.edu.au;cityu.edu.hk;", "position": ";PhD student;Assistant Professor;", "bibtex": "@inproceedings{\npei2024neural,\ntitle={Neural Architecture Retrieval},\nauthor={Xiaohuan Pei and Yanxi Li and Minjing Dong and Chang Xu},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=1JtTPYBKqt}\n}", "github": "", "project": "", "reviewers": "NBZG;BEfk;wPum", "pdf_size": 4869531, "rating": "6;8;8", "confidence": "5;5;5", "soundness": "3;4;3", "contribution": "2;4;3", "presentation": "3;3;3", "wc_summary": "65;223;99", "wc_strengths": "86;182;148", "wc_weaknesses": "126;114;277", "wc_questions": "23;46;20", "wc_review": "300;565;544", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "1061;561;532", "reply_reviewers": "0;0;0", "reply_authors": "2;1;1", "rating_avg": [ 7.333333333333333, 0.9428090415820634 ], "confidence_avg": [ 5.0, 0.0 ], "soundness_avg": [ 3.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 3.0, 0.816496580927726 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 129.0, 67.90189000805992 ], "wc_strengths_avg": [ 138.66666666666666, 39.74362282877035 ], "wc_weaknesses_avg": [ 172.33333333333334, 74.17247168293339 ], "wc_questions_avg": [ 29.666666666666668, 11.61416759345623 ], "wc_review_avg": [ 469.6666666666667, 120.27838080423635 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 718.0, 242.82641262158174 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.3333333333333333, 0.4714045207910317 ], "replies_avg": [ 9, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": 
"https://scholar.google.com/scholar?q=related:9O_pp0lZQCcJ:scholar.google.com/&scioq=Neural+Architecture+Retrieval&hl=en&as_sdt=0,33", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=1JtTPYBKqt", "pdf": "https://openreview.net/pdf?id=1JtTPYBKqt", "email": ";uni.sydney.edu.au;cityu.edu.hk;", "author_num": 4, "aff_unique_index": "0;1", "aff_unique_norm": "University of Sydney;City University of Hong Kong", "aff_unique_dep": ";", "aff_unique_url": "https://www.sydney.edu.au;https://www.cityu.edu.hk", "aff_unique_abbr": "USYD;CityU", "aff_campus_unique_index": "1", "aff_campus_unique": ";Hong Kong SAR", "aff_country_unique_index": "0;1", "aff_country_unique": "Australia;China" }, { "id": "1JuMFjSkpD", "title": "Fair Attribute Classification via Distance Covariance", "track": "main", "status": "Reject", "tldr": "", "abstract": "With the increasing prevalence of machine learning, concerns about fairness have emerged. Mitigating potential discrimination risks and preventing machine learning algorithms from making unfair predictions are essential goals in fairness machine learning. We tackle this challenge from a statistical perspective, utilizing distance covariance\u2014a powerful statistical method for measuring both linear and non-linear correlations\u2014as a measure to assess the independence between predictions and sensitive attributes. To enhance fairness in classification, we integrate the sample distance covariance as a manageable penalty term into the machine learning process to promote independence. Additionally, we optimize this constrained problem using the Lagrangian dual method, offering a better trade-off between accuracy and fairness. Theoretically, we provide a proof for the convergence between sample and population distance covariance, establishing necessary guarantees for batch computations. 
Through experiments conducted on a range of real-world datasets, we demonstrate that our approach can seamlessly extend to existing machine learning models and deliver competitive results.", "keywords": "Fair classification;distance covariance;Lagrange dual optimization;convergence in probability", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/eb522602cfe7be7ae88865bcbfeb59937ab0a8d9.pdf", "author": "Ruifan Huang;Haixia Liu", "authorids": "~Ruifan_Huang1;~Haixia_Liu1", "gender": "M;F", "homepage": "https://ruistarlit.github.io/;http://faculty.hust.edu.cn/liuhaixia1/en/index.htm", "dblp": ";", "google_scholar": ";", "orcid": ";", "linkedin": ";", "or_profile": "~Ruifan_Huang1;~Haixia_Liu1", "aff": "Huazhong University of Science and Technology;Huazhong University of Science and Technology", "aff_domain": "hust.edu.cn;hust.edu.cn", "position": "MS student;Associate Professor", "bibtex": "@misc{\nhuang2024fair,\ntitle={Fair Attribute Classification via Distance Covariance},\nauthor={Ruifan Huang and Haixia Liu},\nyear={2024},\nurl={https://openreview.net/forum?id=1JuMFjSkpD}\n}", "github": "", "project": "", "reviewers": "zY1Z;uH68;eHoC;8JtY", "site": "https://openreview.net/forum?id=1JuMFjSkpD", "pdf_size": 1033743, "rating": "5;5;5;5", "confidence": "3;4;3;4", "soundness": "2;3;3;3", "contribution": "2;2;2;3", "presentation": "3;3;3;3", "wc_summary": "40;75;95;60", "wc_strengths": "56;58;28;101", "wc_weaknesses": "151;176;87;271", "wc_questions": "138;26;531;21", "wc_review": "385;335;741;453", "wc_reply_reviewers": "0;40;0;93", "wc_reply_authors": "860;1419;0;1316", "reply_reviewers": "0;1;0;1", "reply_authors": "2;3;0;3", "rating_avg": [ 5.0, 0.0 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 67.5, 20.155644370746373 ], "wc_strengths_avg": [ 60.75, 26.089988501338976 ], "wc_weaknesses_avg": [ 171.25, 66.10739368633436 ], "wc_questions_avg": [ 179.0, 208.54136280364142 ], "wc_review_avg": [ 478.5, 157.23469718862947 ], "wc_reply_reviewers_avg": [ 33.25, 38.16657569130351 ], "wc_reply_authors_avg": [ 898.75, 559.9131070978782 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 2.0, 1.224744871391589 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:lvflX29AApEJ:scholar.google.com/&scioq=Fair+Attribute+Classification+via+Distance+Covariance&hl=en&as_sdt=0,23", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "Huazhong University of Science and Technology", "aff_unique_dep": "", "aff_unique_url": "http://www.hust.edu.cn", "aff_unique_abbr": "HUST", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "China" }, { "id": "1M0qIxVKf6", "title": "Uncovering hidden geometry in Transformers via disentangling position and context", "track": "main", "status": "Reject", "tldr": "", "abstract": "Transformers are widely used to extract complex semantic meanings from input tokens, yet they usually operate as black-box models. In this paper, we present a simple yet informative decomposition of hidden states (or embeddings) of trained transformers into interpretable components. For any layer, embedding vectors of input sequence samples are a tensor $h \\in R^{C \\times T \\times d}$. 
Given embedding vector $h_{c,t} \\in R^d$ at sequence position $t \\le T$ in a sequence (or context) $c \\le C$, extracting the mean effects yields the decomposition \n$$\nh_{c,t} = \\mu + pos_t + ctx_c + resid_{c,t}\n$$\nwhere $\\mu$ is the global mean vector, $pos_t$ and $ctx_c$ are the mean vectors across contexts and across positions respectively, and $resid_{c,t}$ is the residual vector. For popular transformer architectures and diverse text datasets, empirically we find pervasive mathematical structure: (1) $(pos_t)_t$ forms a low-dimensional, continuous, and often spiral shape across layers, (2) $(ctx_c)_c$ shows \nclear cluster structure that falls into context topics, and (3) $(pos_t)_t$ and $(ctx_c)_c$ are mutually incoherent---namely $pos_t$ is almost orthogonal to $ctx_c$---which is canonical in compressed sensing and dictionary learning. This decomposition offers structural insights about input formats in in-context learning (especially for induction heads) and in length generalization (especially for arithmetic tasks).", "keywords": "Transformers;Positional embeddings;Incoherence;Induction head;Attention;Interpreting neural nets;Visualization", "primary_area": "visualization or interpretation of learned representations", "supplementary_material": "/attachment/bd2c2ad65b25ecc5a786e93647fbff84b987b2b0.zip", "author": "Jiajun Song;Yiqiao Zhong", "authorids": "~Jiajun_Song3;~Yiqiao_Zhong1", "gender": "M;M", "homepage": "https://jiajunsong629.github.io/;https://pages.stat.wisc.edu/~zhong35/", "dblp": ";140/7265", "google_scholar": ";", "orcid": ";", "linkedin": ";", "or_profile": "~Jiajun_Song3;~Yiqiao_Zhong1", "aff": "Beijing Institute for General Artificial Intelligence;University of Wisconsin - Madison", "aff_domain": "bigai.ai;wisc.edu", "position": "Researcher;Assistant Professor", "bibtex": "@misc{\nsong2024uncovering,\ntitle={Uncovering hidden geometry in Transformers via disentangling position and context},\nauthor={Jiajun Song and Yiqiao Zhong},\nyear={2024},\nurl={https://openreview.net/forum?id=1M0qIxVKf6}\n}", "github": "", "project": "", "reviewers": "rGTL;K9yz;Jv3k", "site": "https://openreview.net/forum?id=1M0qIxVKf6", "pdf_size": 14405346, "rating": "5;5;6", "confidence": "3;3;3", "soundness": "2;2;2", "contribution": "2;3;3", "presentation": "3;2;2", "wc_summary": "59;61;95", "wc_strengths": "33;88;73", "wc_weaknesses": "128;5;248", "wc_questions": "73;201;130", "wc_review": "293;355;546", "wc_reply_reviewers": "64;0;0", "wc_reply_authors": "486;448;742", "reply_reviewers": "1;0;0", "reply_authors": "1;1;1", "rating_avg": [ 5.333333333333333, 0.4714045207910317 ], "confidence_avg": [ 3.0, 0.0 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 71.66666666666667, 16.519348924485158 ], "wc_strengths_avg": [ 64.66666666666667, 23.21398046197353 ], "wc_weaknesses_avg": [ 127.0, 99.20685460188726 ], "wc_questions_avg": [ 134.66666666666666, 52.359865885576475 ], "wc_review_avg": [ 398.0, 107.669246615116 ], "wc_reply_reviewers_avg": [ 21.333333333333332, 30.169889330626027 ], "wc_reply_authors_avg": [ 558.6666666666666, 130.5611819118616 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 9, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 12, "gs_cited_by_link": 
"https://scholar.google.com/scholar?cites=14630901236651546134&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "aff_unique_index": "0;1", "aff_unique_norm": "Beijing Institute for General Artificial Intelligence;University of Wisconsin-Madison", "aff_unique_dep": ";", "aff_unique_url": "http://www.bigaiai.org/;https://www.wisc.edu", "aff_unique_abbr": "BIGAI;UW-Madison", "aff_campus_unique_index": "1", "aff_campus_unique": ";Madison", "aff_country_unique_index": "0;1", "aff_country_unique": "China;United States" }, { "id": "1M8yDTa0Pp", "title": "Cross-Model Semi-Supervised Prompt Learning for Vision-Language Models", "track": "main", "status": "Reject", "tldr": "", "abstract": "Prompt learning, which focuses on learning continuous soft prompts, has emerged as a promising approach for\nefficiently adapting pretrained vision-language models (VLMs) to multiple downstream tasks. While prior works have shown promising performances on common benchmarks, they typically rely on labeled data samples only. This greatly discredits the information gain from the vast collection of otherwise unlabeled samples available in the wild. To mitigate this, we propose a simple yet efficient cross-model framework to leverage on the unlabeled samples achieving significant gain in model performance. Specifically, we employ a semi-supervised prompt learning approach which makes the learned prompts invariant to the different views of a given unlabeled sample. The multiple views are obtained using different augmentations on the images as well as by varying the lengths of visual and text prompts attached to these samples. Experimenting with this simple yet surprisingly effective approach over a large number of benchmark datasets, we observe a considerable improvement in the quality of soft prompts thereby making an immense gain in image classification performance. Interestingly, our approach also benefits from out-of-domain unlabeled images highlighting the robustness and generalization capabilities. 
Our code will be made publicly available.", "keywords": "Semi-supervised learning;prompt learning;multi-modal learning;vision-language models", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/db10f3d5d8691e6f71ca4c0b745c7f4a44b306fd.zip", "author": "Omprakash Chakraborty;Aadarsh Sahoo;Rameswar Panda;Abir Das", "authorids": "~Omprakash_Chakraborty1;~Aadarsh_Sahoo1;~Rameswar_Panda1;~Abir_Das4", "gender": "M;M;M;M", "homepage": ";https://aadsah.github.io/;https://rpand002.github.io/;http://cse.iitkgp.ac.in/~adas/", "dblp": "182/4466.html;272/5285;126/0986;141/1311", "google_scholar": "https://scholar.google.co.in/citations?user=Z0uiqiIAAAAJ;https://scholar.google.co.in/citations?user=1nPhcH0AAAAJ;_ySuu6gAAAAJ;L4yEk2UAAAAJ", "orcid": ";;;", "linkedin": ";aadsah/;;", "or_profile": "~Omprakash_Chakraborty1;~Aadarsh_Sahoo1;~Rameswar_Panda1;~Abir_Das4", "aff": "Indian Institute of Technology Kharagpur, Dhirubhai Ambani Institute Of Information and Communication Technology;California Institute of Technology;MIT-IBM Watson AI Lab;Indian Institute of Technology Kharagpur", "aff_domain": "iitkgp.ac.in;caltech.edu;ibm.com;iitkgp.ac.in", "position": "PhD student;PhD student;Research Scientist;Assistant Professor", "bibtex": "@misc{\nchakraborty2024crossmodel,\ntitle={Cross-Model Semi-Supervised Prompt Learning for Vision-Language Models},\nauthor={Omprakash Chakraborty and Aadarsh Sahoo and Rameswar Panda and Abir Das},\nyear={2024},\nurl={https://openreview.net/forum?id=1M8yDTa0Pp}\n}", "github": "", "project": "", "reviewers": "MsJj;f2tm;xki8;18u3", "site": "https://openreview.net/forum?id=1M8yDTa0Pp", "pdf_size": 10629665, "rating": "3;3;6;6", "confidence": "4;4;4;5", "soundness": "1;3;3;3", "contribution": "1;2;3;3", "presentation": "2;2;3;4", "wc_summary": "97;65;66;140", "wc_strengths": "49;36;71;56", "wc_weaknesses": "742;59;98;135", "wc_questions": "16;98;31;58", "wc_review": "904;258;266;389", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "1882;1229;375;1535", "reply_reviewers": "0;0;0;0", "reply_authors": "4;3;2;3", "rating_avg": [ 4.5, 1.5 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.8660254037844386 ], "contribution_avg": [ 2.25, 0.82915619758885 ], "presentation_avg": [ 2.75, 0.82915619758885 ], "wc_summary_avg": [ 92.0, 30.553232234904378 ], "wc_strengths_avg": [ 53.0, 12.62933094031509 ], "wc_weaknesses_avg": [ 258.5, 280.43938739057324 ], "wc_questions_avg": [ 50.75, 31.155858197135252 ], "wc_review_avg": [ 454.25, 264.8040549160832 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 1255.25, 558.2572771581218 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 3.0, 0.7071067811865476 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.5773502691896258, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:Leqmo6cva9YJ:scholar.google.com/&scioq=Cross-Model+Semi-Supervised+Prompt+Learning+for+Vision-Language+Models&hl=en&as_sdt=0,14", "gs_version_total": 0, "aff_unique_index": "0;1;2;0", "aff_unique_norm": "Indian Institute of Technology Kharagpur;California Institute of Technology;Massachusetts Institute of Technology", "aff_unique_dep": ";;IBM Watson AI Lab", "aff_unique_url": "https://www.iitkgp.ac.in;https://www.caltech.edu;https://www.mitibmwatsonailab.org", "aff_unique_abbr": "IIT Kharagpur;Caltech;MIT-IBM AI Lab", "aff_campus_unique_index": "0;1;0", 
"aff_campus_unique": "Kharagpur;Pasadena;", "aff_country_unique_index": "0;1;1;0", "aff_country_unique": "India;United States" }, { "id": "1MRfyGLCcU", "title": "Graph Representation Learning enhanced Semi-supervised Feature Selection", "track": "main", "status": "Reject", "tldr": "", "abstract": "Feature selection process is essential in machine learning by discovering the most relevant features to the modeling target. By exploring the potential complex correlations among features of unlabeled data, recently introduced self-supervision-enhanced feature selection greatly reduces the reliance on the labeled samples. However, they are generally based on the autoencoder with sample-wise self-supervision, which can hardly exploit relations among samples. To address this limitation, this paper proposes Graph representation learning enhanced Semi-supervised Feature Selection(G-FS) which performs feature selection based on the discovery and exploitation of the non-Euclidean relations among features and samples by translating unlabeled ``plain\" tabular data into a bipartite graph. A self-supervised edge prediction task is designed to distill rich information on the graph into low-dimensional embeddings, which remove redundant features and noise. Guided by the condensed graph representation, we propose a batch-attention feature weight generation mechanism that generates more robust weights according to batch-based selection patterns rather than individual samples. The results show that G-FS achieves significant performance edges in 12 datasets compared to ten state-of-the-art baselines, including two recent self-supervised baselines.", "keywords": "Feature Selection\uff1bGraph Representation Learning; Batch Attention", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Jun Tan;Zhifeng Qiu;Ning Gui", "authorids": "~Jun_Tan3;~Zhifeng_Qiu2;~Ning_Gui1", "gender": ";;M", "homepage": ";https://faculty.csu.edu.cn/qiuzhifeng/zh_CN/index.htm;https://faculty.csu.edu.cn/guining/zh_CN/index.htm", "dblp": ";;30/3048", "google_scholar": ";;https://scholar.google.com/citations?hl=zh-CN", "orcid": "0000-0002-3236-7275;;", "linkedin": ";;", "or_profile": "~Jun_Tan3;~Zhifeng_Qiu2;~Ning_Gui1", "aff": "Central South University;;Central South University", "aff_domain": "csu.edu.cn;;csu.edu.cn", "position": "MS student;;Full Professor", "bibtex": "@misc{\ntan2024graph,\ntitle={Graph Representation Learning enhanced Semi-supervised Feature Selection},\nauthor={Jun Tan and Zhifeng Qiu and Ning Gui},\nyear={2024},\nurl={https://openreview.net/forum?id=1MRfyGLCcU}\n}", "github": "", "project": "", "reviewers": "AraV;s9w1;n2md;KtqB", "site": "https://openreview.net/forum?id=1MRfyGLCcU", "pdf_size": 10610776, "rating": "3;5;5;6", "confidence": "4;4;3;4", "soundness": "2;2;3;3", "contribution": "1;3;2;3", "presentation": "2;3;2;2", "wc_summary": "83;58;76;120", "wc_strengths": "17;23;30;54", "wc_weaknesses": "91;59;19;124", "wc_questions": "8;59;78;44", "wc_review": "199;199;203;342", "wc_reply_reviewers": "0;38;0;0", "wc_reply_authors": "370;577;563;799", "reply_reviewers": "0;1;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 4.75, 1.0897247358851685 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.25, 0.82915619758885 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 84.25, 22.56518335843961 ], "wc_strengths_avg": [ 31.0, 14.053469322555197 ], 
"wc_weaknesses_avg": [ 73.25, 38.84826250940961 ], "wc_questions_avg": [ 47.25, 25.66490794840301 ], "wc_review_avg": [ 235.75, 61.36519779158216 ], "wc_reply_reviewers_avg": [ 9.5, 16.454482671904334 ], "wc_reply_authors_avg": [ 577.25, 151.92823141207165 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.13245323570650439, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:lni0FW7_iHwJ:scholar.google.com/&scioq=Graph+Representation+Learning+enhanced+Semi-supervised+Feature+Selection&hl=en&as_sdt=0,44", "gs_version_total": 2, "aff_unique_index": "0;0", "aff_unique_norm": "Central South University", "aff_unique_dep": "", "aff_unique_url": "https://www.csu.edu.cn", "aff_unique_abbr": "CSU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "China" }, { "id": "1MXQBsHA4Q", "title": "Revisiting Supervision for Continual Representation Learning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "In the field of continual learning, models are designed to learn tasks one after the other. While most research has centered on supervised continual learning, there is a growing interest in unsupervised continual learning, which makes use of the vast amounts of unlabeled data. Recent studies have highlighted the strengths of unsupervised methods, particularly self-supervised learning, in providing robust representations. The improved transferability of those representations built with self-supervised methods is often associated with the role played by the multi-layer perceptron projector. In this work, we depart from this observation and reexamine the role of supervision in continual representation learning. We reckon that additional information, such as human annotations, should not deteriorate the quality of representations. Our findings show that supervised models when enhanced with a multi-layer perceptron head, can outperform self-supervised models in continual representation learning. 
This highlights the importance of the multi-layer perceptron projector in shaping feature transferability across a sequence of tasks in continual learning.", "keywords": "continual learning;self-supervised representation learning", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "/attachment/bdc8ba3e3ea936fda0476f4ddaf7679ba78196e0.zip", "author": "Daniel Marczak;Sebastian Cygert;Tomasz Trzcinski;Bart\u0142omiej Twardowski", "authorids": "~Daniel_Marczak2;~Sebastian_Cygert1;~Tomasz_Trzcinski2;~Bart\u0142omiej_Twardowski1", "gender": ";M;M;M", "homepage": ";https://pg.edu.pl/en/p/sebastian-cygert-1128802;https://cvlab.ii.pw.edu.pl/ttrzcins/;", "dblp": ";138/3693;05/11408;156/6628", "google_scholar": "Vs4kBzQAAAAJ;https://scholar.google.pl/citations?user=wLH9PP8AAAAJ;https://scholar.google.pl/citations?user=bJMRBFoAAAAJ;https://scholar.google.pl/citations?user=8yywECgAAAAJ", "orcid": ";;;0000-0003-2117-8679", "linkedin": ";sebastiancygert/;;bartlomiejtwardowski/", "or_profile": "~Daniel_Marczak2;~Sebastian_Cygert1;~Tomasz_Trzcinski2;~Bart\u0142omiej_Twardowski1", "aff": "Warsaw University of Technology;IDEAS NCBR;Warsaw University of Technology;Computer Vision Center, Universitat Aut\u00f2noma de Barcelona", "aff_domain": "pw.edu.pl;ideas-ncbr.pl;pw.edu.pl;cvc.uab.es", "position": "PhD student;Postdoc;Full Professor;Postdoc", "bibtex": "@misc{\nmarczak2024revisiting,\ntitle={Revisiting Supervision for Continual Representation Learning},\nauthor={Daniel Marczak and Sebastian Cygert and Tomasz Trzcinski and Bart{\\l}omiej Twardowski},\nyear={2024},\nurl={https://openreview.net/forum?id=1MXQBsHA4Q}\n}", "github": "", "project": "", "reviewers": "Zari;6fut;vMLn", "site": "https://openreview.net/forum?id=1MXQBsHA4Q", "pdf_size": 1605415, "rating": "3;3;5", "confidence": "5;3;2", "soundness": "2;2;3", "contribution": "2;2;2", "presentation": "3;3;2", "wc_summary": "102;81;155", "wc_strengths": "138;40;55", "wc_weaknesses": "384;172;177", "wc_questions": "225;5;95", "wc_review": "849;298;482", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 3.6666666666666665, 0.9428090415820634 ], "confidence_avg": [ 3.3333333333333335, 1.247219128924647 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 112.66666666666667, 31.13768706175132 ], "wc_strengths_avg": [ 77.66666666666667, 43.099368389287974 ], "wc_weaknesses_avg": [ 244.33333333333334, 98.7803399242762 ], "wc_questions_avg": [ 108.33333333333333, 90.30811456096045 ], "wc_review_avg": [ 543.0, 229.0429362950682 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 3, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.7559289460184545, "gs_citation": 6, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=9566271489219903541&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 11, "aff_unique_index": "0;1;0;2", "aff_unique_norm": "Warsaw University of Technology;Institute for Development, Economic Analysis, and Simulation (IDEAS);Universitat Aut\u00f2noma de Barcelona", "aff_unique_dep": ";;Computer Vision Center", "aff_unique_url": "https://www.pw.edu.pl;https://www.ideas-ncbr.gov.pl;https://www.uab.cat", "aff_unique_abbr": "WUT;IDEAS;UAB", "aff_campus_unique_index": "", 
"aff_campus_unique": "", "aff_country_unique_index": "0;0;0;1", "aff_country_unique": "Poland;Spain" }, { "title": "Data Distillation Can Be Like Vodka: Distilling More Times For Better Quality", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19592", "id": "1NHgmKqOzZ", "author_site": "Xuxi Chen, Yu Yang, Zhangyang Wang, Baharan Mirzasoleiman", "tldr": "", "abstract": "Dataset distillation aims to minimize the time and memory needed for training deep networks on large datasets, by creating a small set of synthetic images that has a similar generalization performance to that of the full dataset. However, current dataset distillation techniques fall short, showing a notable performance gap compared to training on the original data. In this work, we are the first to argue that the use of only one synthetic subset for distillation may not yield optimal generalization performance. This is because the training dynamics of deep networks drastically changes during training. Therefore, multiple synthetic subsets are required to capture the dynamics of training in different stages. To address this issue, we propose Progressive Dataset Distillation (PDD). PDD synthesizes multiple small sets of synthetic images, each conditioned on the previous sets, and trains the model on the cumulative union of these subsets without requiring additional training time. Our extensive experiments show that PDD can effectively improve the performance of existing dataset distillation methods by up to 4.3%. In addition, our method for the first time enables generating considerably larger synthetic datasets. Our codes are available at https://github.com/VITA-Group/ProgressiveDD.", "keywords": "dataset distillation;dataset condensation", "primary_area": "optimization", "supplementary_material": "", "author": "Xuxi Chen;Yu Yang;Zhangyang Wang;Baharan Mirzasoleiman", "authorids": "~Xuxi_Chen1;~Yu_Yang4;~Zhangyang_Wang1;~Baharan_Mirzasoleiman1", "gender": "Unspecified;F;M;F", "homepage": ";https://sites.google.com/view/yuyang0901/home;https://vita-group.github.io;http://web.cs.ucla.edu/~baharan/", "dblp": "267/9662;16/4505-7;119/4026;52/10075", "google_scholar": "afsDlKYAAAAJ;KK6Yj4IAAAAJ;pxFyKAIAAAAJ;x63j7HEAAAAJ", "orcid": ";;;", "linkedin": ";;;", "or_profile": "~Xuxi_Chen1;~Yu_Yang4;~Zhangyang_Wang1;~Baharan_Mirzasoleiman1", "aff": "University of Texas at Austin;University of California, Los Angeles;University of Texas at Austin;University of California, Los Angeles", "aff_domain": "utexas.edu;ucla.edu;utexas.edu;ucla.edu", "position": "PhD student;PhD student;Associate Professor;Assistant Professor", "bibtex": "@inproceedings{\nchen2024data,\ntitle={Data Distillation Can Be Like Vodka: Distilling More Times For Better Quality},\nauthor={Xuxi Chen and Yu Yang and Zhangyang Wang and Baharan Mirzasoleiman},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=1NHgmKqOzZ}\n}", "github": "", "project": "", "reviewers": "rp5C;S7ej;xT2K", "pdf_size": 4454536, "rating": "5;6;8", "confidence": "4;5;3", "soundness": "3;2;3", "contribution": "3;2;3", "presentation": "3;2;3", "wc_summary": "42;70;100", "wc_strengths": "27;52;115", "wc_weaknesses": "153;196;1", "wc_questions": "2;36;10", "wc_review": "224;354;226", "wc_reply_reviewers": "118;95;0", "wc_reply_authors": "1608;836;160", "reply_reviewers": "2;1;0", "reply_authors": "5;3;1", "rating_avg": [ 6.333333333333333, 1.247219128924647 ], "confidence_avg": [ 4.0, 
0.816496580927726 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 70.66666666666667, 23.683092891108814 ], "wc_strengths_avg": [ 64.66666666666667, 37.025516726831626 ], "wc_weaknesses_avg": [ 116.66666666666667, 83.65139302818308 ], "wc_questions_avg": [ 16.0, 14.514360704718161 ], "wc_review_avg": [ 268.0, 60.81666438293592 ], "wc_reply_reviewers_avg": [ 71.0, 51.07510809255979 ], "wc_reply_authors_avg": [ 868.0, 591.5764250430088 ], "reply_reviewers_avg": [ 1.0, 0.816496580927726 ], "reply_authors_avg": [ 3.0, 1.632993161855452 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.6546536707079772, "gs_citation": 20, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=1440553960173365966&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 7, "openreview": "https://openreview.net/forum?id=1NHgmKqOzZ", "pdf": "https://openreview.net/pdf?id=1NHgmKqOzZ", "email": "utexas.edu;ucla.edu;utexas.edu;ucla.edu", "author_num": 4, "aff_unique_index": "0;1;0;1", "aff_unique_norm": "University of Texas at Austin;University of California, Los Angeles", "aff_unique_dep": ";", "aff_unique_url": "https://www.utexas.edu;https://www.ucla.edu", "aff_unique_abbr": "UT Austin;UCLA", "aff_campus_unique_index": "0;1;0;1", "aff_campus_unique": "Austin;Los Angeles", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "id": "1OP4crhgkD", "title": "Semantically Aligned Task Decomposition in Multi-Agent Reinforcement Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "The difficulty of appropriately assigning credit is particularly heightened in cooperative MARL with sparse reward, due to the concurrent time and structural scales involved. Automatic subgoal generation (ASG) has recently emerged as a viable MARL approach inspired by utilizing sub-goals in intrinsically motivated reinforcement learning. However, end-to-end learning of complex task planning from sparse rewards without prior knowledge, undoubtedly requires massive training samples. Moreover, the diversity-promoting nature of existing ASG methods can lead to the \"over-representation\" of sub-goals, generating numerous spurious sub-goals of limited relevance to the actual task reward and thus decreasing the sample efficiency of the algorithm. To address this problem and inspired by the disentangled representation learning, we propose a novel \"disentangled\" decision-making method, $\\textbf{S}$emantically $\\textbf{A}$ligned task decomposition in $\\textbf{MA}$RL ($\\textbf{SAMA}$), that prompts pretrained language models with chain-of-thought that can suggest potential goals, provide suitable goal decomposition and subgoal allocation as well as self-reflection-based replanning. Additionally, SAMA incorporates language-grounded RL to train each agent's subgoal-conditioned policy. 
SAMA demonstrates considerable advantages in sample efficiency compared to state-of-the-art ASG methods, as evidenced by its performance on two challenging sparse-reward tasks, $\\texttt{Overcooked}$ and $\\texttt{MiniRTS}$.", "keywords": "Pretrained Language Models;Multi-Agent Reinforcement Learning;Language-Grounded Reinforcement Learning", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Wenhao Li;Dan Qiao;Xiangfeng Wang;Bo Jin;Baoxiang Wang;Hongyuan Zha", "authorids": "~Wenhao_Li2;~Dan_Qiao3;~Xiangfeng_Wang1;~Bo_Jin1;~Baoxiang_Wang1;~Hongyuan_Zha1", "gender": "M;;M;;;", "homepage": "https://tomaxent.com;https://qiaodan-cuhk.github.io;https://xfwang87.github.io/;;;", "dblp": ";152/4915-3.html;84/4695;;;z/HongyuanZha", "google_scholar": "HAtzuaYAAAAJ;;YpGMkgsAAAAJ;;;n1DQMIsAAAAJ", "orcid": ";0000-0002-2364-6897;;;;", "linkedin": ";;;;;", "or_profile": "~Wenhao_Li2;~Dan_Qiao3;~Xiangfeng_Wang1;~Bo_Jin1;~Baoxiang_Wang1;~Hongyuan_Zha1", "aff": "The Chinese University of Hong Kong, Shenzhen;Chinese University of Hong Kong, Shen Zhen;East China Normal University;;;The Chinese University of Hong Kong, Shenzhen", "aff_domain": "cuhk.edu.cn;link.cuhk.edu.cn;ecnu.edu.cn;;;cuhk.edu.cn", "position": "Postdoc;PhD student;Full Professor;;;Full Professor", "bibtex": "@misc{\nli2024semantically,\ntitle={Semantically Aligned Task Decomposition in Multi-Agent Reinforcement Learning},\nauthor={Wenhao Li and Dan Qiao and Xiangfeng Wang and Bo Jin and Baoxiang Wang and Hongyuan Zha},\nyear={2024},\nurl={https://openreview.net/forum?id=1OP4crhgkD}\n}", "github": "", "project": "", "reviewers": "b4Ao;T35w;DBEC;Um1j", "site": "https://openreview.net/forum?id=1OP4crhgkD", "pdf_size": 3540389, "rating": "3;5;6;6", "confidence": "4;2;4;3", "soundness": "3;2;3;3", "contribution": "2;2;3;3", "presentation": "3;2;2;3", "wc_summary": "43;85;48;82", "wc_strengths": "52;43;84;138", "wc_weaknesses": "609;93;123;148", "wc_questions": "128;32;171;140", "wc_review": "832;253;426;508", "wc_reply_reviewers": "95;86;643;80", "wc_reply_authors": "3324;2069;3529;2167", "reply_reviewers": "1;1;3;1", "reply_authors": "8;5;8;5", "rating_avg": [ 5.0, 1.224744871391589 ], "confidence_avg": [ 3.25, 0.82915619758885 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 64.5, 19.11151485361639 ], "wc_strengths_avg": [ 79.25, 37.18450618201081 ], "wc_weaknesses_avg": [ 243.25, 212.06175397746762 ], "wc_questions_avg": [ 117.75, 51.934453881792194 ], "wc_review_avg": [ 504.75, 210.1682361823499 ], "wc_reply_reviewers_avg": [ 226.0, 240.814243764774 ], "wc_reply_authors_avg": [ 2772.25, 659.163627258058 ], "reply_reviewers_avg": [ 1.5, 0.8660254037844386 ], "reply_authors_avg": [ 6.5, 1.5 ], "replies_avg": [ 39, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.24618298195866545, "gs_citation": 19, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=1403065174946763393&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "aff_unique_index": "0;0;1;0", "aff_unique_norm": "Chinese University of Hong Kong;East China Normal University", "aff_unique_dep": ";", "aff_unique_url": "https://www.cuhk.edu.cn;http://www.ecnu.edu.cn", "aff_unique_abbr": "CUHK;ECNU", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Shenzhen;", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "China" }, { "title": "Backdoor Secrets Unveiled: Identifying Backdoor Data with Optimized Scaled Prediction Consistency", 
"status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19591", "id": "1OfAO2mes1", "author_site": "Soumyadeep Pal, Yuguang Yao, Ren Wang, Bingquan Shen, Sijia Liu", "tldr": "", "abstract": "Modern machine learning (ML) systems demand substantial training data, often resorting to external sources. Nevertheless, this practice renders them vulnerable to backdoor poisoning attacks. Prior backdoor defense strategies have primarily focused on the identification of backdoored models or poisoned data characteristics, typically operating under the assumption of access to clean data. In this work, we delve into a relatively underexplored challenge: the automatic identification of backdoor data within a poisoned dataset, all under realistic conditions, *i.e.*, without the need for additional clean data or without manually defining a threshold for backdoor detection. We draw an inspiration from the scaled prediction consistency (SPC) technique, which exploits the prediction invariance of poisoned data to an input scaling factor. Based on this, we pose the backdoor data identification problem as a hierarchical data splitting optimization problem, leveraging a novel SPC-based loss function as the primary optimization objective. Our innovation unfolds in several key aspects. First, we revisit the vanilla SPC method, unveiling its limitations in addressing the proposed backdoor identification problem. Subsequently, we develop a bi-level optimization-based approach to precisely identify backdoor data by minimizing the advanced SPC loss. Finally, we demonstrate the efficacy of our proposal against a spectrum of backdoor attacks, encompassing basic label-corrupted attacks as well as more sophisticated clean-label attacks, evaluated across various benchmark datasets. Experiment results show that our approach often surpasses the performance of current baselines in identifying backdoor data points, resulting in about 4\\%-36\\% improvement in average AUROC. 
Codes are available at https://github.com/OPTML-Group/BackdoorMSPC.", "keywords": "Backdoor Detection;Backdoor Attack;Data Poisoning;AI Security;Deep learning", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/d2c5665558b4c332568545796e2d21302eb03e53.zip", "author": "Soumyadeep Pal;Yuguang Yao;Ren Wang;Bingquan Shen;Sijia Liu", "authorids": "~Soumyadeep_Pal1;~Yuguang_Yao1;~Ren_Wang1;~Bingquan_Shen1;~Sijia_Liu1", "gender": ";M;M;;M", "homepage": ";https://www.cse.msu.edu/~yaoyugua/;https://wangren09.github.io/;;https://lsjxjtu.github.io/", "dblp": "236/2130.html;238/9467;29/50-8;151/9308;128/6972-1", "google_scholar": "https://scholar.google.ca/citations?user=c2VU-_4AAAAJ;-chIdAkAAAAJ;TY_3K48AAAAJ;https://scholar.google.com.sg/citations?user=zrJdj6YAAAAJ;C7dO_UgAAAAJ", "orcid": ";;0000-0002-6366-8898;;", "linkedin": ";tonyyaomsu/;ren-wang-715525106/;;", "or_profile": "~Soumyadeep_Pal1;~Yuguang_Yao1;~Ren_Wang1;~Bingquan_Shen1;~Sijia_Liu1", "aff": "Michigan State University;Michigan State University;Illinois Institute of Technology;DSO National Labs;Michigan State University", "aff_domain": "msu.edu;msu.edu;iit.edu;dso.org.sg;msu.edu", "position": "PhD student;PhD student;Assistant Professor;Researcher;Assistant Professor", "bibtex": "@inproceedings{\npal2024backdoor,\ntitle={Backdoor Secrets Unveiled: Identifying Backdoor Data with Optimized Scaled Prediction Consistency},\nauthor={Soumyadeep Pal and Yuguang Yao and Ren Wang and Bingquan Shen and Sijia Liu},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=1OfAO2mes1}\n}", "github": "", "project": "", "reviewers": "nd7k;wHYC;V1zd;YD42", "pdf_size": 3995781, "rating": "6;6;6;6", "confidence": "4;4;4;5", "soundness": "3;2;3;2", "contribution": "2;2;2;2", "presentation": "2;2;3;2", "wc_summary": "89;203;35;65", "wc_strengths": "45;33;58;23", "wc_weaknesses": "186;366;69;196", "wc_questions": "32;3;6;5", "wc_review": "352;605;168;289", "wc_reply_reviewers": "104;116;32;422", "wc_reply_authors": "742;798;187;1069", "reply_reviewers": "1;1;1;1", "reply_authors": "2;2;1;2", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 98.0, 63.56886030125127 ], "wc_strengths_avg": [ 39.75, 13.102957681378658 ], "wc_weaknesses_avg": [ 204.25, 105.89706086572942 ], "wc_questions_avg": [ 11.5, 11.884864324004713 ], "wc_review_avg": [ 353.5, 159.5501488560885 ], "wc_reply_reviewers_avg": [ 168.5, 149.842417225564 ], "wc_reply_authors_avg": [ 699.0, 320.4270587824942 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 1.75, 0.4330127018922193 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 8, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5843399313782917939&as_sdt=5,47&sciodt=0,47&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=1OfAO2mes1", "pdf": "https://openreview.net/pdf?id=1OfAO2mes1", "email": "msu.edu;msu.edu;iit.edu;dso.org.sg;msu.edu", "author_num": 5, "aff_unique_index": "0;0;1;2;0", "aff_unique_norm": "Michigan State University;Illinois Institute of Technology;DSO National Laboratories", "aff_unique_dep": ";;", "aff_unique_url": "https://www.msu.edu;https://www.iit.edu;https://www.dso.org.sg", "aff_unique_abbr": "MSU;IIT;DSO", 
"aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;1;0", "aff_country_unique": "United States;Singapore" }, { "id": "1P1nxem1jU", "title": "Through the Dual-Prism: A Spectral Perspective on Graph Data Augmentation for Graph Classification", "track": "main", "status": "Reject", "tldr": "", "abstract": "Graph Neural Networks (GNNs) have become the preferred tool to process graph data, with their efficacy being boosted through graph data augmentation techniques. Despite the evolution of augmentation methods, issues like graph property distortions and restricted structural changes persist. This leads to the question: Is it possible to develop more property-conserving and structure-sensitive augmentation methods? Through a spectral lens, we investigate the interplay between graph properties, their augmentation, and their spectral behavior, and found that keeping the low-frequency eigenvalues unchanged can preserve the critical properties at a large scale when generating augmented graphs. These observations inform our introduction of the Dual-Prism (DP) augmentation method, comprising DP-Noise and DP-Mask, which adeptly retains essential graph properties while diversifying augmented graphs. Extensive experiments validate the efficiency of our approach, providing a new and promising direction for graph data augmentation.", "keywords": "Graph Data Augmentation;Graph Neural Network;Graph Classification", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/dca49022b18da49aeab43748c4e1ab9b55e516d8.zip", "author": "Yutong Xia;Runpeng Yu;Yuxuan Liang;Xavier Bresson;Xinchao Wang;Roger Zimmermann", "authorids": "~Yutong_Xia1;~Runpeng_Yu2;~Yuxuan_Liang1;~Xavier_Bresson6;~Xinchao_Wang1;~Roger_Zimmermann1", "gender": "F;M;M;M;;M", "homepage": "https://yutong-xia.github.io/;https://yuxuanliang.com;https://www.comp.nus.edu.sg/cs/people/xaviercs/;https://www.comp.nus.edu.sg/cs/bio/rogerz/;https://yu-rp.github.io/;https://sites.google.com/site/sitexinchaowang/", "dblp": "307/5917;183/0977;95/378;79/1490;290/7625-1;", "google_scholar": "V7b4y2oAAAAJ;n9cODgcAAAAJ;https://scholar.google.com.sg/citations?hl=en;https://scholar.google.com.tw/citations?user=IDREwXEAAAAJ;;https://scholar.google.com.tw/citations?user=w69Buq0AAAAJ", "orcid": "0000-0001-9026-0049;0000-0003-2817-7337;;0000-0002-7410-2590;;", "linkedin": "yutong-xia/;yoshall/;;roger-zimmermann-76b56b6/;;", "or_profile": "~Yutong_Xia1;~Yuxuan_Liang1;~Xavier_Bresson6;~Roger_Zimmermann1;~R_Yu1;~Xinchao_WANG3", "aff": "National University of Singapore;The Hong Kong University of Science and Technology (Guangzhou);National University of Singapore;National University of Singapore;National University of Singapore;National University of Singapore", "aff_domain": "u.nus.edu;hkust-gz.edu.cn;nus.edu.sg;nus.edu.sg;u.nus.edu;nus.edu", "position": "PhD student;Assistant Professor;Associate Professor;Full Professor;PhD student;Assistant Professor", "bibtex": "@misc{\nxia2024through,\ntitle={Through the Dual-Prism: A Spectral Perspective on Graph Data Augmentation for Graph Classification},\nauthor={Yutong Xia and Runpeng Yu and Yuxuan Liang and Xavier Bresson and Xinchao Wang and Roger Zimmermann},\nyear={2024},\nurl={https://openreview.net/forum?id=1P1nxem1jU}\n}", "github": "", "project": "", "reviewers": "oQQa;7Xfr;48h8;oF9L", "site": "https://openreview.net/forum?id=1P1nxem1jU", "pdf_size": 726271, "rating": "5;5;6;8", "confidence": 
"4;3;4;4", "soundness": "2;3;4;3", "contribution": "2;2;3;4", "presentation": "3;4;3;3", "wc_summary": "64;38;62;80", "wc_strengths": "26;42;48;151", "wc_weaknesses": "213;66;156;99", "wc_questions": "2;294;40;74", "wc_review": "305;440;306;404", "wc_reply_reviewers": "11;64;18;0", "wc_reply_authors": "1343;1121;747;577", "reply_reviewers": "1;1;1;0", "reply_authors": "4;4;3;1", "rating_avg": [ 6.0, 1.224744871391589 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 2.75, 0.82915619758885 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 61.0, 15.0 ], "wc_strengths_avg": [ 66.75, 49.30200300190653 ], "wc_weaknesses_avg": [ 133.5, 56.06469477309227 ], "wc_questions_avg": [ 102.5, 113.4581420612906 ], "wc_review_avg": [ 363.75, 59.62539308046531 ], "wc_reply_reviewers_avg": [ 23.25, 24.38621536852326 ], "wc_reply_authors_avg": [ 947.0, 301.65874759403215 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 3.0, 1.224744871391589 ], "replies_avg": [ 23, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.4714045207910316, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10391579270727837642&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "aff_unique_index": "0;1;0;0;0;0", "aff_unique_norm": "National University of Singapore;Hong Kong University of Science and Technology", "aff_unique_dep": ";", "aff_unique_url": "https://www.nus.edu.sg;https://www.ust.hk", "aff_unique_abbr": "NUS;HKUST", "aff_campus_unique_index": "1", "aff_campus_unique": ";Guangzhou", "aff_country_unique_index": "0;1;0;0;0;0", "aff_country_unique": "Singapore;China" }, { "id": "1P92J25hdf", "title": "Going Deeper with General and Specific Inductive Bias for Real-Time Stereo Matching", "track": "main", "status": "Reject", "tldr": "", "abstract": "Inductive Bias (IB) has sparked a revolutionary transformation by incorporating the advantages of CNNs and Transformers, including scale invariance and integration of locality and long-range dependencies, which is called general IB for its wide applicability. However, its efficacy is currently not enjoyed by stereo matching, one of the geometric vision tasks, because of the ignorance of volume-level scale invariance and the limitation of high real-time requirement. In contrast, a specific IB is adopted by constructing volume structure in stereo matching task, which helps to finally generate a confidence volume to predict disparity map (output), but fewer studies go into the specific volume structure. Based on the above issues, this paper develops a novel model named UStereo to introduce the general IB to stereo matching. Technically, we adopt inter-layer fusion to break down volume-level scale invariance to a recurrence strategy in initialization for information at low resolution and refinement process for the high, which further extends to capture long-range dependencies after shallow stacks of convolutions and normalization without time-consuming Transformers. Additionally, to reveal the role that the volume structure constructed by specific IB plays during inference, we propose the first-time in-depth study of volume at low resolution through varying degrees of restraint as well as 3 original statistic indicators to reflect the characteristics of representation within volumes. 
Experiments demonstrate UStereo has competitive performance with both fast speed and robust generalization, and ablation studies show the effectiveness of introducing general IB. Moreover, our analysis of the volumes at low resolution suggests they can be viewed as confidence volumes and a concentrated distribution of the disparity within volumes leads to enhanced performance, which could extend the role of the specific IB.", "keywords": "Stereo Matching;Inductive Bias;Deep Supervision", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Renjie Ding;Yaonan Wang;Min Liu;Jiazheng Wang;zhe zhang", "authorids": "~Renjie_Ding1;~Yaonan_Wang3;~Min_Liu3;~Jiazheng_Wang1;~zhe_zhang21", "gender": "M;M;M;M;M", "homepage": "https://github.com/EliottDJay;https://eeit.hnu.edu.cn/info/1277/4490.htm;http://eeit.hnu.edu.cn/info/1291/5218.htm;;https://www.researchgate.net/login?_sg=elMhO2GcXYO82O_IF-XlefOkM8rHoMFdlwKPDT3wfsTmGNAHiXSr1Mec4-Uw1GVQpzIkAURi-i3u4eEkHwErug&_tp=eyJjb250ZXh0Ijp7ImZpcnN0UGFnZSI6ImluZGV4IiwicGFnZSI6ImluZGV4In19", "dblp": ";90/548-1;99/76-8;;", "google_scholar": ";;njVL32IAAAAJ;;", "orcid": ";0009-0004-5365-6254;0000-0001-6406-4896;0000-0003-2534-4232;", "linkedin": ";;;;", "or_profile": "~Renjie_Ding1;~Yaonan_Wang3;~Min_Liu3;~Jiazheng_Wang1;~zhe_zhang21", "aff": "Hunan University;Hunan University;Hunan University;Hunan University;Hunan University", "aff_domain": "hnu.edu.cn;hnu.edu.cn;hnu.edu.cn;hnu.edu.cn;hnu.edu.cn", "position": "PhD student;Full Professor;Full Professor;PhD student;Researcher", "bibtex": "@misc{\nding2024going,\ntitle={Going Deeper with General and Specific Inductive Bias for Real-Time Stereo Matching},\nauthor={Renjie Ding and Yaonan Wang and Min Liu and Jiazheng Wang and zhe zhang},\nyear={2024},\nurl={https://openreview.net/forum?id=1P92J25hdf}\n}", "github": "", "project": "", "reviewers": "CP2t;ocBs;DNk5;J9Ts;1LXD", "site": "https://openreview.net/forum?id=1P92J25hdf", "pdf_size": 2362220, "rating": "1;3;3;3;3", "confidence": "4;4;4;3;5", "soundness": "2;3;2;2;3", "contribution": "2;2;2;2;3", "presentation": "1;1;1;2;3", "wc_summary": "66;87;104;9;106", "wc_strengths": "101;34;71;9;70", "wc_weaknesses": "294;92;317;82;50", "wc_questions": "69;49;94;46;11", "wc_review": "530;262;586;146;237", "wc_reply_reviewers": "0;0;0;0;0", "wc_reply_authors": "0;0;0;0;0", "reply_reviewers": "0;0;0;0;0", "reply_authors": "0;0;0;0;0", "rating_avg": [ 2.6, 0.8000000000000002 ], "confidence_avg": [ 4.0, 0.6324555320336759 ], "soundness_avg": [ 2.4, 0.4898979485566356 ], "contribution_avg": [ 2.2, 0.39999999999999997 ], "presentation_avg": [ 1.6, 0.8 ], "wc_summary_avg": [ 74.4, 35.724501396100685 ], "wc_strengths_avg": [ 57.0, 32.04372013359248 ], "wc_weaknesses_avg": [ 167.0, 114.16479317197575 ], "wc_questions_avg": [ 53.8, 27.43282705081633 ], "wc_review_avg": [ 352.2, 173.32097391833454 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 7, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:pDJzbkPlzEUJ:scholar.google.com/&scioq=Going+Deeper+with+General+and+Specific+Inductive+Bias+for+Real-Time+Stereo+Matching&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;0;0;0", "aff_unique_norm": "Hunan University", "aff_unique_dep": "", "aff_unique_url": "http://www.hunu.edu.cn/", 
"aff_unique_abbr": "HNU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "China" }, { "id": "1PPjf4wife", "title": "Leveraging Large Language Models for Optimised Coordination in Textual Multi-Agent Reinforcement Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "Cooperative multi-agent reinforcement learning (MARL) presents unique challenges, amongst which fostering general cooperative behaviour across various tasks is critical. Recently, large language models (LLMs) have excelled at dealing with challenges in the general RL paradigm, showcasing remarkable sample efficiency and adaptability across tasks through domain specific fine-tuning, or functional alignment. However, neither LLMs nor these fine-tuning approaches are designed with coordination-centric solutions in mind, and the challenge of how to achieve greater coordination, and hence performance, with LLMs in MARL has not yet been tackled. To address this, we introduce the 'Functionally-Aligned Multi-Agents' (FAMA) framework. FAMA harnesses LLMs' inherent knowledge for cooperative decision-making via two primary mechanisms. Firstly, it aligns the LLM with the necessary functional knowledge through a centralised on-policy MARL update rule. Secondly, it recognises the pivotal role of communication in coordination and exploits the linguistic strengths of LLMs for intuitive, natural language inter-agent message-passing. Evaluations of FAMA in two multi-agent textual environments, namely BabyAI-Text and an autonomous driving junction environment, over four coordination tasks show it consistently outperforms independent learning LLMs and traditional symbolic RL methods.", "keywords": "llm;marl", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Oliver Slumbers;David Henry Mguni;Kun Shao;Jun Wang", "authorids": "~Oliver_Slumbers1;~David_Henry_Mguni1;~Kun_Shao1;~Jun_Wang2", "gender": ";M;;M", "homepage": ";;;http://www0.cs.ucl.ac.uk/staff/jun.wang/", "dblp": "285/5044;217/2369;;w/JunWang12", "google_scholar": "obYGSVIAAAAJ;K-_yzBsAAAAJ;;https://scholar.google.co.uk/citations?user=wIE1tY4AAAAJ", "orcid": ";;;", "linkedin": ";;;", "or_profile": "~Oliver_Slumbers1;~David_Henry_Mguni1;~Kun_Shao1;~Jun_Wang2", "aff": "University College London;Queen Mary University, London;;University College London", "aff_domain": "ucl.ac.uk;qmul.ac.uk;;ucl.ac.uk", "position": "PhD student;Lecturer;;Professor", "bibtex": "@misc{\nslumbers2024leveraging,\ntitle={Leveraging Large Language Models for Optimised Coordination in Textual Multi-Agent Reinforcement Learning},\nauthor={Oliver Slumbers and David Henry Mguni and Kun Shao and Jun Wang},\nyear={2024},\nurl={https://openreview.net/forum?id=1PPjf4wife}\n}", "github": "", "project": "", "reviewers": "dP6r;q4e1;Mrhw;cs97", "site": "https://openreview.net/forum?id=1PPjf4wife", "pdf_size": 1953557, "rating": "3;3;5;6", "confidence": "4;3;3;4", "soundness": "2;2;4;3", "contribution": "2;2;2;3", "presentation": "2;2;4;2", "wc_summary": "70;54;35;80", "wc_strengths": "64;71;25;47", "wc_weaknesses": "110;267;24;87", "wc_questions": "36;8;172;4", "wc_review": "280;400;256;218", "wc_reply_reviewers": "26;22;0;12", "wc_reply_authors": "454;929;623;368", "reply_reviewers": "1;1;0;1", "reply_authors": "1;2;1;1", "rating_avg": [ 4.25, 1.299038105676658 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.75, 0.82915619758885 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], 
"presentation_avg": [ 2.5, 0.8660254037844386 ], "wc_summary_avg": [ 59.75, 17.03489066592445 ], "wc_strengths_avg": [ 51.75, 17.73943347460679 ], "wc_weaknesses_avg": [ 122.0, 89.43992397134515 ], "wc_questions_avg": [ 55.0, 68.66585760041157 ], "wc_review_avg": [ 288.5, 68.06430782723056 ], "wc_reply_reviewers_avg": [ 15.0, 10.04987562112089 ], "wc_reply_authors_avg": [ 593.5, 214.32510352266252 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.19245008972987526, "gs_citation": 4, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=16409135025345974855&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 0, "aff_unique_index": "0;1;0", "aff_unique_norm": "University College London;Queen Mary University of London", "aff_unique_dep": ";", "aff_unique_url": "https://www.ucl.ac.uk;https://www.qmul.ac.uk", "aff_unique_abbr": "UCL;QMUL", "aff_campus_unique_index": "1", "aff_campus_unique": ";London", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United Kingdom" }, { "title": "Bespoke Solvers for Generative Flow Models", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19590", "id": "1PXEY7ofFX", "author_site": "Neta Shaul, Juan Perez, Ricky T. Q. Chen, Ali Thabet, Albert Pumarola, Yaron Lipman", "tldr": "", "abstract": "Diffusion or flow-based models are powerful generative paradigms that are notoriously hard to sample as samples are defined as solutions to high-dimensional Ordinary or Stochastic Differential Equations (ODEs/SDEs) which require a large Number of Function Evaluations (NFE) to approximate well. Existing methods to alleviate the costly sampling process include model distillation and designing dedicated ODE solvers. However, distillation is costly to train and sometimes can deteriorate quality, while dedicated solvers still require relatively large NFE to produce high quality samples. In this paper we introduce ``Bespoke solvers'', a novel framework for constructing custom ODE solvers tailored to the ODE of a given pre-trained flow model. Our approach optimizes an order consistent and parameter-efficient solver (e.g., with 80 learnable parameters), is trained for roughly 1\\% of the GPU time required for training the pre-trained model, and significantly improves approximation and generation quality compared to dedicated solvers. For example, a Bespoke solver for a CIFAR10 model produces samples with Fr\u00e9chet Inception Distance (FID) of 2.73 with 10 NFE, and gets to 1\\% of the Ground Truth (GT) FID (2.59) for this model with only 20 NFE. On the more challenging ImageNet-64$\\times$64, Bespoke samples at 2.2 FID with 10 NFE, and gets within 2\\% of GT FID (1.71) with 20 NFE.", "keywords": "generative models;flow matching;diffusion models;normalizing flows;ode solver;fast sampling;distillation", "primary_area": "generative models", "supplementary_material": "", "author": "Neta Shaul;Juan Perez;Ricky T. Q. 
Chen;Ali Thabet;Albert Pumarola;Yaron Lipman", "authorids": "~Neta_Shaul1;~Juan_Perez1;~Ricky_T._Q._Chen1;~Ali_Thabet1;~Albert_Pumarola2;~Yaron_Lipman1", "gender": "M;;;M;;", "homepage": ";https://dblp.org/pid/196/0064.htmll;;https://www.alithabet.com/;;", "dblp": ";;;161/1812;;", "google_scholar": ";;;7T0CPEkAAAAJ;;", "orcid": ";;;;;", "linkedin": "neta-shaul-3364aa235/;;;akthabet/;;", "or_profile": "~Neta_Shaul1;~Juan_Perez1;~Ricky_T._Q._Chen1;~Ali_Thabet1;~Albert_Pumarola2;~Yaron_Lipman1", "aff": "Weizmann Institute of Science;;;Meta;;", "aff_domain": "weizmann.ac.il;;;fb.com;;", "position": "PhD student;;;Applied Research Manager;;", "bibtex": "@inproceedings{\nshaul2024bespoke,\ntitle={Bespoke Solvers for Generative Flow Models},\nauthor={Neta Shaul and Juan Perez and Ricky T. Q. Chen and Ali Thabet and Albert Pumarola and Yaron Lipman},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=1PXEY7ofFX}\n}", "github": "", "project": "", "reviewers": "ovsR;vykk;KhFN;Zfm7;7aEk", "pdf_size": 20965462, "rating": "6;6;8;8;8", "confidence": "3;4;3;4;3", "soundness": "3;3;3;4;3", "contribution": "2;3;4;4;3", "presentation": "2;3;3;3;4", "wc_summary": "44;148;225;206;213", "wc_strengths": "25;92;90;141;62", "wc_weaknesses": "106;279;69;46;58", "wc_questions": "107;89;181;96;113", "wc_review": "282;608;565;489;446", "wc_reply_reviewers": "24;0;0;0;0", "wc_reply_authors": "796;1153;621;511;346", "reply_reviewers": "1;0;0;0;0", "reply_authors": "1;2;1;1;1", "rating_avg": [ 7.2, 0.9797958971132712 ], "confidence_avg": [ 3.4, 0.4898979485566356 ], "soundness_avg": [ 3.2, 0.39999999999999997 ], "contribution_avg": [ 3.2, 0.7483314773547882 ], "presentation_avg": [ 3.0, 0.6324555320336759 ], "wc_summary_avg": [ 167.2, 67.0683233725132 ], "wc_strengths_avg": [ 82.0, 38.19424040349539 ], "wc_weaknesses_avg": [ 111.6, 86.07578056573172 ], "wc_questions_avg": [ 117.2, 32.97514215283992 ], "wc_review_avg": [ 478.0, 113.16359838746733 ], "wc_reply_reviewers_avg": [ 4.8, 9.600000000000001 ], "wc_reply_authors_avg": [ 685.4, 275.9120149612916 ], "reply_reviewers_avg": [ 0.2, 0.4000000000000001 ], "reply_authors_avg": [ 1.2, 0.4000000000000001 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.16666666666666663, "gs_citation": 20, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=13011832480330181919&as_sdt=400005&sciodt=0,14&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=1PXEY7ofFX", "pdf": "https://openreview.net/pdf?id=1PXEY7ofFX", "email": "weizmann.ac.il;;;fb.com;;", "author_num": 6, "aff_unique_index": "0;1", "aff_unique_norm": "Weizmann Institute of Science;Meta", "aff_unique_dep": ";Meta Platforms, Inc.", "aff_unique_url": "https://www.weizmann.org.il;https://meta.com", "aff_unique_abbr": "Weizmann;Meta", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1", "aff_country_unique": "Israel;United States" }, { "id": "1PaDPHDhwe", "title": "Group Robustness via Adaptive Class-Specific Scaling", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Group distributionally robust optimization, which aims to improve robust accuracies such as worst-group or unbiased accuracy, is one of the mainstream algorithms to mitigate spurious correlation and handle dataset bias. 
Existing approaches have apparently improved robust accuracy, but, in fact, these performance gains mainly come from trade-offs at the expense of average accuracy. To control the trade-off flexibly and efficiently, we first propose a simple class-specific scaling strategy, directly applicable to existing debiasing algorithms without additional training. We also develop an instance-wise adaptive scaling technique to overcome the trade-off and improve the performance even further in terms of both accuracies. Our approach reveals that a na\\\"ive ERM baseline matches or even outperforms the recent debiasing methods by only adopting the class-specific scaling technique. Then, we employ this technique to evaluate the performance of existing algorithms in a comprehensive manner by introducing a novel unified metric that summarizes the trade-off between the two accuracies as a scalar value. By considering the inherent trade-off and providing a performance landscape, our approach delivers meaningful insights into existing robust methods beyond the robust accuracy only. We perform experiments on the datasets in computer vision and natural language processing domains and verify the effectiveness of the proposed frameworks.", "keywords": "group robustness;debiasing", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "Seonguk Seo;Bohyung Han", "authorids": "~Seonguk_Seo1;~Bohyung_Han1", "gender": "M;Not Specified", "homepage": "https://seoseong.uk;http://cvlab.snu.ac.kr/~bhhan", "dblp": "227/2319;73/4880.html", "google_scholar": "dhVCLrwAAAAJ;9aaeCToAAAAJ", "orcid": ";", "linkedin": ";", "or_profile": "~Seonguk_Seo1;~Bohyung_Han1", "aff": "Seoul National University;Seoul National University", "aff_domain": "snu.ac.kr;snu.ac.kr", "position": "PhD student;Full Professor", "bibtex": "@misc{\nseo2024group,\ntitle={Group Robustness via Adaptive Class-Specific Scaling},\nauthor={Seonguk Seo and Bohyung Han},\nyear={2024},\nurl={https://openreview.net/forum?id=1PaDPHDhwe}\n}", "github": "", "project": "", "reviewers": "SBij;mojf;cWjo;SN9B", "site": "https://openreview.net/forum?id=1PaDPHDhwe", "pdf_size": 1077918, "rating": "3;5;5;6", "confidence": "4;4;4;3", "soundness": "1;2;3;3", "contribution": "1;2;2;3", "presentation": "1;2;2;3", "wc_summary": "90;48;46;61", "wc_strengths": "18;125;23;47", "wc_weaknesses": "266;446;71;110", "wc_questions": "2;522;43;3", "wc_review": "376;1141;183;221", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.75, 1.0897247358851685 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.25, 0.82915619758885 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 2.0, 0.7071067811865476 ], "wc_summary_avg": [ 61.25, 17.5695048308141 ], "wc_strengths_avg": [ 53.25, 42.85075845303091 ], "wc_weaknesses_avg": [ 223.25, 147.86036487172618 ], "wc_questions_avg": [ 142.5, 219.72767235830813 ], "wc_review_avg": [ 480.25, 388.27398509300104 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.6622661785325219, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:-EJcB71XEIsJ:scholar.google.com/&scioq=Group+Robustness+via+Adaptive+Class-Specific+Scaling&hl=en&as_sdt=0,5", "gs_version_total": 2, 
"aff_unique_index": "0;0", "aff_unique_norm": "Seoul National University", "aff_unique_dep": "", "aff_unique_url": "https://www.snu.ac.kr", "aff_unique_abbr": "SNU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "South Korea" }, { "title": "MAMBA: an Effective World Model Approach for Meta-Reinforcement Learning", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19589", "id": "1RE0H6mU7M", "author_site": "Zohar Rimon, Tom Jurgenson, Orr Krupnik, Gilad Adler, Aviv Tamar", "tldr": "", "abstract": "Meta-reinforcement learning (meta-RL) is a promising framework for tackling challenging domains requiring efficient exploration. Existing meta-RL algorithms are characterized by low sample efficiency, and mostly focus on low-dimensional task distributions. In parallel, model-based RL methods have been successful in solving partially observable MDPs, of which meta-RL is a special case.\nIn this work, we leverage this success and propose a new model-based approach to meta-RL, based on elements from existing state-of-the-art model-based and meta-RL methods. We demonstrate the effectiveness of our approach on common meta-RL benchmark domains, attaining greater return with better sample efficiency (up to $15\\times$) while requiring very little hyperparameter tuning. In addition, we validate our approach on a slate of more challenging, higher-dimensional domains, taking a step towards real-world generalizing agents.", "keywords": "Meta Reinforcement Learning;World Models;Model Based Reinforcement Learning", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/b4b8a274431d39250f38bd36f23f2a37eefaac1d.zip", "author": "Zohar Rimon;Tom Jurgenson;Orr Krupnik;Gilad Adler;Aviv Tamar", "authorids": "~Zohar_Rimon1;~Tom_Jurgenson1;~Orr_Krupnik1;~Gilad_Adler1;~Aviv_Tamar2", "gender": "M;;M;M;M", "homepage": "https://zoharri.github.io/;;https://www.orrkrup.com;;https://avivt.github.io/avivt/", "dblp": "322/9338;https://dblp.uni-trier.de/pers/hd/j/Jurgenson:Tom;234/8503;;49/10622", "google_scholar": "GV8imVUAAAAJ;1YjIvioAAAAJ;E2lnAzIAAAAJ;;https://scholar.google.co.il/citations?user=kppa2vgAAAAJ", "orcid": ";;;;", "linkedin": ";;;gilad-adler/;", "or_profile": "~Zohar_Rimon1;~Tom_Jurgenson1;~Orr_Krupnik1;~Gilad_Adler1;~Aviv_Tamar2", "aff": "Technion - Israel Institute of Technology, Technion - Israel Institute of Technology;Technion;Technion - Israel Institute of Technology, Technion - Israel Institute of Technology;;Technion, Technion", "aff_domain": "campus.technion.ac.il;technion.ac.il;campus.technion.ac.il;;technion.ac.il", "position": "PhD student;PhD student;PhD student;;Assistant Professor", "bibtex": "@inproceedings{\nrimon2024mamba,\ntitle={{MAMBA}: an Effective World Model Approach for Meta-Reinforcement Learning},\nauthor={Zohar Rimon and Tom Jurgenson and Orr Krupnik and Gilad Adler and Aviv Tamar},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=1RE0H6mU7M}\n}", "github": "", "project": "", "reviewers": "tjN7;X5No;fKkT;cu12", "pdf_size": 2571119, "rating": "6;6;6;6", "confidence": "4;4;4;3", "soundness": "3;2;3;3", "contribution": "3;2;3;2", "presentation": "3;3;3;3", "wc_summary": "126;131;161;73", "wc_strengths": "69;42;140;40", "wc_weaknesses": "239;557;462;150", "wc_questions": "51;12;4;141", "wc_review": "485;742;767;404", "wc_reply_reviewers": "261;16;192;50", "wc_reply_authors": 
"800;388;1019;695", "reply_reviewers": "1;1;1;1", "reply_authors": "2;2;3;2", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 122.75, 31.68891762114951 ], "wc_strengths_avg": [ 72.75, 40.48070528041724 ], "wc_weaknesses_avg": [ 352.0, 164.08686723805778 ], "wc_questions_avg": [ 52.0, 54.37370688117557 ], "wc_review_avg": [ 599.5, 157.87099163557565 ], "wc_reply_reviewers_avg": [ 129.75, 100.49968905424534 ], "wc_reply_authors_avg": [ 725.5, 227.22730909818037 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 2.25, 0.4330127018922193 ], "replies_avg": [ 21, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 7, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10294479951427099315&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=1RE0H6mU7M", "pdf": "https://openreview.net/pdf?id=1RE0H6mU7M", "email": "campus.technion.ac.il;technion.ac.il;campus.technion.ac.il;;technion.ac.il", "author_num": 5, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "Technion - Israel Institute of Technology", "aff_unique_dep": "", "aff_unique_url": "https://www.technion.ac.il/en/", "aff_unique_abbr": "Technion", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "Israel" }, { "title": "Network Memory Footprint Compression Through Jointly Learnable Codebooks and Mappings", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19588", "id": "1RrOtCmuKr", "author_site": "Edouard YVINEC, Arnaud Dapogny, Kevin Bailly", "tldr": "", "abstract": "The massive interest in deep neural networks (DNNs) for both computer vision and natural language processing has been sparked by the growth in computational power. However, this led to an increase in the memory footprint, to a point where it can be challenging to simply load a model on commodity devices such as mobile phones. To address this limitation, quantization is a favored solution as it maps high precision tensors to a low precision, memory efficient format. In terms of memory footprint reduction, its most effective variants are based on codebooks. These methods, however, suffer from two limitations. First, they either define a single codebook for each tensor, or use a memory-expensive mapping to multiple codebooks. Second, gradient descent optimization of the mapping favors jumps toward extreme values, hence not defining a proximal search. In this work, we propose to address these two limitations. First, we initially group similarly distributed neurons and leverage the re-ordered structure to either apply different scale factors to the different groups, or map weights that fall in these groups to several codebooks, without any mapping overhead. Second, stemming from this initialization, we propose a joint learning of the codebook and weight mappings that bears similarities with recent gradient-based post-training quantization techniques. Third, drawing estimation from straight-through estimation techniques, we introduce a novel gradient update definition to enable a proximal search of the codebooks and their mappings. 
The proposed jointly learnable codebooks and mappings (JLCM) method allows a very efficient approximation of any DNN: as such, a Llama 7B can be compressed down to 2Go and loaded on 5-year-old smartphones.", "keywords": "quantization;codebooks;hashlists;compression;efficient inference;deep learning", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/2bd02732ded46eff81c3ed814a014e698b9e97f2.pdf", "author": "Edouard YVINEC;Arnaud Dapogny;Kevin Bailly", "authorids": "~Edouard_YVINEC1;~Arnaud_Dapogny1;~Kevin_Bailly3", "gender": "M;M;M", "homepage": "https://edouardyvinec.netlify.app/;;https://sites.google.com/view/bailly/", "dblp": "263/2218.html;165/8156;41/3712", "google_scholar": "https://scholar.google.fr/citations?user=q-J6Tz0AAAAJ;;oy59G9AAAAAJ", "orcid": "0000-0002-4318-612X;;", "linkedin": "edouard-yvinec-aa8333158/;;", "or_profile": "~Edouard_YVINEC1;~Arnaud_Dapogny1;~Kevin_Bailly3", "aff": ";Apple;Sorbonne University", "aff_domain": ";apple.com;sorbonne-universite.fr", "position": ";Researcher;Associate Professor", "bibtex": "@inproceedings{\nyvinec2024network,\ntitle={Network Memory Footprint Compression Through Jointly Learnable Codebooks and Mappings},\nauthor={Edouard YVINEC and Arnaud Dapogny and Kevin Bailly},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=1RrOtCmuKr}\n}", "github": "", "project": "", "reviewers": "kEDS;fJGw;P3Eg", "pdf_size": 479684, "rating": "5;6;8", "confidence": "4;2;2", "soundness": "2;2;3", "contribution": "2;2;3", "presentation": "2;2;3", "wc_summary": "71;87;109", "wc_strengths": "24;44;62", "wc_weaknesses": "142;73;45", "wc_questions": "5;43;96", "wc_review": "242;247;312", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "951;693;309", "reply_reviewers": "0;0;0", "reply_authors": "2;1;1", "rating_avg": [ 6.333333333333333, 1.247219128924647 ], "confidence_avg": [ 2.6666666666666665, 0.9428090415820634 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 89.0, 15.57776192739723 ], "wc_strengths_avg": [ 43.333333333333336, 15.520595635763755 ], "wc_weaknesses_avg": [ 86.66666666666667, 40.762182909598394 ], "wc_questions_avg": [ 48.0, 37.31844941401862 ], "wc_review_avg": [ 267.0, 31.88521078284832 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 651.0, 263.77262936097065 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.3333333333333333, 0.4714045207910317 ], "replies_avg": [ 10, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.7559289460184546, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=17361935470188294799&as_sdt=5,31&sciodt=0,31&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=1RrOtCmuKr", "pdf": "https://openreview.net/pdf?id=1RrOtCmuKr", "email": ";apple.com;sorbonne-universite.fr", "author_num": 3, "aff_unique_index": "0;1", "aff_unique_norm": "Apple;Sorbonne University", "aff_unique_dep": "Apple Inc.;", "aff_unique_url": "https://www.apple.com;https://www.sorbonne.universite.fr", "aff_unique_abbr": "Apple;Sorbonne", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1", "aff_country_unique": "United States;France" }, { "id": "1SEXzogsET", "title": "LeetPrompt: Leveraging Collective Human Intelligence to Study 
LLMs", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "With the advent of pre-trained large language models (LLMs), natural language prompts are now becoming a de-facto method for interacting with language models. However, prompting as a technique is an esoteric art, involving cumbersome manual processes by individuals to search different strategies that make language models work for the intended task. We introduce LeetPrompt, a citizen science platform that leverages on collective human creativity with prompting to solve reasoning questions across various domains. Users of \\leetprompt attempt questions by writing prompts that solve all the hidden test cases. To measure the efficacy of LeetPrompt, we conduct a study $10$ questions across $5$ domains (biology, physics, math, programming, and general knowledge) with $20$ human subjects. We gather a total of $1173$ GPT-4 prompts with the following observations: First, problems deemed unsolvable by question setters were successfully solved. Second, diverse prompting strategies were used by the different participants. Third, the more difficult problems also had a high number of prompt submissions enabling better debugging of the LLM behaviour for that problem. These observations support various downstream implications in robust approaches to prompt interpretability and model evaluation, high quality data collection, human-AI alignment and real-world usage of LLMs.", "keywords": "evaluation of foundation models;collective intelligence", "primary_area": "infrastructure, software libraries, hardware, etc.", "supplementary_material": "/attachment/6e764791827649eea989d43d637989d37478306c.pdf", "author": "Sebastin Santy;Ayana Bharadwaj;Sahith Dambekodi;Alex Albert;Cathy Lang Yuan;Ranjay Krishna", "authorids": "~Sebastin_Santy2;~Ayana_Bharadwaj1;~Sahith_Dambekodi1;~Alex_Albert1;~Cathy_Lang_Yuan1;~Ranjay_Krishna1", "gender": "M;F;M;M;F;M", "homepage": "http://sebastinsanty.com/;;;https://www.alexalbert.me;;http://ranjaykrishna.com", "dblp": "212/5368;;;;;167/3785", "google_scholar": "HsyMg08AAAAJ;;;;;IcqahyAAAAAJ", "orcid": "0000-0003-1162-0865;;;;;0000-0001-8784-2531", "linkedin": "sebastinsanty/;ayana-bharadwaj-1921a71b0;sahith-dambekodi-31270b104/;alex-Albert;cathy-lang-yuan/;ranjay-krishna-1a344444/", "or_profile": "~Sebastin_Santy2;~Ayana_Bharadwaj1;~Sahith_Dambekodi1;~Alex_Albert1;~Cathy_Lang_Yuan1;~Ranjay_Krishna1", "aff": "University of Washington;Department of Computer Science;;;;University of Washington", "aff_domain": "cs.washington.edu;cs.washington.edu;;;;cs.washington.edu", "position": "PhD student;Undergrad student;;;;Assistant Professor", "bibtex": "@misc{\nsanty2024leetprompt,\ntitle={LeetPrompt: Leveraging Collective Human Intelligence to Study {LLM}s},\nauthor={Sebastin Santy and Ayana Bharadwaj and Sahith Dambekodi and Alex Albert and Cathy Lang Yuan and Ranjay Krishna},\nyear={2024},\nurl={https://openreview.net/forum?id=1SEXzogsET}\n}", "github": "", "project": "", "reviewers": "o2mR;68mT;RmkX;EkgE", "site": "https://openreview.net/forum?id=1SEXzogsET", "pdf_size": 2088332, "rating": "3;5;5;5", "confidence": "3;3;4;3", "soundness": "2;2;3;3", "contribution": "2;1;2;2", "presentation": "3;3;3;3", "wc_summary": "16;70;85;82", "wc_strengths": "58;32;53;50", "wc_weaknesses": "194;318;233;181", "wc_questions": "54;3;122;90", "wc_review": "322;423;493;403", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.5, 0.8660254037844386 ], 
"confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 63.25, 27.851166941440713 ], "wc_strengths_avg": [ 48.25, 9.807522622966516 ], "wc_weaknesses_avg": [ 231.5, 53.48130514488217 ], "wc_questions_avg": [ 67.25, 44.21184795956849 ], "wc_review_avg": [ 410.25, 60.931826658980114 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.3333333333333333, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:55gPqy9jnR0J:scholar.google.com/&scioq=LeetPrompt:+Leveraging+Collective+Human+Intelligence+to+Study+LLMs&hl=en&as_sdt=0,5", "gs_version_total": 2, "aff_unique_index": "0;1;0", "aff_unique_norm": "University of Washington;Unknown Institution", "aff_unique_dep": ";Department of Computer Science", "aff_unique_url": "https://www.washington.edu;", "aff_unique_abbr": "UW;", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "United States;" }, { "title": "Spike-driven Transformer V2: Meta Spiking Neural Network Architecture Inspiring the Design of Next-generation Neuromorphic Chips", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19587", "id": "1SIBN5Xyw7", "author_site": "Man Yao, Jiakui Hu, Tianxiang Hu, Yifan Xu, Zhaokun Zhou, Yonghong Tian, Bo XU, Guoqi Li", "tldr": "", "abstract": "Neuromorphic computing, which exploits Spiking Neural Networks (SNNs) on neuromorphic chips, is a promising energy-efficient alternative to traditional AI. CNN-based SNNs are the current mainstream of neuromorphic computing. By contrast, no neuromorphic chips are designed especially for Transformer-based SNNs, which have just emerged, and their performance is only on par with CNN-based SNNs, offering no distinct advantage. In this work, we propose a general Transformer-based SNN architecture, termed as ``Meta-SpikeFormer\", whose goals are: (1) *Lower-power*, supports the spike-driven paradigm that there is only sparse addition in the network; (2) *Versatility*, handles various vision tasks; (3) *High-performance*, shows overwhelming performance advantages over CNN-based SNNs; (4) *Meta-architecture*, provides inspiration for future next-generation Transformer-based neuromorphic chip designs. Specifically, we extend the Spike-driven Transformer in \\citet{yao2023spike} into a meta architecture, and explore the impact of structure, spike-driven self-attention, and skip connection on its performance. On ImageNet-1K, Meta-SpikeFormer achieves 80.0\\% top-1 accuracy (55M), surpassing the current state-of-the-art (SOTA) SNN baselines (66M) by 3.7\\%. This is the first direct training SNN backbone that can simultaneously supports classification, detection, and segmentation, obtaining SOTA results in SNNs. 
Finally, we discuss the inspiration of the meta SNN architecture for neuromorphic chip design.", "keywords": "Spiking neural networks;Spiking transformer;Transformer-based SNNs;Neuromorphic chips;Spike-driven self-attention", "primary_area": "applications to neuroscience & cognitive science", "supplementary_material": "/attachment/bcb68506e3c8b968b7c11cb052a9bc1399a06b86.pdf", "author": "Man Yao;JiaKui Hu;Tianxiang Hu;Yifan Xu;Zhaokun Zhou;Yonghong Tian;Bo XU;Guoqi Li", "authorids": "~Man_Yao1;~JiaKui_Hu1;~Tianxiang_Hu3;~Yifan_Xu9;~Zhaokun_Zhou1;~Yonghong_Tian1;~Bo_XU10;~Guoqi_Li1", "gender": "M;M;M;M;M;M;M;M", "homepage": ";https://github.com/jkhu29;https://github.com/TiminHu;https://yifanxu74.github.io;;http://www.pkuml.org;;https://scholar.google.com/citations?hl=en&user=qCfE--MAAAAJ", "dblp": "21/5932;327/3225;;;;86/5857;;", "google_scholar": "eE4vvp0AAAAJ;VagFt-sAAAAJ;;https://scholar.google.com/citations?hl=zh-CN;;https://scholar.google.com/citations?hl=en;;https://scholar.google.com/citations?hl=en", "orcid": ";;;;0000-0003-4454-6630;0000-0002-2978-5935;;", "linkedin": ";;;;;;%E6%B3%A2-%E5%BE%90-74210b115/?midToken=AQH1EMB1ZoboJA&midSig=2Q5MzMXmNEH9M1&trk=eml-email_pymk_02-header-22-profile&trkEmail=eml-email_pymk_02-header-22-profile-null-7ydrhe~kpggjoav~k9-null-neptune/profile~vanity.view;", "or_profile": "~Man_Yao1;~JiaKui_Hu1;~Tianxiang_Hu3;~Yifan_Xu9;~Zhaokun_Zhou1;~Yonghong_Tian1;~Bo_XU10;~Guoqi_Li1", "aff": "Institute of automation, Chinese academy of sciences;Peking University;Institute of Automation, Chinese Academy of Sciences;Institute of Automation, Chinese Academy of Sciences;Peking University;Peking University;Institute of Automation, Chinese Academy of Sciences;Institute of Automation, Chinese Academy of Sciences", "aff_domain": "ia.ac.cn;pku.edu.cn;ia.ac.cn;ia.ac.cn;pku.edu.cn;pku.edu.cn;ia.ac.cn;ia.ac.cn", "position": "Assistant Professor;PhD student;PhD student;PhD student;PhD student;Full Professor;Full Professor;Full Professor", "bibtex": "@inproceedings{\nyao2024spikedriven,\ntitle={Spike-driven Transformer V2: Meta Spiking Neural Network Architecture Inspiring the Design of Next-generation Neuromorphic Chips},\nauthor={Man Yao and JiaKui Hu and Tianxiang Hu and Yifan Xu and Zhaokun Zhou and Yonghong Tian and Bo XU and Guoqi Li},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=1SIBN5Xyw7}\n}", "github": "", "project": "", "reviewers": "1cdx;JmyY;Aepg", "pdf_size": 576149, "rating": "5;6;6", "confidence": "4;4;3", "soundness": "2;4;3", "contribution": "2;3;2", "presentation": "3;4;3", "wc_summary": "60;33;90", "wc_strengths": "23;58;96", "wc_weaknesses": "27;48;23", "wc_questions": "68;33;149", "wc_review": "178;172;358", "wc_reply_reviewers": "0;11;6", "wc_reply_authors": "2080;618;1280", "reply_reviewers": "0;1;1", "reply_authors": "3;2;2", "rating_avg": [ 5.666666666666667, 0.4714045207910317 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 3.0, 0.816496580927726 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 3.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 61.0, 23.280893453645632 ], "wc_strengths_avg": [ 59.0, 29.81051268708183 ], "wc_weaknesses_avg": [ 32.666666666666664, 10.96458946893235 ], "wc_questions_avg": [ 83.33333333333333, 48.58211833815218 ], "wc_review_avg": [ 236.0, 86.30179604156567 ], "wc_reply_reviewers_avg": [ 5.666666666666667, 4.4969125210773475 ], 
"wc_reply_authors_avg": [ 1326.0, 597.7446500527351 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 2.3333333333333335, 0.4714045207910317 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": -0.4999999999999999, "gs_citation": 77, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=17884632612771453622&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=1SIBN5Xyw7", "pdf": "https://openreview.net/pdf?id=1SIBN5Xyw7", "email": "ia.ac.cn;pku.edu.cn;ia.ac.cn;ia.ac.cn;pku.edu.cn;pku.edu.cn;ia.ac.cn;ia.ac.cn", "author_num": 8, "aff_unique_index": "0;1;0;0;1;1;0;0", "aff_unique_norm": "Chinese Academy of Sciences;Peking University", "aff_unique_dep": "Institute of Automation;", "aff_unique_url": "http://www.ia.cas.cn;http://www.pku.edu.cn", "aff_unique_abbr": "CAS;Peking U", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0;0;0", "aff_country_unique": "China" }, { "id": "1SO93f7sVf", "title": "Training Neural Networks from Scratch with Parallel Low-Rank Adapters", "track": "main", "status": "Reject", "tldr": "", "abstract": "The scalability of deep learning applications is fundamentally constrained by compute, memory, and communication. While low-rank adaptation (LoRA) has reduced these costs for model fine-tuning, its application to model pre-training remain largely unexplored. This paper examines the extension of LoRA to model pre-training, identifying the constraints and limitations inherent to standard LoRA in the context of pre-training. We introduce LoRA-the-Explorer (LTE), a novel bi-level optimization algorithm, to facilitate parallel training of multiple low-rank heads across compute nodes, minimizing the necessity for frequent synchronization. Our methodology involves rigorous experimentation on vision transformers using ImageNet100, demonstrating that LTE is competitive with standard distributed training methodologies. 
Initial scalability tests on ImageNet1k show that LTE can match standard training performance by leveraging more training iterations.", "keywords": "Low-rank adapters", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Minyoung Huh;Brian Cheung;Jeremy Bernstein;Phillip Isola;Pulkit Agrawal", "authorids": "~Minyoung_Huh1;~Brian_Cheung1;~Jeremy_Bernstein1;~Phillip_Isola1;~Pulkit_Agrawal1", "gender": "M;M;M;M;M", "homepage": "https://people.csail.mit.edu/minhuh/;https://briancheung.github.io/;https://jeremybernste.in;http://web.mit.edu/phillipi/;https://people.eecs.berkeley.edu/~pulkitag/", "dblp": "220/3360;;215/3638;36/9988;149/2672", "google_scholar": "2k18_1IAAAAJ;7N-ethYAAAAJ;;ROILf3EAAAAJ;UpZmJI0AAAAJ", "orcid": ";;;0000-0002-1411-6704;", "linkedin": ";;;phillip-isola-a9955b20/;", "or_profile": "~Minyoung_Huh1;~Brian_Cheung1;~Jeremy_Bernstein1;~Phillip_Isola1;~Pulkit_Agrawal1", "aff": "Massachusetts Institute of Technology;Massachusetts Institute of Technology;Massachusetts Institute of Technology;Massachusetts Institute of Technology;Massachusetts Institute of Technology", "aff_domain": "mit.edu;mit.edu;mit.edu;mit.edu;mit.edu", "position": "PhD student;Research Fellow;Postdoc;Associate Professor;Assistant Professor", "bibtex": "@misc{\nhuh2024training,\ntitle={Training Neural Networks from Scratch with Parallel Low-Rank Adapters},\nauthor={Minyoung Huh and Brian Cheung and Jeremy Bernstein and Phillip Isola and Pulkit Agrawal},\nyear={2024},\nurl={https://openreview.net/forum?id=1SO93f7sVf}\n}", "github": "", "project": "", "reviewers": "q4qF;Sixn;i1ro;aA3h", "site": "https://openreview.net/forum?id=1SO93f7sVf", "pdf_size": 2726951, "rating": "3;3;5;6", "confidence": "4;4;4;3", "soundness": "2;1;2;2", "contribution": "2;2;2;3", "presentation": "3;1;2;3", "wc_summary": "89;117;107;49", "wc_strengths": "54;103;101;67", "wc_weaknesses": "400;223;277;50", "wc_questions": "246;170;6;66", "wc_review": "789;613;491;232", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "2215;1068;547;460", "reply_reviewers": "0;0;0;0", "reply_authors": "5;2;1;1", "rating_avg": [ 4.25, 1.299038105676658 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 1.75, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.25, 0.82915619758885 ], "wc_summary_avg": [ 90.5, 25.975950415721076 ], "wc_strengths_avg": [ 81.25, 21.26470079733077 ], "wc_weaknesses_avg": [ 237.5, 125.8302427876542 ], "wc_questions_avg": [ 122.0, 92.56349172324907 ], "wc_review_avg": [ 531.25, 202.66274324601451 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 1072.5, 699.3984915625712 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 2.25, 1.6393596310755 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.7777777777777777, "gs_citation": 15, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=8115461409047773032&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "aff_unique_index": "0;0;0;0;0", "aff_unique_norm": "Massachusetts Institute of Technology", "aff_unique_dep": "", "aff_unique_url": "https://web.mit.edu", "aff_unique_abbr": "MIT", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "United States" }, { "title": "Be Careful What You Smooth For: Label Smoothing Can Be a Privacy Shield but Also a Catalyst for Model Inversion Attacks", "status": "Poster", "track": "main", 
"site": "https://iclr.cc/virtual/2024/poster/19586", "id": "1SbkubNdbW", "author_site": "Lukas Struppek, Dominik Hintersdorf, Kristian Kersting", "tldr": "", "abstract": "Label smoothing \u2013 using softened labels instead of hard ones \u2013 is a widely adopted regularization method for deep learning, showing diverse benefits such as enhanced generalization and calibration. Its implications for preserving model privacy, however, have remained unexplored. To fill this gap, we investigate the impact of label smoothing on model inversion attacks (MIAs), which aim to generate class-representative samples by exploiting the knowledge encoded in a classifier, thereby inferring sensitive information about its training data. Through extensive analyses, we uncover that traditional label smoothing fosters MIAs, thereby increasing a model's privacy leakage. Even more, we reveal that smoothing with negative factors counters this trend, impeding the extraction of class-related information and leading to privacy preservation, beating state-of-the-art defenses. This establishes a practical and powerful novel way for enhancing model resilience against MIAs.", "keywords": "model inversion attacks;privacy;label smoothing;defense", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/f571eba3be2633fb8ea8e19a64374cead84fb9b3.zip", "author": "Lukas Struppek;Dominik Hintersdorf;Kristian Kersting", "authorids": "~Lukas_Struppek1;~Dominik_Hintersdorf1;~Kristian_Kersting1", "gender": "M;M;M", "homepage": "https://lukasstruppek.github.io/;https://d0mih.github.io/;http://www.ml.informatik.tu-darmstadt.de/", "dblp": "306/1485;306/1325;40/3793", "google_scholar": "tU8K5qsAAAAJ;DKITUfsAAAAJ;QY-earAAAAAJ", "orcid": "0000-0003-0626-3672;0000-0003-4976-6894;0000-0002-2873-9152", "linkedin": "lukas-struppek/;;", "or_profile": "~Lukas_Struppek1;~Dominik_Hintersdorf1;~Kristian_Kersting1", "aff": "Technische Universit\u00e4t Darmstadt;CS Department, TU Darmstadt, Technische Universit\u00e4t Darmstadt;TU Darmstadt", "aff_domain": "tu-darmstadt.de;cs.tu-darmstadt.de;tu-darmstadt.de", "position": "PhD student;PhD student;Full Professor", "bibtex": "@inproceedings{\nstruppek2024be,\ntitle={Be Careful What You Smooth For: Label Smoothing Can Be a Privacy Shield but Also a Catalyst for Model Inversion Attacks},\nauthor={Lukas Struppek and Dominik Hintersdorf and Kristian Kersting},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=1SbkubNdbW}\n}", "github": "", "project": "", "reviewers": "EAeB;wJ7G;dNRe;22v2;uLpV", "pdf_size": 7637387, "rating": "5;6;6;6;8", "confidence": "4;4;5;2;4", "soundness": "3;3;2;2;2", "contribution": "2;3;2;3;3", "presentation": "3;3;3;4;3", "wc_summary": "37;77;65;28;57", "wc_strengths": "125;63;34;32;155", "wc_weaknesses": "206;87;848;187;178", "wc_questions": "73;17;11;59;1", "wc_review": "441;244;958;306;391", "wc_reply_reviewers": "0;43;506;0;23", "wc_reply_authors": "773;1369;4076;894;811", "reply_reviewers": "0;1;1;0;1", "reply_authors": "3;4;8;2;2", "rating_avg": [ 6.2, 0.9797958971132712 ], "confidence_avg": [ 3.8, 0.9797958971132712 ], "soundness_avg": [ 2.4, 0.4898979485566356 ], "contribution_avg": [ 2.6, 0.4898979485566356 ], "presentation_avg": [ 3.2, 0.39999999999999997 ], "wc_summary_avg": [ 52.8, 17.98221343439122 ], "wc_strengths_avg": [ 81.8, 49.68460526158983 ], "wc_weaknesses_avg": [ 301.2, 276.46149822353203 ], "wc_questions_avg": [ 32.2, 
28.414081016284864 ], "wc_review_avg": [ 468.0, 254.23532406021002 ], "wc_reply_reviewers_avg": [ 114.4, 196.4572218066824 ], "wc_reply_authors_avg": [ 1584.6, 1263.9333210260738 ], "reply_reviewers_avg": [ 0.6, 0.48989794855663565 ], "reply_authors_avg": [ 3.8, 2.2271057451320084 ], "replies_avg": [ 30, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.04166666666666666, "gs_citation": 22, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=15861784773542527773&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=1SbkubNdbW", "pdf": "https://openreview.net/pdf?id=1SbkubNdbW", "email": "tu-darmstadt.de;cs.tu-darmstadt.de;tu-darmstadt.de", "author_num": 3, "aff_unique_index": "0;0;0", "aff_unique_norm": "Technische Universit\u00e4t Darmstadt", "aff_unique_dep": "", "aff_unique_url": "https://www.tu-darmstadt.de", "aff_unique_abbr": "TUD", "aff_campus_unique_index": "1;1", "aff_campus_unique": ";Darmstadt", "aff_country_unique_index": "0;0;0", "aff_country_unique": "Germany" }, { "id": "1V1QQYARmd", "title": "Nearest neighbor-based out-of-distribution detection via label smoothing", "track": "main", "status": "Reject", "tldr": "", "abstract": "Detecting out-of-distribution (OOD) examples is critical in many applications. We propose an unsupervised method to detect OOD samples using a $k$-NN density estimate with respect to a classification model's intermediate activations on in-distribution samples. We leverage a recent insight about label smoothing, which we call the {\\it Label Smoothed Embedding Hypothesis}, and show that one of the implications is that the $k$-NN density estimator performs better as an OOD detection method both theoretically and empirically when the model is trained with label smoothing. 
Finally, we show that our proposal outperforms many OOD baselines and we also provide new finite-sample high-probability statistical results for $k$-NN density estimation's ability to detect OOD examples.", "keywords": "out-of-distribution detection;nearest neighbors;label smoothing;k-NN", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Dara Bahri;Heinrich Jiang;Yi Tay;Donald Metzler", "authorids": "~Dara_Bahri1;~Heinrich_Jiang1;~Yi_Tay1;~Donald_Metzler1", "gender": "M;M;M;M", "homepage": "http://www.dara.run;;http://yitay.net;https://research.google/people/DonaldMetzler/", "dblp": "231/7656;182/2472;;95/2272", "google_scholar": "j5PpTOwAAAAJ;;VBclY_cAAAAJ;bmXpOd8AAAAJ", "orcid": ";;;0000-0003-4276-6269", "linkedin": ";;;donmetzler/", "or_profile": "~Dara_Bahri1;~Heinrich_Jiang1;~Yi_Tay1;~Donald_Metzler1", "aff": "Google Research;Google;Google;Google", "aff_domain": "google.com;google.com;google.com;google.com", "position": "Research Scientist;Research scientist;Research Scientist;Research Scientist", "bibtex": "@misc{\nbahri2024nearest,\ntitle={Nearest neighbor-based out-of-distribution detection via label smoothing},\nauthor={Dara Bahri and Heinrich Jiang and Yi Tay and Donald Metzler},\nyear={2024},\nurl={https://openreview.net/forum?id=1V1QQYARmd}\n}", "github": "", "project": "", "reviewers": "dvW7;rYbM;rsM8;qE8z", "site": "https://openreview.net/forum?id=1V1QQYARmd", "pdf_size": 4927567, "rating": "3;5;6;8", "confidence": "3;3;3;3", "soundness": "2;2;2;4", "contribution": "2;2;2;4", "presentation": "1;2;3;4", "wc_summary": "30;40;64;47", "wc_strengths": "36;22;49;65", "wc_weaknesses": "95;103;128;29", "wc_questions": "72;125;135;42", "wc_review": "233;290;376;183", "wc_reply_reviewers": "87;0;37;0", "wc_reply_authors": "427;495;506;117", "reply_reviewers": "1;0;1;0", "reply_authors": "2;1;2;1", "rating_avg": [ 5.5, 1.8027756377319946 ], "confidence_avg": [ 3.0, 0.0 ], "soundness_avg": [ 2.5, 0.8660254037844386 ], "contribution_avg": [ 2.5, 0.8660254037844386 ], "presentation_avg": [ 2.5, 1.118033988749895 ], "wc_summary_avg": [ 45.25, 12.397076268217438 ], "wc_strengths_avg": [ 43.0, 15.890248582070704 ], "wc_weaknesses_avg": [ 88.75, 36.5812451947716 ], "wc_questions_avg": [ 93.5, 38.17394399325278 ], "wc_review_avg": [ 270.5, 71.71645557332013 ], "wc_reply_reviewers_avg": [ 31.0, 35.68613176011096 ], "wc_reply_authors_avg": [ 386.25, 158.36883373947035 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:QbU3QgMwBQUJ:scholar.google.com/&scioq=Nearest+neighbor-based+out-of-distribution+detection+via+label+smoothing&hl=en&as_sdt=0,14", "gs_version_total": 0, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "Google", "aff_unique_dep": "Google Research", "aff_unique_url": "https://research.google", "aff_unique_abbr": "Google Research", "aff_campus_unique_index": "0;0;0;0", "aff_campus_unique": "Mountain View", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "id": "1VcKvdYbUM", "title": "APBench: A Unified Benchmark for Availability Poisoning Attacks and Defenses", "track": "main", "status": "Reject", "tldr": "", "abstract": "The efficacy of availability poisoning, a method of poisoning data by injecting imperceptible perturbations to prevent its use in model training, 
has been a hot subject of investigation. Previous research suggested that it was difficult to effectively counteract such poisoning attacks. However, the introduction of various defense methods has challenged this notion. Due to the rapid progress in this field, the performance of different novel methods cannot be accurately validated due to variations in experimental setups. To further evaluate the attack and defense capabilities of these poisoning methods, we have developed a benchmark --- APBench for assessing the efficacy of adversarial poisoning. APBench consists of 9 state-of-the-art availability poisoning attacks, 8 defense algorithms, and 4 conventional data augmentation techniques. We also have set up experiments with varying different poisoning ratios, and evaluated the attacks on multiple datasets and their transferability across model architectures. We further conducted a comprehensive evaluation of 2 additional attacks specifically targeting unsupervised models. Our results reveal the glaring inadequacy of existing attacks in safeguarding individual privacy. APBench is open source and available to the deep learning community.", "keywords": "Availability Attacks;Data Protection;Privacy", "primary_area": "datasets and benchmarks", "supplementary_material": "/attachment/444e8cd8a0da355de7ca04beb34c5fa8766b1ab4.zip", "author": "Tianrui Qin;Xitong Gao;Juanjuan Zhao;Kejiang Ye;Cheng-zhong Xu", "authorids": "~Tianrui_Qin1;~Xitong_Gao1;~Juanjuan_Zhao1;~Kejiang_Ye1;~Cheng-zhong_Xu1", "gender": "M;M;F;;", "homepage": "https://github.com/Tianyue818;https://github.com/admk;https://people.ucas.ac.cn/~zhaojuanjuan?language=cn;;", "dblp": "294/4992;140/2071;;;", "google_scholar": "_bOMXMkAAAAJ;-YIUCL8AAAAJ;;;", "orcid": "0009-0002-8386-2003;0000-0002-2063-2051;;;", "linkedin": ";;;;", "or_profile": "~Tianrui_Qin1;~Xitong_Gao1;~Juanjuan_Zhao1;~Kejiang_Ye1;~Cheng-zhong_Xu1", "aff": "Shenzhen Institutes of Advanced Technology, Chinese Academy of Sciences, Chinese Academy of Sciences;Shenzhen Institute of Advanced Technology, Chinese Academy of Sciences;Shenzhen Institutes of Advanced Technology, Chinese Academy of Sciences, Chinese Academy of Sciences;;", "aff_domain": "siat.ac.cn;siat.ac.cn;siat.ac.cn;;", "position": "MS student;Researcher;Associate Professor;;", "bibtex": "@misc{\nqin2024apbench,\ntitle={{APB}ench: A Unified Benchmark for Availability Poisoning Attacks and Defenses},\nauthor={Tianrui Qin and Xitong Gao and Juanjuan Zhao and Kejiang Ye and Cheng-zhong Xu},\nyear={2024},\nurl={https://openreview.net/forum?id=1VcKvdYbUM}\n}", "github": "", "project": "", "reviewers": "gtEa;nmU1;WVAC;8Vbt", "site": "https://openreview.net/forum?id=1VcKvdYbUM", "pdf_size": 6134649, "rating": "3;3;5;6", "confidence": "4;5;4;4", "soundness": "2;1;3;3", "contribution": "2;2;2;3", "presentation": "1;3;2;3", "wc_summary": "22;72;123;104", "wc_strengths": "8;11;30;87", "wc_weaknesses": "16;29;21;190", "wc_questions": "244;554;641;55", "wc_review": "290;666;815;436", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "455;463;658;170", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 4.25, 1.299038105676658 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 2.25, 0.82915619758885 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.25, 0.82915619758885 ], "wc_summary_avg": [ 80.25, 38.25163395202877 ], "wc_strengths_avg": [ 34.0, 31.741140496207755 ], "wc_weaknesses_avg": [ 64.0, 72.89375830618147 ], "wc_questions_avg": [ 373.5, 
235.76948487876882 ], "wc_review_avg": [ 551.75, 202.6479397872083 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 436.5, 174.0179588433332 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 10, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.5555555555555555, "gs_citation": 10, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=4711376913267131339&as_sdt=80000005&sciodt=0,23&hl=en", "gs_version_total": 3, "aff_unique_index": "0;1;0", "aff_unique_norm": "Chinese Academy of Sciences;Shenzhen Institute of Advanced Technology", "aff_unique_dep": "Shenzhen Institutes of Advanced Technology;", "aff_unique_url": "http://www.cas.cn;http://www.siat.cas.cn", "aff_unique_abbr": "CAS;SIAT", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Shenzhen", "aff_country_unique_index": "0;0;0", "aff_country_unique": "China" }, { "title": "Beyond Stationarity: Convergence Analysis of Stochastic Softmax Policy Gradient Methods", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19585", "id": "1VeQ6VBbev", "author_site": "Sara Klein, Simon Weissmann, Leif D\u00f6ring", "tldr": "", "abstract": "Markov Decision Processes (MDPs) are a formal framework for modeling and solving sequential decision-making problems. In finite time horizons such problems are relevant for instance for optimal stopping or specific supply chain problems, but also in the training of large language models. In contrast to infinite horizon MDPs optimal policies are not stationary, policies must be learned for every single epoch. In practice all parameters are often trained simultaneously, ignoring the inherent structure suggested by dynamic programming. This paper introduces a combination of dynamic programming and policy gradient called dynamical policy gradient, where the parameters are trained backwards in time. \n \n For the tabular softmax parametrisation we carry out the convergence analysis for simultaneous and dynamic policy gradient towards global optima, both in the exact and sampled gradient settings without regularisation. 
It turns out that the use of dynamic policy gradient training much better exploits the structure of finite-time problems which is reflected in improved convergence bounds.", "keywords": "reinforcement learning;policy gradient;stochastic approximation;finite-time MDP", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/2c81ff9fb426afbf43cc32ae4539fee865a0d40b.pdf", "author": "Sara Klein;Simon Weissmann;Leif D\u00f6ring", "authorids": "~Sara_Klein1;~Simon_Weissmann1;~Leif_D\u00f6ring1", "gender": "F;M;M", "homepage": ";https://www.wim.uni-mannheim.de/doering/team/prof-dr-simon-weissmann/;https://www.wim.uni-mannheim.de/doering/", "dblp": "359/1702;246/5069;346/0412.html", "google_scholar": ";Pfxc_RgAAAAJ;", "orcid": ";0000-0002-5111-6658;0000-0002-4569-5083", "linkedin": "sara-klein-wima/;;leif-d\u00f6ring-0b002496/?originalSubdomain=de", "or_profile": "~Sara_Klein1;~Simon_Weissmann1;~Leif_D\u00f6ring1", "aff": "Universit\u00e4t Mannheim;University of Mannheim;Universit\u00e4t Mannheim", "aff_domain": "uni-mannheim.de;uni-mannheim.de;uni-mannheim.de", "position": "PhD student;Assistant Professor;Full Professor", "bibtex": "@inproceedings{\nklein2024beyond,\ntitle={Beyond Stationarity: Convergence Analysis of Stochastic Softmax Policy Gradient Methods},\nauthor={Sara Klein and Simon Weissmann and Leif D{\\\"o}ring},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=1VeQ6VBbev}\n}", "github": "", "project": "", "reviewers": "Y9J6;iprP;EGiX", "pdf_size": 735199, "rating": "6;8;8", "confidence": "3;3;3", "soundness": "3;4;3", "contribution": "3;3;3", "presentation": "2;4;3", "wc_summary": "79;160;37", "wc_strengths": "102;109;36", "wc_weaknesses": "128;20;49", "wc_questions": "58;44;269", "wc_review": "367;333;391", "wc_reply_reviewers": "0;60;0", "wc_reply_authors": "541;234;795", "reply_reviewers": "0;1;0", "reply_authors": "1;1;1", "rating_avg": [ 7.333333333333333, 0.9428090415820634 ], "confidence_avg": [ 3.0, 0.0 ], "soundness_avg": [ 3.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 3.0, 0.816496580927726 ], "wc_summary_avg": [ 92.0, 51.048996072400875 ], "wc_strengths_avg": [ 82.33333333333333, 32.8870119584549 ], "wc_weaknesses_avg": [ 65.66666666666667, 45.63867755411948 ], "wc_questions_avg": [ 123.66666666666667, 102.92499966264539 ], "wc_review_avg": [ 363.6666666666667, 23.79542439676633 ], "wc_reply_reviewers_avg": [ 20.0, 28.284271247461902 ], "wc_reply_authors_avg": [ 523.3333333333334, 229.3677299786427 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 9, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 8, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=7573781758097719815&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=1VeQ6VBbev", "pdf": "https://openreview.net/pdf?id=1VeQ6VBbev", "email": "uni-mannheim.de;uni-mannheim.de;uni-mannheim.de", "author_num": 3, "aff_unique_index": "0;0;0", "aff_unique_norm": "University of Mannheim", "aff_unique_dep": "", "aff_unique_url": "https://www.uni-mannheim.de", "aff_unique_abbr": "UM", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "Germany" }, { "id": "1WSd408I9M", "title": "Generative AI in healthcare: A trustworthy approach", "track": "main", 
"status": "Withdraw", "tldr": "", "abstract": "Generative AI in healthcare: A trustworthy approach\n\nAbstract: The recent advancements in self-supervised algorithms like Transformer Architecture and Diffusion models have expanded the means of applying AI in healthcare and life sciences. To achieve real world adoption, it is important to measure and audit the trustworthiness of the AI system as per the legal and compliance requirements for privacy, security, fairness, and safety. In this paper, we focus on the method to achieve trustworthiness in an LLM (Large Language Model) based decision support system for physicians. The stakeholders for this decision support system are patients, physicians, regulators, and external auditors. We focus on the limitations of large or foundation models and the method to overcome these limitations, with the aim of accelerating the adoption of this far-reaching technology in the healthcare sector. It also explores possible guardrails for safety and the methods for aligning AI systems to guardrails.\n\nOur Solution Approach:\nWe explore an approach to an AI system which can enhance decision capabilities by using the data and EHRs (Electronic Health Record) collected over many years for a vast volume of patients. The longitudinal data consists of biomarkers, disease progression indicators, treatment administered, and patient outcome. The goal of the system is to assist physicians in identifying the best treatment option for a given patient context. The LLM-based system will be able to predict optimal options based on hundreds of similar cases on which it was trained. The paper addresses the transparency, data integrity, model development, and performance validation of the system. In the sections below, we explore the various stages of development and deployment of such a system, the challenges, and the methods to overcome the challenges.", "keywords": "Generative AI;healthcare;trustworthy;Transformer Architecture;guardrails", "primary_area": "generative models", "supplementary_material": "", "author": "parul berry;Vishwesh Milind Bharadiya;Sree Kumar", "authorids": "~parul_berry1;~Vishwesh_Milind_Bharadiya1;~Sree_Kumar1", "gender": ";;M", "homepage": ";;https://www.linkedin.com/in/kumarsree/", "dblp": ";;", "google_scholar": ";;", "orcid": ";;", "linkedin": ";;", "or_profile": "~parul_berry1;~Vishwesh_Milind_Bharadiya1;~Sree_Kumar1", "aff": ";;Wipro Technologies", "aff_domain": ";;wipro.com", "position": ";;Researcher", "bibtex": "@misc{\nanonymous2024generative,\ntitle={Generative {AI} in healthcare: A trustworthy approach},\nauthor={Anonymous},\nyear={2024},\nurl={https://openreview.net/forum?id=1WSd408I9M}\n}", "github": "", "project": "", "reviewers": "8VP9;mU33;tPic", "site": "https://openreview.net/forum?id=1WSd408I9M", "pdf_size": 197634, "rating": "1;1;1", "confidence": "5;3;5", "soundness": "1;1;1", "contribution": "1;1;1", "presentation": "1;1;2", "wc_summary": "86;38;33", "wc_strengths": "30;41;23", "wc_weaknesses": "86;101;89", "wc_questions": "23;34;4", "wc_review": "225;214;149", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 1.0, 0.0 ], "confidence_avg": [ 4.333333333333333, 0.9428090415820634 ], "soundness_avg": [ 1.0, 0.0 ], "contribution_avg": [ 1.0, 0.0 ], "presentation_avg": [ 1.3333333333333333, 0.4714045207910317 ], "wc_summary_avg": [ 52.333333333333336, 23.893281249943232 ], "wc_strengths_avg": [ 31.333333333333332, 7.408703590297623 ], 
"wc_weaknesses_avg": [ 92.0, 6.48074069840786 ], "wc_questions_avg": [ 20.333333333333332, 12.39175353029407 ], "wc_review_avg": [ 196.0, 33.53605025441527 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:g-dr3QN8t_MJ:scholar.google.com/&scioq=Generative+AI+in+healthcare:+A+trustworthy+approach&hl=en&as_sdt=0,10", "gs_version_total": 0, "aff_unique_index": "0", "aff_unique_norm": "Wipro", "aff_unique_dep": "", "aff_unique_url": "https://www.wipro.com", "aff_unique_abbr": "Wipro", "aff_country_unique_index": "0", "aff_country_unique": "India" }, { "id": "1WceuzWff5", "title": "Understanding the Transfer of High-Level Reinforcement Learning Skills Across Diverse Environments", "track": "main", "status": "Reject", "tldr": "", "abstract": "A large number of reinforcement learning (RL) environments are available to the research community. However, due to differences across these environments, it is difficult to transfer skills learnt by a RL agent from one environment to another. For this transfer learning problem, a multitask RL perspective is considered in this paper, the goal being to transfer the skills from one environment to another using a single policy. To achieve such goal, we design an environment agnostic policy that enables the sharing of skills. Our experimental results demonstrate that: (a) by training on both desired environments using standard RL algorithms, the skills can be transferred from one environment to another; (b) by changing the amount of data that the RL algorithm uses to optimize the policy and value functions, we\nshow empirically that the transfer of knowledge between different environments is possible, and results in learning tasks with up to 84% fewer gradient update steps. 
This study takes an important step towards enabling more effective transfer of skills by learning in multitask RL scenarios across diverse environments by designing skill-sharing, sample-efficient RL training protocols.", "keywords": "reinforcement learning;representation learning;multi-task reinforcement learning;transfer learning", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Reginald McLean;Kai Yuan;Isaac Woungang;Nariman Farsad", "authorids": "~Reginald_McLean1;~Kai_Yuan1;~Isaac_Woungang2;~Nariman_Farsad1", "gender": "M;M;M;M", "homepage": "https://www.reggiemclean.ca/;https://www.linkedin.com/in/kai-yuan/;https://cs.torontomu.ca/~iwoungan/;http://narimanfarsad.com/", "dblp": ";;67/176.html;", "google_scholar": "gBBveasAAAAJ;8eLlbhMAAAAJ;https://scholar.google.ca/citations?user=sVTW2tMAAAAJ;https://scholar.google.com/citations?hl=en", "orcid": ";;;", "linkedin": "https://www.linkedin.com/mwlite/in/reginaldmclean;;;", "or_profile": "~Reginald_McLean1;~Kai_Yuan1;~Isaac_Woungang2;~Nariman_Farsad1", "aff": "Toronto Metropolitan University;Intel;Toronto Metropolitan University;Toronto Metropolitan University", "aff_domain": "torontomu.ca;intel.com;torontomu.ca;torontomu.ca", "position": "PhD student;Researcher;Full Professor;Assistant Professor", "bibtex": "@misc{\nmclean2024understanding,\ntitle={Understanding the Transfer of High-Level Reinforcement Learning Skills Across Diverse Environments},\nauthor={Reginald McLean and Kai Yuan and Isaac Woungang and Nariman Farsad},\nyear={2024},\nurl={https://openreview.net/forum?id=1WceuzWff5}\n}", "github": "", "project": "", "reviewers": "Um91;awjg;NkEv;8Y8K", "site": "https://openreview.net/forum?id=1WceuzWff5", "pdf_size": 1796034, "rating": "3;3;3;5", "confidence": "4;5;5;3", "soundness": "1;2;2;2", "contribution": "1;2;1;3", "presentation": "2;2;1;3", "wc_summary": "79;78;158;83", "wc_strengths": "28;244;43;140", "wc_weaknesses": "211;255;133;413", "wc_questions": "2;281;49;375", "wc_review": "320;858;383;1011", "wc_reply_reviewers": "325;0;170;505", "wc_reply_authors": "399;510;903;1697", "reply_reviewers": "1;0;1;1", "reply_authors": "1;1;2;3", "rating_avg": [ 3.5, 0.8660254037844386 ], "confidence_avg": [ 4.25, 0.82915619758885 ], "soundness_avg": [ 1.75, 0.4330127018922193 ], "contribution_avg": [ 1.75, 0.82915619758885 ], "presentation_avg": [ 2.0, 0.7071067811865476 ], "wc_summary_avg": [ 99.5, 33.826764551165695 ], "wc_strengths_avg": [ 113.75, 86.62094146336669 ], "wc_weaknesses_avg": [ 253.0, 102.18610473053565 ], "wc_questions_avg": [ 176.75, 155.7471909859051 ], "wc_review_avg": [ 643.0, 297.3121255515826 ], "wc_reply_reviewers_avg": [ 250.0, 186.78195844352848 ], "wc_reply_authors_avg": [ 877.25, 508.98151980204545 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 1.75, 0.82915619758885 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.8703882797784891, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:HK4IaEpE5oQJ:scholar.google.com/&scioq=Understanding+the+Transfer+of+High-Level+Reinforcement+Learning+Skills+Across+Diverse+Environments&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1;0;0", "aff_unique_norm": "Toronto Metropolitan University;Intel", "aff_unique_dep": ";Intel Corporation", "aff_unique_url": "https://www.tmu.ca/;https://www.intel.com", "aff_unique_abbr": "TMU;Intel", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;0;0", 
"aff_country_unique": "Canada;United States" }, { "title": "Beyond IID weights: sparse and low-rank deep Neural Networks are also Gaussian Processes", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19584", "id": "1Wi0Ys33Nm", "author_site": "Thiziri Nait Saada, Alireza Naderi, Jared Tanner", "tldr": "", "abstract": "The infinitely wide neural network has been proven a useful and manageable mathematical model that enables the understanding of many phenomena appearing in deep learning. One example is the convergence of random deep networks to Gaussian processes that enables a rigorous analysis of the way the choice of activation function and network weights impacts the training dynamics. In this paper, we extend the seminal proof of Matthews et al., 2018 to a larger class of initial weight distributions (which we call pseudo-iid), including the established cases of iid and orthogonal weights, as well as the emerging low-rank and structured sparse settings celebrated for their computational speed-up benefits. We show that fully-connected and convolutional networks initialised with pseudo-iid distributions are all effectively equivalent up to their variance. Using our results, one can identify the Edge of Chaos for a broader class of neural networks and tune them at criticality in order to enhance their training. Moreover, they enable the posterior distribution of Bayesian Neural Networks to be tractable across these various initialization schemes.", "keywords": "Deep Neural Networks;Gaussian processes;Neural Networks initialisation;Edge of chaos;Large width limit;Mean-Field", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Thiziri Nait Saada;Alireza Naderi;Jared Tanner", "authorids": "~Thiziri_Nait_Saada1;~Alireza_Naderi1;~Jared_Tanner1", "gender": "F;M;", "homepage": ";;http://people.maths.ox.ac.uk/tanner/publications.shtml", "dblp": ";;85/1256", "google_scholar": ";n9_Av0AAAAAJ;https://scholar.google.co.uk/citations?user=J7248tkAAAAJ", "orcid": ";;", "linkedin": "thiziri-nait-saada-4332021b2;;", "or_profile": "~Thiziri_Nait_Saada1;~Alireza_Naderi1;~Jared_Tanner1", "aff": "University of Oxford;University of Oxford;University of Oxford", "aff_domain": "ox.ac.uk;ox.ac.uk;ox.ac.uk", "position": "PhD student;PhD student;Full Professor", "bibtex": "@inproceedings{\nsaada2024beyond,\ntitle={Beyond {IID} weights: sparse and low-rank deep Neural Networks are also Gaussian Processes},\nauthor={Thiziri Nait Saada and Alireza Naderi and Jared Tanner},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=1Wi0Ys33Nm}\n}", "github": "", "project": "", "reviewers": "rGFF;SWNp;uyEL;EeDC", "pdf_size": 8344303, "rating": "5;6;6;8", "confidence": "3;3;3;2", "soundness": "3;2;3;3", "contribution": "2;2;3;3", "presentation": "1;3;3;4", "wc_summary": "28;49;92;128", "wc_strengths": "27;62;57;111", "wc_weaknesses": "114;16;110;39", "wc_questions": "118;32;160;21", "wc_review": "287;159;419;299", "wc_reply_reviewers": "0;137;0;0", "wc_reply_authors": "738;372;616;431", "reply_reviewers": "0;1;0;0", "reply_authors": "1;2;1;1", "rating_avg": [ 6.25, 1.0897247358851685 ], "confidence_avg": [ 2.75, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.75, 1.0897247358851685 ], "wc_summary_avg": [ 74.25, 38.66765444140619 ], "wc_strengths_avg": [ 64.25, 30.127852562039664 ], 
"wc_weaknesses_avg": [ 69.75, 43.04866432306582 ], "wc_questions_avg": [ 82.75, 58.30683922148413 ], "wc_review_avg": [ 291.0, 92.04346799203081 ], "wc_reply_reviewers_avg": [ 34.25, 59.322740159234044 ], "wc_reply_authors_avg": [ 539.25, 145.8447376493235 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.9271726499455306, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11557098523946512237&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 0, "openreview": "https://openreview.net/forum?id=1Wi0Ys33Nm", "pdf": "https://openreview.net/pdf?id=1Wi0Ys33Nm", "email": "ox.ac.uk;ox.ac.uk;ox.ac.uk", "author_num": 3, "aff_unique_index": "0;0;0", "aff_unique_norm": "University of Oxford", "aff_unique_dep": "", "aff_unique_url": "https://www.ox.ac.uk", "aff_unique_abbr": "Oxford", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United Kingdom" }, { "id": "1X99YOwQfI", "title": "Controllable Pareto Trade-off between Fairness and Accuracy", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "The fairness-accuracy trade-off is a fundamental challenge in machine learning.While simply combining the two objectives can result in mediocre or extreme solutions, multi-objective optimization (MOO) could potentially provide diverse trade-offs by visiting different regions of the Pareto front. However, MOO methods usually lack precise control of the trade-offs. They rely on the full gradient per objective and inner products between these gradients to determine the update direction, which can be prone to large data sizes and the curse of dimensionality when training millions of parameters for neural networks. Moreover, the trade-off is usually sensitive to naive stochastic gradients due to the imbalance of groups in each batch and the existence of various trivial directions to improve fairness. To address these challenges, we propose \u201cControllable Pareto Trade-off (CPT)\u201d that can effectively train models performing different trade-offs defined by reference vectors. CPT begins with a correction stage that solely approaches the reference vector and then includes the discrepancy between the reference and the two objectives as the third objective in the rest training. To overcome the issues caused by\nhigh-dimensional stochastic gradients, CPT (1) uses a moving average of stochastic gradients to determine the update direction; and (2) prunes the gradients by only comparing different objectives\u2019 gradients on the critical parameters. Experiments show that CPT can achieve a higher-quality set of diverse models on the Pareto front performing different yet better trade-offs between fairness and accuracy than existing MOO approaches. 
It also exhibits better controllability and can precisely follow the human-defined reference vectors.", "keywords": "Multi-objective optimization;Fairness-accuracy trade-off", "primary_area": "optimization", "supplementary_material": "", "author": "Yongkang Du;Jieyu Zhao;Yijun Yang;Tianyi Zhou", "authorids": "~Yongkang_Du1;~Jieyu_Zhao1;~Yijun_Yang3;~Tianyi_Zhou1", "gender": "M;F;M;M", "homepage": "https://yongkdu.github.io/;http://jyzhao.net/;https://stevenyangyj.github.io/;https://tianyizhou.github.io/", "dblp": "321/7311;59/2379-1;;88/8205-1", "google_scholar": "LYu-0z0AAAAJ;9VaGBCQAAAAJ;X0quXnsAAAAJ;OKvgizMAAAAJ", "orcid": ";;;0000-0001-5348-0632", "linkedin": "yongkang-du/;;;tianyizhou", "or_profile": "~Yongkang_Du1;~Jieyu_Zhao1;~Yijun_Yang3;~Tianyi_Zhou1", "aff": "Pennsylvania State University;University of Southern California;University of Technology Sydney;University of Maryland, College Park", "aff_domain": "psu.edu;usc.edu;uts.edu.au;umd.edu", "position": "PhD student;Assistant Professor;PhD student;Assistant Professor", "bibtex": "@misc{\ndu2024controllable,\ntitle={Controllable Pareto Trade-off between Fairness and Accuracy},\nauthor={Yongkang Du and Jieyu Zhao and Yijun Yang and Tianyi Zhou},\nyear={2024},\nurl={https://openreview.net/forum?id=1X99YOwQfI}\n}", "github": "", "project": "", "reviewers": "MTak;8pma;whui", "site": "https://openreview.net/forum?id=1X99YOwQfI", "pdf_size": 1099856, "rating": "3;3;3", "confidence": "3;3;4", "soundness": "3;1;2", "contribution": "2;2;2", "presentation": "3;2;1", "wc_summary": "132;112;122", "wc_strengths": "64;23;35", "wc_weaknesses": "241;254;407", "wc_questions": "73;113;7", "wc_review": "510;502;571", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 3.0, 0.0 ], "confidence_avg": [ 3.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 2.0, 0.816496580927726 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.0, 0.816496580927726 ], "wc_summary_avg": [ 122.0, 8.16496580927726 ], "wc_strengths_avg": [ 40.666666666666664, 17.21110752456745 ], "wc_weaknesses_avg": [ 300.6666666666667, 75.37609405876346 ], "wc_questions_avg": [ 64.33333333333333, 43.70608907489003 ], "wc_review_avg": [ 527.6666666666666, 30.814859330452176 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 3, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:KWYG2L1ZRn4J:scholar.google.com/&scioq=Controllable+Pareto+Trade-off+between+Fairness+and+Accuracy&hl=en&as_sdt=0,5", "gs_version_total": 2, "aff_unique_index": "0;1;2;3", "aff_unique_norm": "Pennsylvania State University;University of Southern California;University of Technology Sydney;University of Maryland", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.psu.edu;https://www.usc.edu;https://www.uts.edu.au;https://www/umd.edu", "aff_unique_abbr": "PSU;USC;UTS;UMD", "aff_campus_unique_index": "1;2", "aff_campus_unique": ";Los Angeles;College Park", "aff_country_unique_index": "0;0;1;0", "aff_country_unique": "United States;Australia" }, { "id": "1XDG1Z5Nhk", "title": "Sparse Backpropagation for MoE Training", "track": "main", "status": "Reject", "tldr": "", "abstract": "One defining characteristic of Mixture-of-Expert (MoE) models is their capacity for conducting sparse computation via expert routing, leading to 
remarkable scalability. However, backpropagation, the cornerstone of deep learning, requires dense computation, thereby posting challenges in MoE gradient computations. Here, we introduce SparseMixer, a scalable gradient estimator that bridges the gap between backpropagation and sparse expert routing. Unlike typical MoE training which strategically neglects certain gradient terms for the sake of sparse computation and scalability, SparseMixer provides scalable gradient approximations for these terms, enabling reliable gradient estimation in MoE training. Grounded in a numerical ODE framework, SparseMixer harnesses the mid-point method, a second-order ODE solver, to deliver precise gradient approximations with negligible computational overhead. Applying SparseMixer to Switch Transformer on both pre-training and machine translation tasks, SparseMixer showcases considerable performance gain, accelerating training convergence by up to 2 times.", "keywords": "Mixture-of-Expert;MoE;Sparsity;Backpropagation;Straight Through", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/e8b408b03d5274efe07a8fc6981911cbdc38ff9f.zip", "author": "Liyuan Liu;Jianfeng Gao;Weizhu Chen", "authorids": "~Liyuan_Liu3;~Jianfeng_Gao1;~Weizhu_Chen1", "gender": "M;M;M", "homepage": "https://www.microsoft.com/en-us/research/people/jfgao/;https://www.microsoft.com/en-us/research/people/wzchen/;https://liyuanlucasliu.github.io/", "dblp": "92/5339;79/2536;06/1624", "google_scholar": "https://scholar.google.com/citations?hl=en;LG_E-4EAAAAJ;RmvbkzYAAAAJ", "orcid": ";;", "linkedin": ";;", "or_profile": "~Jianfeng_Gao1;~Weizhu_Chen1;~Liyuan_Liu1", "aff": "Microsoft Research;Microsoft GenAI;University of Illinois, Urbana Champaign", "aff_domain": "microsoft.com;microsoft.com;illinois.edu", "position": "Principal Researcher;Vice President;PhD student", "bibtex": "@misc{\nliu2024sparse,\ntitle={Sparse Backpropagation for MoE Training},\nauthor={Liyuan Liu and Jianfeng Gao and Weizhu Chen},\nyear={2024},\nurl={https://openreview.net/forum?id=1XDG1Z5Nhk}\n}", "github": "", "project": "", "reviewers": "yUXn;D3YK;4GtZ;tyBo", "site": "https://openreview.net/forum?id=1XDG1Z5Nhk", "pdf_size": 452975, "rating": "3;5;5;6", "confidence": "3;3;4;3", "soundness": "3;3;3;3", "contribution": "2;3;2;2", "presentation": "3;3;3;2", "wc_summary": "56;75;138;52", "wc_strengths": "51;44;70;47", "wc_weaknesses": "307;59;144;208", "wc_questions": "45;3;5;34", "wc_review": "459;181;357;341", "wc_reply_reviewers": "247;0;0;0", "wc_reply_authors": "631;456;444;550", "reply_reviewers": "1;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 4.75, 1.0897247358851685 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 80.25, 34.455587355318734 ], "wc_strengths_avg": [ 53.0, 10.124228365658293 ], "wc_weaknesses_avg": [ 179.5, 90.62146544831418 ], "wc_questions_avg": [ 21.75, 18.18481509391833 ], "wc_review_avg": [ 334.5, 99.51256202108355 ], "wc_reply_reviewers_avg": [ 61.75, 106.95413736737817 ], "wc_reply_authors_avg": [ 520.25, 75.98149445753222 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.13245323570650439, "gs_citation": 7, "gs_cited_by_link": 
"https://scholar.google.com/scholar?cites=15288756663620775966&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 5, "aff_unique_index": "0;0;1", "aff_unique_norm": "Microsoft;University of Illinois Urbana-Champaign", "aff_unique_dep": "Microsoft Research;", "aff_unique_url": "https://www.microsoft.com/en-us/research;https://illinois.edu", "aff_unique_abbr": "MSR;UIUC", "aff_campus_unique_index": "1", "aff_campus_unique": ";Urbana-Champaign", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "1XHzHMQfcK", "title": "Significance of Fairly Distributed Instances and Optimal Ratio for Validation Set in Machine Learning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Machine learning plays a crucial role in various research areas and industries. The effectiveness of machine learning models relies heavily on the quality and quantity of training data. To evaluate model performance on unseen data, it is important to divide the data into training and testing data sets. A three-way split into train-validation-test data-sets is also commonly used to create robust and generalized models. Validation set helps in tuning hyper-parameters to mitigate the problem of overfitting. It is of utmost importance to achieve precise and true portrayal of data across all three categories of data-sets: training, testing, and validation. Previous research has explored various statistical techniques such as 'SPlit' aimed to ensure proper membership of the complete data in the test set. Despite the utilization of these techniques, Insufficient evidence exists regarding the equitable treatment of the validation set. Although cross-validation is widely used for validation, randomly selecting the validation part may not be the complete representative of overall data, hindering the creation of a generalized model suitable for the test data. This work focuses on extracting validation sets using the Support Points method in 'SPlit' to obtain accurate data membership. 
Results demonstrate significant accuracy improvement when both test and validation sets are selected using the Support Points method.", "keywords": "Data Split;Support Points;SPlit;validation Set;Optimal Ratio;Significance of validation set", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Hina Nasir;Dr Archana Pandita;Chaudhary Nauman bin Nasir", "authorids": "hinanasirch@gmail.com;~Dr_Archana_Pandita1;~Chaudhary_Nauman_bin_Nasir1", "gender": ";;M", "homepage": ";;", "dblp": ";;", "google_scholar": ";;", "orcid": ";;", "linkedin": ";;chnaumannasir/", "or_profile": "hinanasirch@gmail.com;~Dr_Archana_Pandita1;~Chaudhary_Nauman_bin_Nasir1", "aff": ";;", "aff_domain": ";;", "position": ";;", "bibtex": "@misc{\nnasir2024significance,\ntitle={Significance of Fairly Distributed Instances and Optimal Ratio for Validation Set in Machine Learning},\nauthor={Hina Nasir and Dr Archana Pandita and Chaudhary Nauman bin Nasir},\nyear={2024},\nurl={https://openreview.net/forum?id=1XHzHMQfcK}\n}", "github": "", "project": "", "reviewers": "", "site": "https://openreview.net/forum?id=1XHzHMQfcK", "pdf_size": 0, "rating": "", "confidence": "", "soundness": "", "contribution": "", "presentation": "", "wc_summary": "", "wc_strengths": "", "wc_weaknesses": "", "wc_questions": "", "wc_review": "", "wc_reply_reviewers": "", "wc_reply_authors": "", "reply_reviewers": "", "reply_authors": "", "rating_avg": [ 0, 0 ], "confidence_avg": [ 0, 0 ], "soundness_avg": [ 0, 0 ], "contribution_avg": [ 0, 0 ], "presentation_avg": [ 0, 0 ], "wc_summary_avg": [ 0, 0 ], "wc_strengths_avg": [ 0, 0 ], "wc_weaknesses_avg": [ 0, 0 ], "wc_questions_avg": [ 0, 0 ], "wc_review_avg": [ 0, 0 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 0, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:ye5NfBelT3gJ:scholar.google.com/&scioq=Significance+of+Fairly+Distributed+Instances+and+Optimal+Ratio+for+Validation+Set+in+Machine+Learning&hl=en&as_sdt=0,33", "gs_version_total": 0 }, { "id": "1XReHUSUp9", "title": "Monsters in the Dark: Sanitizing Hidden Threats with Diffusion Models", "track": "main", "status": "Reject", "tldr": "", "abstract": "Steganography is the art of hiding information in plain sight. This form of covert communication can be used by bad actors to propagate malware, exfiltrate victim data, and communicate with other bad actors. Current image steganography defenses rely upon steganalysis, or the detection of hidden messages. These methods, however, are non-blind as they require information about known steganography techniques and are easily bypassed. Recent work has instead focused on a defense mechanism known as sanitization, which eliminates hidden information from images. In this work, we introduce a novel blind deep learning steganography sanitization method that utilizes a diffusion model framework to sanitize universal and dependent steganography (DM-SUDS), which both sanitizes and preserves image quality. We evaluate this approach against state-of-the-art deep learning sanitization frameworks and provide further detailed analysis through an ablation study. DM-SUDS outperforms previous sanitization methods and improves image preservation MSE by 71.32\\%, PSNR by 22.43\\% and SSIM by 17.30\\%. 
This is the first blind deep learning image sanitization framework to meet these image quality results.", "keywords": "representation learning;security;computer vision;steganography", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/90b0f2d5d7ea4dac24695f7924948a9da1ba8c9f.pdf", "author": "Preston K Robinette;Daniel Moyer;Taylor T Johnson", "authorids": "~Preston_K_Robinette1;~Daniel_Moyer3;~Taylor_T_Johnson1", "gender": "F;M;M", "homepage": ";https://dcmoyer.github.io;http://www.TaylorTJohnson.com/", "dblp": "260/0809.html;187/6201;96/11505", "google_scholar": ";sKmoxSMAAAAJ;https://scholar.google.com.tw/citations?user=MdTkXNYAAAAJ", "orcid": "0000-0002-4906-2179;;0000-0001-8021-9923", "linkedin": "prestonrobinette/;;taylortjohnson/", "or_profile": "~Preston_K_Robinette1;~Daniel_Moyer2;~Taylor_Johnson1", "aff": "Vanderbilt University;Vanderbilt University;Vanderbilt University", "aff_domain": "vanderbilt.edu;vanderbilt.edu;vanderbilt.edu", "position": "PhD student;Assistant Professor;Associate Professor", "bibtex": "@misc{\nrobinette2024monsters,\ntitle={Monsters in the Dark: Sanitizing Hidden Threats with Diffusion Models},\nauthor={Preston K Robinette and Daniel Moyer and Taylor T Johnson},\nyear={2024},\nurl={https://openreview.net/forum?id=1XReHUSUp9}\n}", "github": "", "project": "", "reviewers": "zZQW;158U;sHuH;Ha3d", "site": "https://openreview.net/forum?id=1XReHUSUp9", "pdf_size": 1045040, "rating": "3;5;6;8", "confidence": "5;5;3;5", "soundness": "2;3;3;3", "contribution": "1;2;3;3", "presentation": "2;3;3;4", "wc_summary": "305;58;29;85", "wc_strengths": "13;21;15;52", "wc_weaknesses": "83;515;62;215", "wc_questions": "39;2;6;99", "wc_review": "440;596;112;451", "wc_reply_reviewers": "372;0;0;0", "wc_reply_authors": "1684;750;204;546", "reply_reviewers": "1;0;0;0", "reply_authors": "3;1;1;1", "rating_avg": [ 5.5, 1.8027756377319946 ], "confidence_avg": [ 4.5, 0.8660254037844386 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.82915619758885 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 119.25, 109.05589163360226 ], "wc_strengths_avg": [ 25.25, 15.722197683530124 ], "wc_weaknesses_avg": [ 218.75, 180.8153408867732 ], "wc_questions_avg": [ 36.5, 38.836194458262774 ], "wc_review_avg": [ 399.75, 177.17276173272234 ], "wc_reply_reviewers_avg": [ 93.0, 161.0807251039056 ], "wc_reply_authors_avg": [ 796.0, 548.5489950770123 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.5, 0.8660254037844386 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.16012815380508713, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=9133272584659701835&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "aff_unique_index": "0;0;0", "aff_unique_norm": "Vanderbilt University", "aff_unique_dep": "", "aff_unique_url": "https://www.vanderbilt.edu", "aff_unique_abbr": "Vanderbilt", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "1XarNmzbgG", "title": "Understanding of Server-Assisted Federated Learning with Incomplete Client Participation", "track": "main", "status": "Reject", "tldr": "", "abstract": "Existing works in federated learning (FL) often assumes an ideal system with either full client or uniformly distributed client participation. 
\nHowever, in practice, it has been observed that some clients may never participate in FL training (aka incomplete client participation) due to a myriad of system heterogeneity factors. To mitigate impacts of incomplete client participation, a popular approach is the server-assisted federated learning (SA-FL) framework, where the server is equipped with an auxiliary dataset. However, despite the fact that SA-FL has been empirically shown to be effective in addressing the incomplete client participation problem, there remains a lack of theoretical understanding for SA-FL. Meanwhile, the ramifications of incomplete client participation in conventional FL is also poorly understood. These theoretical gaps motivate us to rigorously investigate SA-FL. Toward this end, to fully understand the impact of incomplete client participation on conventional FL, we first show that conventional FL is {\\em not} PAC-learnable under incomplete client participation in the worst case. Then, we show that the PAC-learnability of FL with incomplete client participation can indeed be revived by SA-FL, which theoretically justifies the use of SA-FL for the first time. Lastly, to provide practical guidance for SA-FL training under {\\em incomplete client participation}, we propose the SAFARI (server-assisted federated averaging) algorithm that enjoys the same linear convergence speedup guarantees as classic FL with ideal client participation assumptions, offering the first SA-FL algorithm with convergence guarantee. Extensive experiments on different datasets show SAFARI significantly improve the performance under incomplete client participation.", "keywords": "federated learning;client participation;probably approximately correct;statistical learning", "primary_area": "learning theory", "supplementary_material": "/attachment/8e2188b61ace254aa10b49d4f0fec35cdbd93f9d.pdf", "author": "Haibo Yang;Peiwen Qiu;Prashant Khanduri;Minghong Fang;Jia Liu", "authorids": "~Haibo_Yang1;~Peiwen_Qiu1;~Prashant_Khanduri1;~Minghong_Fang1;~Jia_Liu1", "gender": "M;F;M;M;M", "homepage": "https://haibo-yang-osu.github.io/homepage/;;https://sites.google.com/view/khanduri-prashant/home?authuser=0;https://minghongfang.com/;https://kevinliu-osu.github.io/index.html", "dblp": "43/7829-1;287/6757;158/4888;157/0863;", "google_scholar": "eyy22VoAAAAJ;LzaQe5sAAAAJ;;L6vkkC8AAAAJ;Ofx3dScAAAAJ", "orcid": "0000-0002-3245-2728;;;0000-0002-1365-3911;", "linkedin": ";peiwen-qiu/;prashant-khanduri-0497894b/;;", "or_profile": "~Haibo_Yang1;~Peiwen_Qiu1;~Prashant_Khanduri1;~Minghong_Fang1;~Jia_Liu1", "aff": "Rochester Institute of Technology;Ohio State University, Columbus;Wayne State University;Duke University;The Ohio State University", "aff_domain": "rit.edu;osu.edu;wayne.edu;duke.edu;osu.edu", "position": "Assistant Professor;PhD student;Assistant Professor;Postdoc;Assistant Professor", "bibtex": "@misc{\nyang2024understanding,\ntitle={Understanding of Server-Assisted Federated Learning with Incomplete Client Participation},\nauthor={Haibo Yang and Peiwen Qiu and Prashant Khanduri and Minghong Fang and Jia Liu},\nyear={2024},\nurl={https://openreview.net/forum?id=1XarNmzbgG}\n}", "github": "", "project": "", "reviewers": "65h6;JHPN;SJXE;Yuno", "site": "https://openreview.net/forum?id=1XarNmzbgG", "pdf_size": 473051, "rating": "3;3;5;8", "confidence": "4;4;3;3", "soundness": "2;3;2;3", "contribution": "2;2;2;3", "presentation": "3;2;2;4", "wc_summary": "117;50;137;155", "wc_strengths": "134;52;128;17", "wc_weaknesses": "2321;50;468;117", 
"wc_questions": "40;322;42;15", "wc_review": "2612;474;775;304", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.75, 2.0463381929681126 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.82915619758885 ], "wc_summary_avg": [ 114.75, 39.72640809335775 ], "wc_strengths_avg": [ 82.75, 49.85666956386076 ], "wc_weaknesses_avg": [ 739.0, 927.061216964662 ], "wc_questions_avg": [ 104.75, 125.87965482952359 ], "wc_review_avg": [ 1041.25, 922.4227271159357 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 6, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.8551861104941366, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:-pEe_yhagpoJ:scholar.google.com/&scioq=Understanding+of+Server-Assisted+Federated+Learning+with+Incomplete+Client+Participation&hl=en&as_sdt=0,44", "gs_version_total": 0, "aff_unique_index": "0;1;2;3;1", "aff_unique_norm": "Rochester Institute of Technology;Ohio State University;Wayne State University;Duke University", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.rit.edu;https://www.osu.edu;https://wayne.edu;https://www.duke.edu", "aff_unique_abbr": "RIT;OSU;WSU;Duke", "aff_campus_unique_index": "1", "aff_campus_unique": ";Columbus", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "1Xcqp27Unx", "title": "Knowledge Crosswords: Geometric Reasoning over Structured Knowledge with Large Language Models", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Large language models (LLMs) are widely adopted in knowledge-intensive tasks and have achieved impressive performance thanks to their knowledge abilities. While LLMs have demonstrated outstanding performance on atomic or linear (multi-hop) QA tasks, whether they can reason in knowledge-rich scenarios with interweaving constraints remains an underexplored problem. In this work, we propose geometric reasoning over structured knowledge, where pieces of knowledge are connected in a graph structure and models need to fill in the missing information of this graph. Such geometric knowledge reasoning would require the ability to handle structured knowledge, reason with uncertainty, verify facts, and backtrack when an error occurs. We specifically propose Knowledge Crosswords, a multi-blank QA dataset where each problem consists of a natural language question representing the geometric constraints of an incomplete entity network, where LLMs are tasked with working out the missing entities while meeting all factual constraints. Knowledge Crosswords contains 2,101 individual problems, covering a wide array of knowledge domains and further divided into three difficulty levels. We conduct extensive experiments to evaluate existing LLM prompting approaches on the Knowledge Crosswords benchmark. We additionally propose two new approaches, Staged Prompting and Verify-All, to augment LLMs' ability to backtrack and verify structured constraints. Our results demonstrate that while baseline approaches perform well on easier problems but struggle with questions on the hard side, our proposed Verify-All outperforms other methods by a large margin and is more robust with hard problems. 
Further analysis reveals that LLMs' ability of geometric reasoning over structured knowledge is still far from robust or perfect, susceptible to confounders such as the order of options, certain structural patterns, assumption of existence of correct answer, and more.", "keywords": "knowledge crosswords;large language models;structured knowledge;geometric reasoning", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/f587d2b679b6c426005c33071c62f80ffc216f60.zip", "author": "Wenxuan Ding;Shangbin Feng;Yuhan Liu;Zhaoxuan Tan;Vidhisha Balachandran;Tianxing He;Yulia Tsvetkov", "authorids": "~Wenxuan_Ding1;~Shangbin_Feng1;~Yuhan_Liu9;~Zhaoxuan_Tan1;~Vidhisha_Balachandran1;~Tianxing_He1;~Yulia_Tsvetkov1", "gender": "F;M;F;M;F;M;F", "homepage": "https://wenwen-d.github.io/;https://bunsenfeng.github.io/;https://www.yhliu-nlp.info/;https://tamsiuhin.github.io/;https://vidhishanair.github.io/;https://cloudygoose.github.io/;https://homes.cs.washington.edu/~yuliats/", "dblp": "36/1339-1;295/9571;;301/7706;234/4867;149/0111;75/8157", "google_scholar": "GyHBjwQAAAAJ;Y3rLP9UAAAAJ;or-2JE8AAAAJ;0KE2CZsAAAAJ;LgitgaIAAAAJ;egmfjjwAAAAJ;SEDPkrsAAAAJ", "orcid": ";0000-0002-4133-1987;;0000-0001-8230-6238;;;0000-0002-4634-7128", "linkedin": "wenxuan-ding-0b299923b/;;;zhaoxuan-tan-927132213/;;;", "or_profile": "~Wenxuan_Ding1;~Shangbin_Feng1;~Yuhan_Liu9;~Zhaoxuan_Tan1;~Vidhisha_Balachandran1;~Tianxing_He1;~Yulia_Tsvetkov1", "aff": "Hong Kong University of Science and Technology;University of Washington;Xi'an Jiaotong University;University of Notre Dame;Carnegie Mellon University;University of Washington;Department of Computer Science, University of Washington", "aff_domain": "ust.hk;cs.washington.edu;xjtu.edu.cn;nd.edu;cmu.edu;cs.washington.edu;cs.washington.edu", "position": "Undergrad student;PhD student;Undergrad student;PhD student;PhD student;Postdoc;Associate Professor", "bibtex": "@misc{\nding2024knowledge,\ntitle={Knowledge Crosswords: Geometric Reasoning over Structured Knowledge with Large Language Models},\nauthor={Wenxuan Ding and Shangbin Feng and Yuhan Liu and Zhaoxuan Tan and Vidhisha Balachandran and Tianxing He and Yulia Tsvetkov},\nyear={2024},\nurl={https://openreview.net/forum?id=1Xcqp27Unx}\n}", "github": "", "project": "", "reviewers": "3S11;DY7D;iJEx;mbzm", "site": "https://openreview.net/forum?id=1Xcqp27Unx", "pdf_size": 780044, "rating": "3;3;5;6", "confidence": "4;4;3;4", "soundness": "2;3;3;4", "contribution": "2;1;2;2", "presentation": "3;3;3;4", "wc_summary": "59;161;62;120", "wc_strengths": "59;186;30;128", "wc_weaknesses": "101;659;43;156", "wc_questions": "109;278;27;58", "wc_review": "328;1284;162;462", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.25, 1.299038105676658 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 100.5, 42.55878287733332 ], "wc_strengths_avg": [ 100.75, 60.74279792699707 ], "wc_weaknesses_avg": [ 239.75, 245.32975257803525 ], "wc_questions_avg": [ 118.0, 96.90459225444376 ], "wc_review_avg": [ 559.0, 431.8576154243433 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 7, 0 ], 
"corr_rating_confidence": -0.3333333333333333, "gs_citation": 9, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=3981051923048782917&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 0, "aff_unique_index": "0;1;2;3;4;1;1", "aff_unique_norm": "Hong Kong University of Science and Technology;University of Washington;Xi'an Jiao Tong University;University of Notre Dame;Carnegie Mellon University", "aff_unique_dep": ";;;;", "aff_unique_url": "https://www.ust.hk;https://www.washington.edu;https://www.xjtu.edu.cn;https://www.nd.edu;https://www.cmu.edu", "aff_unique_abbr": "HKUST;UW;XJTU;Notre Dame;CMU", "aff_campus_unique_index": "0;2", "aff_campus_unique": "Hong Kong SAR;;Seattle", "aff_country_unique_index": "0;1;0;1;1;1;1", "aff_country_unique": "China;United States" }, { "title": "A Variational Perspective on Solving Inverse Problems with Diffusion Models", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19583", "id": "1YO4EE3SPB", "author_site": "Morteza Mardani, Jiaming Song, Jan Kautz, Arash Vahdat", "tldr": "", "abstract": "Diffusion models have emerged as a key pillar of foundation models in visual domains. One of their critical applications is to universally solve different downstream inverse tasks via a single diffusion prior without re-training for each task. Most inverse tasks can be formulated as inferring a posterior distribution over data (e.g., a full image) given a measurement (e.g., a masked image). This is however challenging in diffusion models since the nonlinear and iterative nature of the diffusion process renders the posterior intractable. To cope with this challenge, we propose a variational approach that by design seeks to approximate the true posterior distribution. We show that our approach naturally leads to regularization by denoising diffusion process (RED-diff) where denoisers at different timesteps concurrently impose different structural constraints over the image. To gauge the contribution of denoisers from different timesteps, we propose a weighting mechanism based on signal-to-noise-ratio (SNR). Our approach provides a new variational perspective for solving inverse problems with diffusion models, allowing us to formulate sampling as stochastic optimization, where one can simply apply off-the-shelf solvers with lightweight iterates. Our experiments for various linear and nonlinear image restoration tasks demonstrate the strengths of our method compared with state-of-the-art sampling-based diffusion models. 
The code is available online \\footnote{\\url{https://github.com/NVlabs/RED-diff}}.", "keywords": "diffusion models;score matching;variational approximation;regularization by denoising;inverse problems", "primary_area": "generative models", "supplementary_material": "", "author": "Morteza Mardani;Jiaming Song;Jan Kautz;Arash Vahdat", "authorids": "~Morteza_Mardani1;~Jiaming_Song1;~Jan_Kautz1;~Arash_Vahdat3", "gender": "M;M;;M", "homepage": "http://web.stanford.edu/~morteza/;http://tsong.me;http://jankautz.com;http://latentspace.cc/", "dblp": "74/258;173/5104;48/6214;92/8108", "google_scholar": "H7edsyEAAAAJ;;P9FclNEAAAAJ;https://scholar.google.ca/citations?user=p9-nlRIAAAAJ", "orcid": ";;;", "linkedin": ";jiamings/;;", "or_profile": "~Morteza_Mardani1;~Jiaming_Song1;~Jan_Kautz1;~Arash_Vahdat3", "aff": ";Luma AI;NVIDIA;NVIDIA", "aff_domain": ";lumalabs.ai;nvidia.com;nvidia.com", "position": ";Chief Scientist;VP Research;Research Scientist", "bibtex": "@inproceedings{\nmardani2024a,\ntitle={A Variational Perspective on Solving Inverse Problems with Diffusion Models},\nauthor={Morteza Mardani and Jiaming Song and Jan Kautz and Arash Vahdat},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=1YO4EE3SPB}\n}", "github": "", "project": "", "reviewers": "5Auf;RLDf;Qren;xtWM", "pdf_size": 19747124, "rating": "5;5;6;6", "confidence": "4;4;3;5", "soundness": "2;2;3;3", "contribution": "3;3;3;3", "presentation": "2;3;3;3", "wc_summary": "87;64;45;79", "wc_strengths": "76;76;58;37", "wc_weaknesses": "142;321;88;400", "wc_questions": "791;36;135;24", "wc_review": "1096;497;326;540", "wc_reply_reviewers": "0;222;0;0", "wc_reply_authors": "797;699;499;723", "reply_reviewers": "0;1;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 5.5, 0.5 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 68.75, 16.005858302509115 ], "wc_strengths_avg": [ 61.75, 16.068213964221414 ], "wc_weaknesses_avg": [ 237.75, 127.3270886339588 ], "wc_questions_avg": [ 246.5, 317.3046643212167 ], "wc_review_avg": [ 614.75, 289.1499394777734 ], "wc_reply_reviewers_avg": [ 55.5, 96.12881982007269 ], "wc_reply_authors_avg": [ 679.5, 110.29392549002868 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 116, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=8814413069022914272&as_sdt=5,48&sciodt=0,48&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=1YO4EE3SPB", "pdf": "https://openreview.net/pdf?id=1YO4EE3SPB", "email": ";lumalabs.ai;nvidia.com;nvidia.com", "author_num": 4, "aff_unique_index": "0;1;1", "aff_unique_norm": "Luma AI;NVIDIA", "aff_unique_dep": ";NVIDIA Corporation", "aff_unique_url": "https://www.luma.ai;https://www.nvidia.com", "aff_unique_abbr": "Luma AI;NVIDIA", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "title": "Defining Expertise: Applications to Treatment Effect Estimation", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19582", "id": "1YPfmglNRU", "author_site": "Alihan H\u00fcy\u00fck, Qiyao Wei, Alicia Curth, Mihaela van der Schaar", "tldr": "", "abstract": "Decision-makers are often experts of their 
domain and take actions based on their domain knowledge. Doctors, for instance, may prescribe treatments by predicting the likely outcome of each available treatment. Actions of an expert thus naturally encode part of their domain knowledge, and can help make inferences within the same domain: Knowing doctors try to prescribe the best treatment for their patients, we can tell treatments prescribed more frequently are likely to be more effective. Yet in machine learning, the fact that most decision-makers are experts is often overlooked, and \u201cexpertise\u201d is seldom leveraged as an inductive bias. This is especially true for the literature on treatment effect estimation, where often the only assumption made about actions is that of overlap. In this paper, we argue that expertise\u2014particularly the type of expertise the decision-makers of a domain are likely to have\u2014can be informative in designing and selecting methods for treatment effect estimation. We formally define two types of expertise, predictive and prognostic, and demonstrate empirically that: (i) the prominent type of expertise in a domain significantly influences the performance of different methods in treatment effect estimation, and (ii) it is possible to predict the type of expertise present in a dataset, which can provide a quantitative basis for model selection.", "keywords": "expertise;model selection;balancing representations;treatment effect estimation", "primary_area": "causal reasoning", "supplementary_material": "", "author": "Alihan H\u00fcy\u00fck;Qiyao Wei;Alicia Curth;Mihaela van der Schaar", "authorids": "~Alihan_H\u00fcy\u00fck1;~Qiyao_Wei1;~Alicia_Curth1;~Mihaela_van_der_Schaar2", "gender": ";M;F;F", "homepage": ";https://qiyaowei.github.io;;https://www.vanderschaar-lab.com", "dblp": "227/2296;327/3121;261/8064;", "google_scholar": "EMq6KwMAAAAJ;;eWRBqsYAAAAJ;DZ3S--MAAAAJ", "orcid": ";;;", "linkedin": ";qiyaowei;;", "or_profile": "~Alihan_H\u00fcy\u00fck1;~Qiyao_Wei1;~Alicia_Curth1;~Mihaela_van_der_Schaar2", "aff": "University of Cambridge;University of Cambridge;University of Cambridge;University of California, Los Angeles", "aff_domain": "cam.ac.uk;cam.ac.uk;cam.ac.uk;ucla.edu", "position": "PhD student;PhD student;PhD student;Full Professor", "bibtex": "@inproceedings{\nh{\\\"u}y{\\\"u}k2024defining,\ntitle={Defining Expertise: Applications to Treatment Effect Estimation},\nauthor={Alihan H{\\\"u}y{\\\"u}k and Qiyao Wei and Alicia Curth and Mihaela van der Schaar},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=1YPfmglNRU}\n}", "github": "", "project": "", "reviewers": "ScD8;7Wu5;uYNJ;obyv", "pdf_size": 425361, "rating": "5;6;8;8", "confidence": "2;2;4;3", "soundness": "4;2;4;2", "contribution": "1;3;3;3", "presentation": "2;3;3;4", "wc_summary": "211;143;161;227", "wc_strengths": "65;80;71;71", "wc_weaknesses": "218;8;190;118", "wc_questions": "106;259;130;153", "wc_review": "600;490;552;569", "wc_reply_reviewers": "0;0;35;36", "wc_reply_authors": "585;724;964;899", "reply_reviewers": "0;0;1;1", "reply_authors": "1;1;3;3", "rating_avg": [ 6.75, 1.299038105676658 ], "confidence_avg": [ 2.75, 0.82915619758885 ], "soundness_avg": [ 3.0, 1.0 ], "contribution_avg": [ 2.5, 0.8660254037844386 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 185.5, 34.565155865408734 ], "wc_strengths_avg": [ 71.75, 5.356071321407137 ], "wc_weaknesses_avg": [ 133.5, 81.12182197164952 ], "wc_questions_avg": [ 
162.0, 58.41660722773961 ], "wc_review_avg": [ 552.75, 40.10844674130376 ], "wc_reply_reviewers_avg": [ 17.75, 17.75352077758099 ], "wc_reply_authors_avg": [ 793.0, 148.74642852855325 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 2.0, 1.0 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.8703882797784892, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=1782251837120903391&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=1YPfmglNRU", "pdf": "https://openreview.net/pdf?id=1YPfmglNRU", "email": "cam.ac.uk;cam.ac.uk;cam.ac.uk;ucla.edu", "author_num": 4, "aff_unique_index": "0;0;0;1", "aff_unique_norm": "University of Cambridge;University of California, Los Angeles", "aff_unique_dep": ";", "aff_unique_url": "https://www.cam.ac.uk;https://www.ucla.edu", "aff_unique_abbr": "Cambridge;UCLA", "aff_campus_unique_index": "0;0;0;1", "aff_campus_unique": "Cambridge;Los Angeles", "aff_country_unique_index": "0;0;0;1", "aff_country_unique": "United Kingdom;United States" }, { "id": "1YSJW69CFQ", "title": "Enhancing Machine Learning System Reliability in Healthcare through Uncertainty Estimation and Multi-Modal Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "It is crucial to ensure the dependability of machine learning (ML) systems, especially in areas where safety is a top priority, like healthcare. A tried-and-true method for highlighting the reliability of ML systems during deployment is uncertainty estimation. By successfully using integrated feature sets, sequential and parallel ensemble algorithms have both shown improved ML system performance in multi-modal contexts. We provide Uncertainty-Receptive fusing (URF), a cutting-edge technique that uses uncertainty estimations to improve the fusing of predictions from several base learners. URF, which successively modifies the weighting of the loss function during training in contrast to conventional boosting techniques, is especially successful for multi-modal learning tasks. In order to understand how noise and spatial transformations affect image-based activities, we then offer an image acquisition model that takes these aspects into consideration. We can make predictions with greater accuracy utilizing latent variables thanks to this approach. To quantify uncertainty at the pixel and structure/lesion levels, we use entropy-based uncertainty assessment (EUA). EUA measures the variety within prediction distributions and provides insightful information about the model's confidence. 
We also present Gnostic Uncertainty Estimation (GUE), which quantifies the model's lack of knowledge regarding the result and helps to comprehend the accuracy of the prediction.", "keywords": "Gnostic Uncertainty Estimation; Machine Learning Reliability; Uncertainty Estimation; Healthcare", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Saeed Iqbal Khattak;Adnan Nabeel Qureshi;khalid javeed;Khursheed Aurangzeb", "authorids": "~Saeed_Iqbal_Khattak1;~Adnan_Nabeel_Qureshi1;~khalid_javeed1;~Khursheed_Aurangzeb1", "gender": "M;M;;M", "homepage": ";;;https://faculty.ksu.edu.sa/en/kaurangzeb", "dblp": ";;;214/8964.html", "google_scholar": "https://scholar.google.com.pk/citations?user=Cj7u9FkAAAAJ;https://scholar.google.co.uk/citations?hl=en;https://scholar.google.com.pk/citations?user=GPJb34wAAAAJ;GBkDDr0AAAAJ", "orcid": ";;;0000-0003-3647-8578", "linkedin": "saeed-iqbal-32748b36;;;", "or_profile": "~Saeed_Iqbal_Khattak1;~Adnan_Nabeel_Qureshi1;~khalid_javeed1;~Khursheed_Aurangzeb1", "aff": "University of Central Punjab, Lahore;Birmingham Newman University, UK;University of Sharjah;", "aff_domain": "ucp.edu.pk;newman.ac.uk;sharja.ac.ae;", "position": "PhD student;Associate Professor;Assistant Professor;", "bibtex": "@misc{\nkhattak2024enhancing,\ntitle={Enhancing Machine Learning System Reliability in Healthcare through Uncertainty Estimation and Multi-Modal Learning},\nauthor={Saeed Iqbal Khattak and Adnan Nabeel Qureshi and khalid javeed and Khursheed Aurangzeb},\nyear={2024},\nurl={https://openreview.net/forum?id=1YSJW69CFQ}\n}", "github": "", "project": "", "reviewers": "fEUv;fQud;8rRf", "site": "https://openreview.net/forum?id=1YSJW69CFQ", "pdf_size": 2495881, "rating": "1;1;3", "confidence": "4;4;3", "soundness": "1;1;2", "contribution": "1;1;2", "presentation": "1;1;2", "wc_summary": "42;97;76", "wc_strengths": "20;12;85", "wc_weaknesses": "446;1071;128", "wc_questions": "46;78;8", "wc_review": "554;1258;297", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 1.6666666666666667, 0.9428090415820634 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 1.3333333333333333, 0.4714045207910317 ], "contribution_avg": [ 1.3333333333333333, 0.4714045207910317 ], "presentation_avg": [ 1.3333333333333333, 0.4714045207910317 ], "wc_summary_avg": [ 71.66666666666667, 22.661764175711376 ], "wc_strengths_avg": [ 39.0, 32.69046751985457 ], "wc_weaknesses_avg": [ 548.3333333333334, 391.71957089507566 ], "wc_questions_avg": [ 44.0, 28.61235164516658 ], "wc_review_avg": [ 703.0, 406.22735834341177 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.9999999999999997, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:QI2IB2ndglsJ:scholar.google.com/&scioq=Enhancing+Machine+Learning+System+Reliability+in+Healthcare+through+Uncertainty+Estimation+and+Multi-Modal+Learning&hl=en&as_sdt=0,44", "gs_version_total": 0, "aff_unique_index": "0;1;2", "aff_unique_norm": "University of Central Punjab;Birmingham Newman University;University of Sharjah", "aff_unique_dep": ";;", "aff_unique_url": "https://ucp.edu.pk;https://www.birminghamnewman.ac.uk;https://www.sharjah.ac.ae", "aff_unique_abbr": "UCP;;UOS", "aff_campus_unique_index": "0", "aff_campus_unique": 
"Lahore;", "aff_country_unique_index": "0;1;2", "aff_country_unique": "Pakistan;United Kingdom;United Arab Emirates" }, { "id": "1Yq7zIOfj0", "title": "On the Similarity between Attention and SVM on the Token Separation and Selection Behavior", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "The attention mechanism underpinning the transformer architecture is effective in learning the token interaction within a sequence via softmax similarity. However, the current theoretical understanding on optimization dynamics of the softmax attention is insufficient in characterizing how attention performs intrinsic token separation and selection, which is crucial to sequence-level understanding tasks. On the other hand, support vector machines have been well-studied of its max-margin separation behaviour. In this paper, we will formulate the softmax attention convergence dynamics as hard-margin SVM optimization problem. We adopt a tensor trick to formulate the matrix-based attention optimization problem and relax the strong assumptions on the derivative of the loss function from the prior works. As a result, we demonstrate that gradient descent converges to the optimal solution for SVM. In addition, we show softmax is more stable than other linear attention through analysis on their lipschitz. Our theoretical insights are validated through numerical experiments, shedding insights on the convergence dynamics of softmax attention as the foundational stones on the success of the large language models.", "keywords": "Transformer;SVM;Convergence Dynamics;Optimization", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/7a95412f2c91452c08645bde982129c1aa02e9ef.pdf", "author": "Beidi Chen;Wentao Guo;Zhihang Li;Zhao Song;Tianyi Zhou", "authorids": "~Beidi_Chen1;~Wentao_Guo1;~Zhihang_Li2;~Zhao_Song3;~Tianyi_Zhou4", "gender": "F;M;M;M;", "homepage": "https://www.andrew.cmu.edu/user/beidic/;http://wentaoguo.me/;https://dblp.org/pid/122/5633.html;https://www.youtube.com/@zhaosong2031;", "dblp": "192/1339;;122/5633;76/4051-2;", "google_scholar": ";7uHQMsYAAAAJ;Y9Rafe8AAAAJ;yDZct7UAAAAJ;", "orcid": ";;;;", "linkedin": ";wentao-guo-11b03217b/;zhihang-li-90a888332/;;", "or_profile": "~Beidi_Chen1;~Wentao_Guo1;~Zhihang_Li2;~Zhao_Song3;~Tianyi_Zhou4", "aff": "Meta Facebook;Department of Computer Science, Princeton University;Huazhong Agricultural University;Adobe;", "aff_domain": "fb.com;cs.princeton.edu;hzau.edu.cn;adobe.com;", "position": "Researcher;PhD student;Undergrad student;Researcher;", "bibtex": "@misc{\nchen2024on,\ntitle={On the Similarity between Attention and {SVM} on the Token Separation and Selection Behavior},\nauthor={Beidi Chen and Wentao Guo and Zhihang Li and Zhao Song and Tianyi Zhou},\nyear={2024},\nurl={https://openreview.net/forum?id=1Yq7zIOfj0}\n}", "github": "", "project": "", "reviewers": "", "site": "https://openreview.net/forum?id=1Yq7zIOfj0", "pdf_size": 1150423, "rating": "", "confidence": "", "soundness": "", "contribution": "", "presentation": "", "wc_summary": "", "wc_strengths": "", "wc_weaknesses": "", "wc_questions": "", "wc_review": "", "wc_reply_reviewers": "", "wc_reply_authors": "", "reply_reviewers": "", "reply_authors": "", "rating_avg": [ 0, 0 ], "confidence_avg": [ 0, 0 ], "soundness_avg": [ 0, 0 ], "contribution_avg": [ 0, 0 ], "presentation_avg": [ 0, 0 ], "wc_summary_avg": [ 0, 0 ], "wc_strengths_avg": [ 0, 0 ], "wc_weaknesses_avg": [ 0, 0 ], "wc_questions_avg": 
[ 0, 0 ], "wc_review_avg": [ 0, 0 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 0, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:FJGDc5dQKwYJ:scholar.google.com/&scioq=On+the+Similarity+between+Attention+and+SVM+on+the+Token+Separation+and+Selection+Behavior&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1;2;3", "aff_unique_norm": "Meta;Princeton University;Huazhong Agricultural University;Adobe", "aff_unique_dep": "Meta Platforms, Inc.;Department of Computer Science;;Adobe Inc.", "aff_unique_url": "https://meta.com;https://www.princeton.edu;http://www.hzau.edu.cn/;https://www.adobe.com", "aff_unique_abbr": "Meta;Princeton;HAU;Adobe", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;1;0", "aff_country_unique": "United States;China" }, { "id": "1armpjgh8L", "title": "Adaptive Hierarchical Certification for Semantic Segmentation using Randomized Smoothing", "track": "main", "status": "Reject", "tldr": "", "abstract": "Common certification methods operate on a flat pre-defined set of fine-grained classes. In this paper, however, we propose a novel, more general, and practical setting, namely adaptive hierarchical certification for image semantic segmentation. In this setting, the certification can be within a multi-level hierarchical label space composed of fine to coarse levels. Unlike classic methods where the certification would abstain for unstable components, our approach adaptively relaxes the certification to a coarser level within the hierarchy. This relaxation lowers the abstain rate whilst providing more certified semantically meaningful information. We mathematically formulate the problem setup and introduce, for the first time, an adaptive hierarchical certification algorithm for image semantic segmentation, that certifies image pixels within a hierarchy and prove the correctness of its guarantees. Since certified accuracy does not take the loss of information into account when traversing into a coarser hierarchy level, we introduce a novel evaluation paradigm for adaptive hierarchical certification, namely the certified information gain metric, which is proportional to the class granularity level. 
Our evaluation experiments on real-world challenging datasets such as Cityscapes and ACDC demonstrate that our adaptive algorithm achieves a higher certified information gain and a lower abstain rate compared to the current state-of-the-art certification method, as well as other non-adaptive versions of it.", "keywords": "certification for segmentation;image semantic segmentation;hierarchical certification;certification for machine learning;certified robustness", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "Alaa Anani;Tobias Lorenz;Mario Fritz;Bernt Schiele", "authorids": "~Alaa_Anani1;~Tobias_Lorenz1;~Mario_Fritz1;~Bernt_Schiele1", "gender": "F;M;M;M", "homepage": "https://www.mpi-inf.mpg.de/departments/computer-vision-and-machine-learning/people/alaa-anani;https://www.t-lorenz.com/;https://cispa.saarland/group/fritz/;http://www.mpi-inf.mpg.de/~schiele", "dblp": "368/7744;25/6006-2;;s/BerntSchiele", "google_scholar": "eJgMcksAAAAJ;gf-aMd0AAAAJ;https://scholar.google.de/citations?user=4V1nNm4AAAAJ;https://scholar.google.de/citations?user=z76PBfYAAAAJ", "orcid": ";0000-0003-4369-2644;;0000-0001-9683-5237", "linkedin": "aaanani/;;;", "or_profile": "~Alaa_Anani1;~Tobias_Lorenz1;~Mario_Fritz1;~Bernt_Schiele1", "aff": "Saarland Informatics Campus, Max-Planck Institute;CISPA Helmholtz Center for Information Security;Saarland University;Max Planck Institute for Informatics, Saarland Informatics Campus", "aff_domain": "mpi-inf.mpg.de;cispa.de;uni-saarland.de;mpi-inf.mpg.de", "position": "MS student;PhD student;Full Professor;Full Professor", "bibtex": "@misc{\nanani2024adaptive,\ntitle={Adaptive Hierarchical Certification for Semantic Segmentation using Randomized Smoothing},\nauthor={Alaa Anani and Tobias Lorenz and Mario Fritz and Bernt Schiele},\nyear={2024},\nurl={https://openreview.net/forum?id=1armpjgh8L}\n}", "github": "", "project": "", "reviewers": "riuJ;2yaR;dRWJ;bW5R", "site": "https://openreview.net/forum?id=1armpjgh8L", "pdf_size": 44746158, "rating": "3;3;3;6", "confidence": "4;3;3;1", "soundness": "2;2;2;2", "contribution": "3;1;2;2", "presentation": "3;2;2;2", "wc_summary": "72;46;57;51", "wc_strengths": "71;13;34;22", "wc_weaknesses": "223;35;269;47", "wc_questions": "86;12;5;54", "wc_review": "452;106;365;174", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "463;226;777;64", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 3.75, 1.299038105676658 ], "confidence_avg": [ 2.75, 1.0897247358851685 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 56.5, 9.759610647971568 ], "wc_strengths_avg": [ 35.0, 22.079402165819616 ], "wc_weaknesses_avg": [ 143.5, 103.86890776358439 ], "wc_questions_avg": [ 39.25, 32.85859857023729 ], "wc_review_avg": [ 274.25, 139.81125669988094 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 382.5, 268.34911961845523 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 10, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.9271726499455307, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:6aYZVWoVhQIJ:scholar.google.com/&scioq=Adaptive+Hierarchical+Certification+for+Semantic+Segmentation+using+Randomized+Smoothing&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1;2;3", "aff_unique_norm": "Max-Planck Institute;CISPA Helmholtz Center for 
Information Security;Saarland University;Max Planck Institute for Informatics", "aff_unique_dep": "Informatics;;;", "aff_unique_url": "https://www.mpi-sws.org;https://www.cispa.de/;https://www.uni-saarland.de;https://mpi-inf.mpg.de", "aff_unique_abbr": "MPI-SWS;CISPA;UdS;MPII", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Saarland;", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "Germany" }, { "title": "DreamTime: An Improved Optimization Strategy for Diffusion-Guided 3D Generation", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19581", "id": "1bAUywYJTU", "author_site": "Yukun Huang, Jianan Wang, Yukai Shi, Boshi Tang, Xianbiao Qi, Lei Zhang", "tldr": "", "abstract": "Text-to-image diffusion models pre-trained on billions of image-text pairs have recently enabled 3D content creation by optimizing a randomly initialized differentiable 3D representation with score distillation. However, the optimization process suffers from slow convergence and the resultant 3D models often exhibit two limitations: (a) quality concerns such as missing attributes and distorted shape and texture; (b) extremely low diversity compared to text-guided image synthesis. In this paper, we show that the conflict between the 3D optimization process and uniform timestep sampling in score distillation is the main reason for these limitations. To resolve this conflict, we propose to prioritize timestep sampling with monotonically non-increasing functions, which aligns the 3D optimization process with the sampling process of the diffusion model. Extensive experiments show that our simple redesign significantly improves 3D content creation with faster convergence, better quality and diversity.", "keywords": "Score Distillation;3D Content Creation;Diffusion Model", "primary_area": "generative models", "supplementary_material": "", "author": "Yukun Huang;Jianan Wang;Yukai Shi;Boshi Tang;Xianbiao Qi;Lei Zhang", "authorids": "~Yukun_Huang1;~Jianan_Wang2;~Yukai_Shi3;~Boshi_Tang1;~Xianbiao_Qi2;~Lei_Zhang23", "gender": "M;F;;M;M;M", "homepage": ";https://scholar.google.com/citations?user=mt5mvZ8AAAAJ&hl=en;https://shiyukai26.github.io/info/;https://github.com/TangYucopper;https://www.linkedin.com/in/xianbiao-qi-39617727/;https://www.leizhang.org/", "dblp": "186/1316;49/6053,;;;118/3741;z/LeiZhang", "google_scholar": "lHb5gzoAAAAJ;mt5mvZ8AAAAJ;oQXfkSQAAAAJ;;odjSydQAAAAJ;fIlGZToAAAAJ", "orcid": "0000-0002-5322-2884;;;;;", "linkedin": ";;;;;", "or_profile": "~Yukun_Huang1;~Jianan_Wang2;~Yukai_Shi3;~Boshi_Tang1;~Xianbiao_Qi2;~Lei_Zhang1", "aff": "University of Hong Kong;International Digital Economy Academy (IDEA);Tsinghua University;Tsinghua University;International Digital Economy Academy;International Digital Economy Academy", "aff_domain": "hku.hk;idea.edu.cn;mail.tsinghua.edu.cn;mails.tsinghua.edu.cn;idea.edu.cn;idea.edu.cn", "position": "Postdoc;Researcher;PhD student;MS student;Researcher;Chief Scientist", "bibtex": "@inproceedings{\nhuang2024dreamtime,\ntitle={DreamTime: An Improved Optimization Strategy for Diffusion-Guided 3D Generation},\nauthor={Yukun Huang and Jianan Wang and Yukai Shi and Boshi Tang and Xianbiao Qi and Lei Zhang},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=1bAUywYJTU}\n}", "github": "", "project": "", "reviewers": "zkfR;5Rpq;DnQ9;iLxc", "pdf_size": 9084391, "rating": "3;6;6;8", "confidence": "4;5;4;4", "soundness": "3;3;4;3", "contribution": "2;3;3;3",
"presentation": "3;3;4;4", "wc_summary": "112;131;61;67", "wc_strengths": "24;74;115;110", "wc_weaknesses": "152;85;99;104", "wc_questions": "26;216;37;26", "wc_review": "314;506;312;307", "wc_reply_reviewers": "0;0;0;16", "wc_reply_authors": "549;626;212;226", "reply_reviewers": "0;0;0;1", "reply_authors": "1;1;1;1", "rating_avg": [ 5.75, 1.7853571071357126 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.5, 0.5 ], "wc_summary_avg": [ 92.75, 29.600464523382062 ], "wc_strengths_avg": [ 80.75, 36.38251640554842 ], "wc_weaknesses_avg": [ 110.0, 25.228951623085727 ], "wc_questions_avg": [ 76.25, 80.80957554646602 ], "wc_review_avg": [ 359.75, 84.47595811827173 ], "wc_reply_reviewers_avg": [ 4.0, 6.928203230275509 ], "wc_reply_authors_avg": [ 403.25, 186.31609565466962 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.08084520834544431, "gs_citation": 22, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5988579552726499121&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=1bAUywYJTU", "pdf": "https://openreview.net/pdf?id=1bAUywYJTU", "email": "hku.hk;idea.edu.cn;mail.tsinghua.edu.cn;mails.tsinghua.edu.cn;idea.edu.cn;idea.edu.cn", "author_num": 6, "aff_unique_index": "0;1;2;2;1;1", "aff_unique_norm": "University of Hong Kong;International Digital Economy Academy;Tsinghua University", "aff_unique_dep": ";;", "aff_unique_url": "https://www.hku.hk;;https://www.tsinghua.edu.cn", "aff_unique_abbr": "HKU;IDEA;THU", "aff_campus_unique_index": "0", "aff_campus_unique": "Hong Kong SAR;", "aff_country_unique_index": "0;0;0", "aff_country_unique": "China;" }, { "title": "I-PHYRE: Interactive Physical Reasoning", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19580", "id": "1bbPQShCT2", "author_site": "Shiqian Li, Kewen Wu, Chi Zhang, Yixin Zhu", "tldr": "", "abstract": "Current evaluation protocols predominantly assess physical reasoning in stationary scenes, creating a gap in evaluating agents' abilities to interact with dynamic events. While contemporary methods allow agents to modify initial scene configurations and observe consequences, they lack the capability to interact with events in real time. To address this, we introduce I-PHYRE, a framework that challenges agents to simultaneously exhibit intuitive physical reasoning, multi-step planning, and in-situ intervention. Here, intuitive physical reasoning refers to a quick, approximate understanding of physics to address complex problems; multi-step denotes the need for extensive sequence planning in I-PHYRE, considering each intervention can significantly alter subsequent choices; and in-situ implies the necessity for timely object manipulation within a scene, where minor timing deviations can result in task failure. We formulate four game splits to scrutinize agents' learning and generalization of essential principles of interactive physical reasoning, fostering learning through interaction with representative scenarios. Our exploration involves three planning strategies and examines several supervised and reinforcement agents' zero-shot generalization proficiency on I-PHYRE. 
The outcomes highlight a notable gap between existing learning algorithms and human performance, emphasizing the imperative for more research in enhancing agents with interactive physical reasoning capabilities. The environment and baselines will be made publicly available.", "keywords": "Intuitive physics;physical reasoning", "primary_area": "datasets and benchmarks", "supplementary_material": "/attachment/bf4202ce3dfc8cb3a1fdecda0c659cf93a36497d.zip", "author": "Shiqian Li;Kewen Wu;Chi Zhang;Yixin Zhu", "authorids": "~Shiqian_Li1;~Kewen_Wu2;~Chi_Zhang12;~Yixin_Zhu1", "gender": ";F;;M", "homepage": ";https://github.com/k101w;;https://yzhu.io/", "dblp": ";20/9169-4;;91/1103-1.html", "google_scholar": ";9zPBJE4AAAAJ;;qG9l6JEAAAAJ", "orcid": ";;;0000-0001-7024-1545", "linkedin": ";;;", "or_profile": "~Shiqian_Li1;~Kewen_Wu2;~Chi_Zhang12;~Yixin_Zhu1", "aff": ";Carnegie Mellon University;;Peking University", "aff_domain": ";andrew.cmu.edu;;pku.edu.cn", "position": ";MS student;;Assistant Professor", "bibtex": "@inproceedings{\nli2024iphyre,\ntitle={I-{PHYRE}: Interactive Physical Reasoning},\nauthor={Shiqian Li and Kewen Wu and Chi Zhang and Yixin Zhu},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=1bbPQShCT2}\n}", "github": "", "project": "", "reviewers": "PPjJ;p9BE;BYPY;yzoQ", "pdf_size": 1092524, "rating": "6;6;6;8", "confidence": "4;3;4;4", "soundness": "3;3;3;3", "contribution": "3;2;3;3", "presentation": "3;3;2;3", "wc_summary": "142;45;199;106", "wc_strengths": "96;48;256;126", "wc_weaknesses": "338;109;680;143", "wc_questions": "151;3;98;95", "wc_review": "727;205;1233;470", "wc_reply_reviewers": "97;17;0;24", "wc_reply_authors": "784;149;404;230", "reply_reviewers": "1;1;0;1", "reply_authors": "1;1;1;1", "rating_avg": [ 6.5, 0.8660254037844386 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 123.0, 55.924055646921744 ], "wc_strengths_avg": [ 131.5, 77.07626093681505 ], "wc_weaknesses_avg": [ 317.5, 226.79781744981585 ], "wc_questions_avg": [ 86.75, 53.237087636346146 ], "wc_review_avg": [ 658.75, 379.4524838500863 ], "wc_reply_reviewers_avg": [ 34.5, 37.12478956169314 ], "wc_reply_authors_avg": [ 391.75, 244.48964702007322 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.3333333333333333, "gs_citation": 5, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=9770961054998957492&as_sdt=5,48&sciodt=0,48&hl=en", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=1bbPQShCT2", "pdf": "https://openreview.net/pdf?id=1bbPQShCT2", "email": ";andrew.cmu.edu;;pku.edu.cn", "author_num": 4, "aff_unique_index": "0;1", "aff_unique_norm": "Carnegie Mellon University;Peking University", "aff_unique_dep": ";", "aff_unique_url": "https://www.cmu.edu;http://www.pku.edu.cn", "aff_unique_abbr": "CMU;Peking U", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1", "aff_country_unique": "United States;China" }, { "title": "ReSimAD: Zero-Shot 3D Domain Transfer for Autonomous Driving with Source Reconstruction and Target Simulation", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19579", "id": "1d2cLKeNgY", "author_site": "Bo Zhang, Xinyu Cai, Jiakang Yuan, 
Donglin Yang, Jianfei Guo, Xiangchao Yan, Renqiu Xia, Botian Shi, Min Dou, Tao Chen, Si Liu, Junchi Yan, Yu Qiao", "tldr": "", "abstract": "Domain shifts such as sensor type changes and geographical situation variations are prevalent in Autonomous Driving (AD), which poses a challenge since AD model relying on the previous domain knowledge can be hardly directly deployed to a new domain without additional costs. In this paper, we provide a new perspective and approach of alleviating the domain shifts, by proposing a Reconstruction-Simulation-Perception (ReSimAD) scheme. Specifically, the implicit reconstruction process is based on the knowledge from the previous old domain, aiming to convert the domain-related knowledge into domain-invariant representations, e.g., 3D scene-level meshes. Besides, the point clouds simulation process of multiple new domains is conditioned on the above reconstructed 3D meshes, where the target-domain-like simulation samples can be obtained, thus reducing the cost of collecting and annotating new-domain data for the subsequent perception process. For experiments, we consider different cross-domain situations such as Waymo-to-KITTI, Waymo-to-nuScenes, etc, to verify the zero-shot target-domain perception using ReSimAD. Results demonstrate that our method is beneficial to boost the domain generalization ability, even promising for 3D pre-training. Code and simulated points are available at: https://github.com/PJLab-ADG/3DTrans", "keywords": "Autonomous Driving;3D Domain Transfer;Zero-shot 3D Detection", "primary_area": "applications to robotics, autonomy, planning", "supplementary_material": "/attachment/84f21850a271ea5b6dcfea958210801e97bfa51a.zip", "author": "Bo Zhang;Xinyu Cai;Jiakang Yuan;Donglin Yang;Jianfei Guo;Xiangchao Yan;Renqiu Xia;Botian Shi;Min Dou;Tao Chen;Si Liu;Junchi Yan;Yu Qiao", "authorids": "~Bo_Zhang17;~Xinyu_Cai2;~Jiakang_Yuan1;~Donglin_Yang3;~Jianfei_Guo1;~Xiangchao_Yan1;~Renqiu_Xia2;~Botian_Shi1;~Min_Dou1;~Tao_Chen6;~Si_Liu5;~Junchi_Yan2;~Yu_Qiao1", "gender": "M;;M;M;M;;;M;M;M;F;;", "homepage": "https://bobrown.github.io/boZhang.github.io/;;https://jiakangyuan.github.io/;https://github.com/puffyyy;https://ventusff.github.io;https://github.com/sky-fly97;;;;https://eetchen.github.io/;https://colalab.net;;", "dblp": "36/2259-69;;323/7363;;305/7388.html;314/2496.html;;245/8742;;69/510-3;60/7642;;", "google_scholar": "https://scholar.google.com/citations?hl=en;;https://scholar.google.com/citations?hl=zh-CN;;MJb2_wYAAAAJ;0mMk6PMAAAAJ;;K0PpvLkAAAAJ;;https://scholar.google.com.sg/citations?user=w3OoFL0AAAAJ;https://scholar.google.com/citations?hl=zh-CN;;", "orcid": "0000-0001-8052-782X;0000-0001-8500-9300;;;0000-0002-5838-679X;;;0000-0003-3677-7252;;;0000-0002-9180-2935;;", "linkedin": ";;;;;;;friskit/;%E6%B0%91-%E7%AA%A6-a34b17a3;;;;", "or_profile": "~Bo_Zhang17;~Xinyu_Cai2;~Jiakang_Yuan1;~Donglin_Yang3;~Jianfei_Guo1;~Xiangchao_Yan1;~Renqiu_Xia2;~Botian_Shi1;~Min_Dou1;~Tao_Chen6;~Si_Liu5;~Junchi_Yan2;~Yu_Qiao1", "aff": "Shanghai Artificial Intelligence Laboratory;Shanghai Artificial Intelligence Laboratory;Shanghai AI Laboratory;Shanghai Artificial Intelligence Laboratory;Shanghai Artificial Intelligence Laboratory;Shanghai AI Laboratory;;Shanghai AI Lab;Shanghai AI Laboratory;Fudan University;Beihang University;;", "aff_domain": "pjlab.org.cn;pjlab.org.cn;pjlab.org.cn;pjlab.org.cn;pjlab.org.cn;pjlab.org.cn;;pjlab.org.cn;pjlab.org.cn;fudan.edu.cn;buaa.edu.cn;;", "position": 
"Researcher;Researcher;Intern;Intern;Researcher;Researcher;;Researcher;Researcher;Full Professor;Full Professor;;", "bibtex": "@inproceedings{\nzhang2024resimad,\ntitle={ReSim{AD}: Zero-Shot 3D Domain Transfer for Autonomous Driving with Source Reconstruction and Target Simulation},\nauthor={Bo Zhang and Xinyu Cai and Jiakang Yuan and Donglin Yang and Jianfei Guo and Xiangchao Yan and Renqiu Xia and Botian Shi and Min Dou and Tao Chen and Si Liu and Junchi Yan and Yu Qiao},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=1d2cLKeNgY}\n}", "github": "", "project": "", "reviewers": "bhEL;Fz1j;kWr7;7ZCS", "pdf_size": 12391706, "rating": "5;6;6;6", "confidence": "4;4;3;3", "soundness": "2;3;2;3", "contribution": "2;3;2;3", "presentation": "1;2;1;3", "wc_summary": "90;68;122;84", "wc_strengths": "17;51;17;43", "wc_weaknesses": "167;27;276;266", "wc_questions": "4;141;2;6", "wc_review": "278;287;417;399", "wc_reply_reviewers": "86;0;120;118", "wc_reply_authors": "1816;897;778;1259", "reply_reviewers": "1;0;2;1", "reply_authors": "4;2;2;3", "rating_avg": [ 5.75, 0.4330127018922193 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 1.75, 0.82915619758885 ], "wc_summary_avg": [ 91.0, 19.621416870348583 ], "wc_strengths_avg": [ 32.0, 15.264337522473747 ], "wc_weaknesses_avg": [ 184.0, 100.15737616371547 ], "wc_questions_avg": [ 38.25, 59.33959470707565 ], "wc_review_avg": [ 345.25, 63.15209814408386 ], "wc_reply_reviewers_avg": [ 81.0, 48.67237409455183 ], "wc_reply_authors_avg": [ 1187.5, 403.7960500054452 ], "reply_reviewers_avg": [ 1.0, 0.7071067811865476 ], "reply_authors_avg": [ 2.75, 0.82915619758885 ], "replies_avg": [ 22, 0 ], "authors#_avg": [ 13, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 10, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=1073026491614599340&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=1d2cLKeNgY", "pdf": "https://openreview.net/pdf?id=1d2cLKeNgY", "email": "pjlab.org.cn;pjlab.org.cn;pjlab.org.cn;pjlab.org.cn;pjlab.org.cn;pjlab.org.cn;;pjlab.org.cn;pjlab.org.cn;fudan.edu.cn;buaa.edu.cn;;", "author_num": 13, "aff_unique_index": "0;0;1;0;0;1;2;1;3;4", "aff_unique_norm": "Shanghai Artificial Intelligence Laboratory;Shanghai AI Laboratory;Shanghai AI Lab;Fudan University;Beihang University", "aff_unique_dep": ";;;;", "aff_unique_url": "http://www.shailab.org/;https://www.shanghai-ai-lab.com;https://www.shanghaiailab.com;https://www.fudan.edu.cn;http://www.buaa.edu.cn/", "aff_unique_abbr": "Shanghai AI Lab;SAIL;SAIL;Fudan;BUAA", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0;0;0;0;0", "aff_country_unique": "China" }, { "id": "1dY11GyZdp", "title": "Signed-Binarization: Unlocking Efficiency Through Repetition-Sparsity Trade-Off", "track": "main", "status": "Reject", "tldr": "", "abstract": "Efficient inference of Deep Neural Networks (DNNs) on resource-constrained edge devices is essential. Quantization and sparsity are key algorithmic techniques that translate to repetition and sparsity within tensors at the hardware-software interface. This paper introduces the concept of repetition-sparsity trade-off that helps explain computational efficiency during inference. 
We propose Signed Binarization, a unified co-design framework that synergistically integrates hardware-software systems, quantization functions, and representation learning techniques to address this trade-off. Our results demonstrate that Signed Binarization is more accurate than binary models with the same number of non-zero weights. Detailed analysis indicates that signed binarization generates a smaller distribution of effectual (non-zero) parameters nested within a larger distribution of total parameters, both of the same type, for a DNN block. Finally, our approach achieves a 26\\% speedup on real hardware, doubles energy efficiency, and reduces density by 2.8x compared to binary methods for ResNet 18, presenting an alternative solution for deploying efficient models in resource-limited environments.", "keywords": "Representation Learning;Quantization;DNN Inference", "primary_area": "infrastructure, software libraries, hardware, etc.", "supplementary_material": "", "author": "Sachit Kuhar;Yash Jain;Alexey Tumanov;Sujan Kumar Gonugondla", "authorids": "~Sachit_Kuhar1;~Yash_Jain1;~Alexey_Tumanov1;~Sujan_Kumar_Gonugondla1", "gender": "M;M;;", "homepage": "https://sachitkuhar.github.io/;https://yash-jain.com;;https://gsujankumar.github.io", "dblp": "240/0924;255/2617;;166/6408.html", "google_scholar": "X8slYZEAAAAJ;Fr6QHDsAAAAJ;;F_ud9E4AAAAJ", "orcid": "0000-0002-5739-013X;0000-0002-5175-1352;;0000-0003-4743-6461", "linkedin": ";jinga-lala/;;sujan-kumar-gonugondla-ab6787142/", "or_profile": "~Sachit_Kuhar1;~Yash_Jain1;~Alexey_Tumanov1;~Sujan_Kumar_Gonugondla1", "aff": "Amazon;Microsoft;;Amazon", "aff_domain": "amazon.com;microsoft.com;;amazon.com", "position": "Researcher;Researcher;;Researcher", "bibtex": "@misc{\nkuhar2024signedbinarization,\ntitle={Signed-Binarization: Unlocking Efficiency Through Repetition-Sparsity Trade-Off},\nauthor={Sachit Kuhar and Yash Jain and Alexey Tumanov and Sujan Kumar Gonugondla},\nyear={2024},\nurl={https://openreview.net/forum?id=1dY11GyZdp}\n}", "github": "", "project": "", "reviewers": "ZM5v;pHUD;Ffqa", "site": "https://openreview.net/forum?id=1dY11GyZdp", "pdf_size": 1242248, "rating": "3;5;6", "confidence": "4;3;3", "soundness": "2;3;3", "contribution": "2;2;3", "presentation": "2;2;2", "wc_summary": "53;57;118", "wc_strengths": "10;23;138", "wc_weaknesses": "300;101;296", "wc_questions": "8;85;30", "wc_review": "371;266;582", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "1545;883;598", "reply_reviewers": "0;0;0", "reply_authors": "3;2;2", "rating_avg": [ 4.666666666666667, 1.247219128924647 ], "confidence_avg": [ 3.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.0, 0.0 ], "wc_summary_avg": [ 76.0, 29.743346594938952 ], "wc_strengths_avg": [ 57.0, 57.52101065407897 ], "wc_weaknesses_avg": [ 232.33333333333334, 92.88104698424156 ], "wc_questions_avg": [ 41.0, 32.38312317653544 ], "wc_review_avg": [ 406.3333333333333, 131.40353453727525 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 1008.6666666666666, 396.6915958552969 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 2.3333333333333335, 0.4714045207910317 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.9449111825230683, "gs_citation": 0, "gs_cited_by_link": 
"https://scholar.google.com/scholar?q=related:msxiS4RewesJ:scholar.google.com/&scioq=Signed-Binarization:+Unlocking+Efficiency+Through+Repetition-Sparsity+Trade-Off&hl=en&as_sdt=0,5", "gs_version_total": 3, "aff_unique_index": "0;1;0", "aff_unique_norm": "Amazon;Microsoft", "aff_unique_dep": "Amazon.com, Inc.;Microsoft Corporation", "aff_unique_url": "https://www.amazon.com;https://www.microsoft.com", "aff_unique_abbr": "Amazon;Microsoft", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "1djnGJnaiy", "title": "Unsupervised Representation Learning of Brain Activity via Bridging Voxel Activity and Functional Connectivity", "track": "main", "status": "Reject", "tldr": "", "abstract": "Effective brain representation learning is a key step toward revealing the understanding of cognitive processes and unlocking detecting and potential therapeutic interventions for neurological diseases/disorders. Existing studies have focused on either (1) voxel-level activity, where only a single beta weight for each voxel (i.e., aggregation of voxel activity over a time window) is considered, missing their temporal dynamics, or (2) functional connectivity of the brain in the level of region of interests, missing voxel-level activities. In this paper, we bridge this gap and design BrainMixer, an unsupervised learning framework that effectively utilizes both functional connectivity and associated time series of voxels to learn voxel-level representation in an unsupervised manner. BrainMixer employs two simple yet effective MLP-based encoders to simultaneously learn the dynamics of voxel-level signals and their functional correlations. To encode voxel activity, BrainMixer fuses information across both time and voxel dimensions via a dynamic self-attention mechanism. To learn the structure of the functional connectivity graph, BrainMixer presents a temporal graph patching and encodes each patch by combining its nodes' features via a new adaptive temporal pooling. 
Our experiments show that BrainMixer attains outstanding performance and outperforms 13 baselines in different downstream tasks and experimental setups.", "keywords": "Functional Connectivity;Graph Representation Learning;Anomaly Detection;Brain Representation Learning", "primary_area": "applications to neuroscience & cognitive science", "supplementary_material": "", "author": "Ali Behrouz;Parsa Delavari;Farnoosh Hashemi", "authorids": "~Ali_Behrouz1;~Parsa_Delavari1;~Farnoosh_Hashemi1", "gender": "M;M;F", "homepage": "https://Abehrouz.github.io;;https://farnooshha.github.io/", "dblp": "220/4163;;318/9574", "google_scholar": "UbwVuqIAAAAJ;clef-H4AAAAJ;https://scholar.google.com/citations?hl=en", "orcid": ";;", "linkedin": "ali-behrouz-506aa2127;;farnoosh-hashemi-a48328123/", "or_profile": "~Ali_Behrouz1;~Parsa_Delavari1;~Farnoosh_Hashemi1", "aff": "Cornell University;University of British Columbia;Cornell University", "aff_domain": "cornell.edu;ubc.ca;cornell.edu", "position": "PhD student;PhD student;PhD student", "bibtex": "@misc{\nbehrouz2024unsupervised,\ntitle={Unsupervised Representation Learning of Brain Activity via Bridging Voxel Activity and Functional Connectivity},\nauthor={Ali Behrouz and Parsa Delavari and Farnoosh Hashemi},\nyear={2024},\nurl={https://openreview.net/forum?id=1djnGJnaiy}\n}", "github": "", "project": "", "reviewers": "JxFN;v3MT;WgDG", "site": "https://openreview.net/forum?id=1djnGJnaiy", "pdf_size": 5259198, "rating": "3;6;6", "confidence": "4;3;4", "soundness": "2;3;2", "contribution": "2;3;3", "presentation": "1;3;2", "wc_summary": "103;81;101", "wc_strengths": "30;34;21", "wc_weaknesses": "630;579;541", "wc_questions": "2;157;11", "wc_review": "765;851;674", "wc_reply_reviewers": "0;33;745", "wc_reply_authors": "2775;1815;3077", "reply_reviewers": "0;1;3", "reply_authors": "5;3;5", "rating_avg": [ 5.0, 1.4142135623730951 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.0, 0.816496580927726 ], "wc_summary_avg": [ 95.0, 9.93310961716756 ], "wc_strengths_avg": [ 28.333333333333332, 5.436502143433363 ], "wc_weaknesses_avg": [ 583.3333333333334, 36.46307112073194 ], "wc_questions_avg": [ 56.666666666666664, 71.04145894397784 ], "wc_review_avg": [ 763.3333333333334, 72.26955713776645 ], "wc_reply_reviewers_avg": [ 259.3333333333333, 343.6823468779791 ], "wc_reply_authors_avg": [ 2555.6666666666665, 538.0466729032178 ], "reply_reviewers_avg": [ 1.3333333333333333, 1.247219128924647 ], "reply_authors_avg": [ 4.333333333333333, 0.9428090415820634 ], "replies_avg": [ 24, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.5, "gs_citation": 7, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6364363259821404592&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 5, "aff_unique_index": "0;1;0", "aff_unique_norm": "Cornell University;University of British Columbia", "aff_unique_dep": ";", "aff_unique_url": "https://www.cornell.edu;https://www.ubc.ca", "aff_unique_abbr": "Cornell;UBC", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;0", "aff_country_unique": "United States;Canada" }, { "id": "1g77zRaJq0", "title": "Text2NKG: Fine-Grained N-ary Relation Extraction for N-ary relational Knowledge Graph Construction", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Beyond traditional binary relational facts, n-ary relational knowledge 
graphs (NKGs) are composed of n-ary relational facts containing more than two entities, which are closer to real-world facts with broader applications. However, the construction of NKGs still significantly relies on manual labor, and n-ary relation extraction still remains at a coarse-grained level, which typically assumes a single schema and a fixed arity of entities. To address these restrictions, we propose Text2NKG, a novel fine-grained n-ary relation extraction framework for n-ary relational knowledge graph construction. We introduce a span-tuple classification approach with hetero-ordered merging to accomplish fine-grained n-ary relation extraction with different arities. Furthermore, Text2NKG supports four typical NKG schemas: hyper-relational schema, event-based schema, role-based schema, and hypergraph-based schema, with high flexibility and practicality. Experimental results demonstrate that Text2NKG outperforms the previous state-of-the-art model by nearly 20 percentage points in the $F_1$ scores on the fine-grained n-ary relation extraction benchmark in the hyper-relational schema. Our code and datasets are publicly available.", "keywords": "N-ary Relation Extraction;N-ary relational Knowledge Graph;Knowledge Graph Construction", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/a2434b97e1785d88eaefa40b23a48dac5cd1aecd.zip", "author": "Haoran Luo;Haihong E;Yuhao Yang;Tianyu Yao;Yikai Guo;Zichen Tang;Wentai Zhang;Kaiyang Wan;Shiyao Peng;Meina Song;Wei Lin", "authorids": "~Haoran_Luo1;~Haihong_E1;~Yuhao_Yang1;~Tianyu_Yao1;~Yikai_Guo2;~Zichen_Tang1;~Wentai_Zhang2;~Kaiyang_Wan1;~Shiyao_Peng2;~Meina_Song1;~Wei_Lin13", "gender": "M;F;M;M;M;M;M;M;F;M;", "homepage": "https://lhrlab.github.io/;https://teacher.bupt.edu.cn/ehaihong/zh_CN/index.htm;;https://github.com/yao12315;https://github.com/GYK-CASIC;https://github.com/StarLight24;;https://github.com/coverdpsy;http://teacher.bupt.edu.cn/songmeina/;http://www.inspur.com;", "dblp": "227/5902-1.html;43/10222.html;;324/5213;334/4154;264/0465;324/4644;;95/4440;https://dblp.uni-trier.de/pid/99/2649;", "google_scholar": "https://scholar.google.com.hk/citations?user=Q9Nv9mcAAAAJ;https://scholar.google.com.hk/citations?user=J4akh64AAAAJ;T0arNqgAAAAJ;M3wrJAwAAAAJ;https://scholar.google.com.hk/citations?user=4LxmyZAAAAAJ;https://scholar.google.com/citations?hl=zh-CN;v_faxAsAAAAJ;;https://scholar.google.com/citations?hl=zh-CN;;https://scholar.google.com/citations?hl=en", "orcid": "0000-0003-2727-0361;;;;0000-0003-0345-1686;0000-0002-0244-4970;;;0000-0001-6626-9932;;", "linkedin": "haoran-luo-88a96b255/;;;;https://www.linkedin.cn/incareer/in/ACoAAD5htzQBKWZKy68SvRuuztB4LJDhIKMdM1o;;;;;;", "or_profile": "~Haoran_Luo1;~Haihong_E1;~Yuhao_Yang1;~Tianyu_Yao1;~Yikai_Guo2;~Zichen_Tang1;~Kaiyang_Wan1;~Shiyao_Peng2;~Meina_Song1;~Wei_Lin13;~wentai_zhang1", "aff": "Nanyang Technological University;Beijing University of Post and Telecommunication;Beihang University;Beijing University of Posts and Telecommunications;Beijing Institute of Computer Technology and Application;Beijing University of Posts and Telecommunications;Beijing University of Posts and Telecommunications;China University of Petroleum-Beijing at Karamay;Beijing University of Posts and Telecommunications;;", "aff_domain": "ntu.edu.sg;bupt.edu.cn;buaa.edu.cn;bupt.edu.cn;casic.com.cn;bupt.edu.cn;bupt.edu.cn;cupk.edu.cn;bupt.edu.cn;;", "position": "Intern;Full Professor;MS student;MS student;PhD student;MS student;Undergrad
student;Undergrad student;Full Professor;;", "bibtex": "@misc{\nluo2024textnkg,\ntitle={Text2{NKG}: Fine-Grained N-ary Relation Extraction for N-ary relational Knowledge Graph Construction},\nauthor={Haoran Luo and Haihong E and Yuhao Yang and Tianyu Yao and Yikai Guo and Zichen Tang and Wentai Zhang and Kaiyang Wan and Shiyao Peng and Meina Song and Wei Lin},\nyear={2024},\nurl={https://openreview.net/forum?id=1g77zRaJq0}\n}", "github": "", "project": "", "reviewers": "ZHPg;vB44;JaVm;z8Bh", "site": "https://openreview.net/forum?id=1g77zRaJq0", "pdf_size": 2177425, "rating": "3;3;5;5", "confidence": "4;3;3;4", "soundness": "2;3;3;3", "contribution": "2;2;3;2", "presentation": "2;1;2;2", "wc_summary": "98;184;155;40", "wc_strengths": "49;20;180;84", "wc_weaknesses": "63;88;607;146", "wc_questions": "5;136;265;37", "wc_review": "215;428;1207;307", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 1.75, 0.4330127018922193 ], "wc_summary_avg": [ 119.25, 55.23302906775981 ], "wc_strengths_avg": [ 83.25, 60.280075481040996 ], "wc_weaknesses_avg": [ 226.0, 222.02139536540167 ], "wc_questions_avg": [ 110.75, 101.30739114200898 ], "wc_review_avg": [ 539.25, 392.85644642795415 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 11, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=13416463536580625484&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "aff_unique_index": "0;1;2;1;3;1;1;4;1", "aff_unique_norm": "Nanyang Technological University;Beijing University of Posts and Telecommunications;Beihang University;Beijing Institute of Computer Technology and Application;China University of Petroleum", "aff_unique_dep": ";;;;", "aff_unique_url": "https://www.ntu.edu.sg;http://www.bupt.edu.cn/;http://www.buaa.edu.cn/;;http://www.cup.edu.cn", "aff_unique_abbr": "NTU;BUPT;BUAA;;CUP", "aff_campus_unique_index": "1;1;1;1;1;1", "aff_campus_unique": ";Beijing", "aff_country_unique_index": "0;1;1;1;1;1;1;1;1", "aff_country_unique": "Singapore;China" }, { "id": "1gkePTsAWf", "title": "Self-Taught Optimizer (STOP): Recursively Self-Improving Code Generation", "track": "main", "status": "Reject", "tldr": "", "abstract": "Several recent advances in AI systems (e.g., Tree-of-Thoughts and Program-Aided Language Models) solve problems by providing a \"scaffolding\" program that structures multiple calls to language models to generate better outputs. A scaffolding program is written in a programming language such as Python. In this work, we use a language-model-infused scaffolding program to improve itself. We start with a seed \"improver\" that improves an input program according to a given utility function by querying a language model several times and returning the best solution. We then run this seed improver to improve itself. Across a small set of downstream tasks, the resulting improved improver generates programs with significantly better performance than its seed improver. Afterward, we analyze the variety of self-improvement strategies proposed by the language model, including beam search, genetic algorithms, and simulated annealing. 
Since the language models themselves are not altered, this is not full recursive self-improvement. Nonetheless, it demonstrates that a modern language model, GPT-4 in our proof-of-concept experiments, is capable of writing code that can call itself to improve itself. We critically consider concerns around the development of self-improving technologies and evaluate the frequency with which the generated code bypasses a sandbox.", "keywords": "reasoning;language models;self-improvement;code generation", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Eric Zelikman;Eliana Lorch;Lester Mackey;Adam Tauman Kalai", "authorids": "~Eric_Zelikman1;eliana@lorien.ai;~Lester_Mackey1;~Adam_Tauman_Kalai1", "gender": "M;;M;", "homepage": "https://zelikman.me;;https://stanford.edu/~lmackey;", "dblp": "217/2378;;05/2961;", "google_scholar": "V5B8dSUAAAAJ;;erv7TP0AAAAJ;", "orcid": ";;0000-0002-1102-0387;", "linkedin": "ericzelikman/;;lester-mackey-5902909;", "or_profile": "~Eric_Zelikman1;eliana@lorien.ai;~Lester_Mackey1;~Adam_Tauman_Kalai1", "aff": "Stanford University;;Microsoft Research New England;", "aff_domain": "stanford.edu;;microsoft.com;", "position": "PhD student;;Principal Researcher;", "bibtex": "@misc{\nzelikman2024selftaught,\ntitle={Self-Taught Optimizer ({STOP}): Recursively Self-Improving Code Generation},\nauthor={Eric Zelikman and Eliana Lorch and Lester Mackey and Adam Tauman Kalai},\nyear={2024},\nurl={https://openreview.net/forum?id=1gkePTsAWf}\n}", "github": "", "project": "", "reviewers": "UnQ9;VZPP;X5AY;443q;yFD6", "site": "https://openreview.net/forum?id=1gkePTsAWf", "pdf_size": 600577, "rating": "5;6;6;6;8", "confidence": "4;2;4;4;4", "soundness": "2;2;3;3;3", "contribution": "3;2;3;3;4", "presentation": "4;2;3;2;4", "wc_summary": "107;105;78;83;111", "wc_strengths": "53;23;97;67;189", "wc_weaknesses": "224;300;66;255;12", "wc_questions": "38;59;51;84;26", "wc_review": "422;487;292;489;338", "wc_reply_reviewers": "0;91;0;108;7", "wc_reply_authors": "776;1412;654;670;242", "reply_reviewers": "0;1;0;1;1", "reply_authors": "1;2;1;1;1", "rating_avg": [ 6.2, 0.9797958971132712 ], "confidence_avg": [ 3.6, 0.8000000000000002 ], "soundness_avg": [ 2.6, 0.4898979485566356 ], "contribution_avg": [ 3.0, 0.6324555320336759 ], "presentation_avg": [ 3.0, 0.8944271909999159 ], "wc_summary_avg": [ 96.8, 13.541048703848606 ], "wc_strengths_avg": [ 85.8, 56.83097746827869 ], "wc_weaknesses_avg": [ 171.4, 112.08139899198261 ], "wc_questions_avg": [ 51.6, 19.724096937502615 ], "wc_review_avg": [ 405.6, 79.15200565999575 ], "wc_reply_reviewers_avg": [ 41.2, 47.97249211787938 ], "wc_reply_authors_avg": [ 750.8, 377.517363839069 ], "reply_reviewers_avg": [ 0.6, 0.48989794855663565 ], "reply_authors_avg": [ 1.2, 0.4000000000000001 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.10206207261596571, "gs_citation": 44, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=7905804306816397467&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 7, "aff_unique_index": "0;1", "aff_unique_norm": "Stanford University;Microsoft", "aff_unique_dep": ";Microsoft Research", "aff_unique_url": "https://www.stanford.edu;https://www.microsoft.com/en-us/research/group/microsoft-research-new-england", "aff_unique_abbr": "Stanford;MSR NE", "aff_campus_unique_index": "0;1", "aff_campus_unique": "Stanford;New England", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "id": "1hLFLNu4uy", "title": 
"Split and Merge: Aligning Position Biases in Large Language Model based Evaluators", "track": "main", "status": "Reject", "tldr": "", "abstract": "Large language models (LLMs) have shown promise as automated evaluators for assessing the quality of answers generated by AI systems. However, these LLM-based evaluators exhibit position bias, or inconsistency, when used to evaluate candidate answers in pairwise comparisons, favoring either the first or second answer regardless of content. To address this limitation, we propose PORTIA, an\nalignment-based system designed to mimic human comparison strategies to calibrate position bias in a lightweight yet effective manner. Specifically, PORTIA splits the answers into multiple segments, aligns similar content across candidate answers, and then merges them back into a single prompt for evaluation by LLMs. We conducted extensive experiments with six diverse LLMs to evaluate 11,520 answer pairs. Our results show that PORTIA markedly enhances the consistency rates for all the models and comparison forms tested, achieving an average relative improvement of 47.46%. Remarkably, PORTIA enables less advanced GPT models to achieve 88% agreement with the state-of-the-art GPT-4 model at just 10% of the cost. Furthermore, it rectifies around 80% of the position bias instances within the\nGPT-4 model, elevating its consistency rate up to 98%. Subsequent human evaluations indicate that the PORTIA-enhanced GPT-3.5 model can even surpass the standalone GPT-4 in terms of alignment with human evaluators. These findings highlight PORTIA\u2019s ability to correct position bias, improve LLM consistency, and boost performance while keeping cost-efficiency. This represents a valuable step\ntoward a more reliable and scalable use of LLMs for automated evaluations across diverse applications.", "keywords": "Large language models;Alignment;Consistency", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/6ff851bfb65da08eef4cc8051cf1210a71b91aad.zip", "author": "Zongjie Li;Chaozheng Wang;Pingchuan Ma;Daoyuan Wu;Tianxiang Li;Shuai Wang;Cuiyun Gao;Yang Liu", "authorids": "~Zongjie_Li1;~Chaozheng_Wang1;~Pingchuan_Ma4;~Daoyuan_Wu1;~Tianxiang_Li2;~Shuai_Wang7;~Cuiyun_Gao1;~Yang_Liu36", "gender": "Not Specified;M;;;M;M;F;M", "homepage": ";;;https://daoyuan14.github.io/;http://tianxiang.net;https://home.cse.ust.hk/~shuaiw/;https://cuiyungao.github.io/;https://personal.ntu.edu.sg/yangliu/", "dblp": ";217/1869;;https://dblp.uni-trier.de/pid/144/7556.html;;42/1503-11;;51/3710-3", "google_scholar": "https://scholar.google.com.hk/citations?user=Sd8mmE0AAAAJ;gx5zRYIAAAAJ;;WtO-bN8AAAAJ;;;9I2hTmQAAAAJ;https://scholar.google.com.sg/citations?hl=en", "orcid": ";;;;;;;0000-0001-7300-9215", "linkedin": ";;;;;;;", "or_profile": "~Zongjie_Li1;~Chaozheng_Wang1;~Pingchuan_Ma4;~Daoyuan_Wu1;~Tianxiang_Li2;~Shuai_Wang7;~Cuiyun_Gao1;~Yang_Liu36", "aff": "Department of Computer Science and Engineering, Hong Kong University of Science and Technology;Department of Computer Science and Engineering, The Chinese University of Hong Kong;;Nanyang Technological University;;Hong Kong University of Science and Technology;;Nanyang Technological University", "aff_domain": "cse.ust.hk;cse.cuhk.edu.hk;;ntu.edu.sg;;hkust.edu;;ntu.edu.sg", "position": "PhD student;PhD student;;Senior Research Fellow;;Associate Professor;;Full Professor", "bibtex": "@misc{\nli2024split,\ntitle={Split and Merge: Aligning Position Biases in Large Language Model based 
Evaluators},\nauthor={Zongjie Li and Chaozheng Wang and Pingchuan Ma and Daoyuan Wu and Tianxiang Li and Shuai Wang and Cuiyun Gao and Yang Liu},\nyear={2024},\nurl={https://openreview.net/forum?id=1hLFLNu4uy}\n}", "github": "", "project": "", "reviewers": "SWLn;cPgm;YB2D;RHzc", "site": "https://openreview.net/forum?id=1hLFLNu4uy", "pdf_size": 642987, "rating": "3;5;6;6", "confidence": "5;4;4;3", "soundness": "1;3;3;2", "contribution": "2;3;3;2", "presentation": "2;3;3;3", "wc_summary": "160;123;56;86", "wc_strengths": "33;80;20;36", "wc_weaknesses": "312;133;80;288", "wc_questions": "41;100;3;6", "wc_review": "546;436;159;416", "wc_reply_reviewers": "272;67;0;308", "wc_reply_authors": "1900;1253;454;683", "reply_reviewers": "2;1;0;1", "reply_authors": "3;2;1;1", "rating_avg": [ 5.0, 1.224744871391589 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.25, 0.82915619758885 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 106.25, 39.06644980030819 ], "wc_strengths_avg": [ 42.25, 22.609455986378798 ], "wc_weaknesses_avg": [ 203.25, 98.9125244850216 ], "wc_questions_avg": [ 37.5, 39.05444917035702 ], "wc_review_avg": [ 389.25, 141.8509340822259 ], "wc_reply_reviewers_avg": [ 161.75, 131.03887781876034 ], "wc_reply_authors_avg": [ 1072.5, 559.3721927303859 ], "reply_reviewers_avg": [ 1.0, 0.7071067811865476 ], "reply_authors_avg": [ 1.75, 0.82915619758885 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": -0.8660254037844386, "gs_citation": 32, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=320404609852215416&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 3, "aff_unique_index": "0;1;2;0;2", "aff_unique_norm": "Hong Kong University of Science and Technology;Chinese University of Hong Kong;Nanyang Technological University", "aff_unique_dep": "Department of Computer Science and Engineering;Department of Computer Science and Engineering;", "aff_unique_url": "https://www.ust.hk;https://www.cuhk.edu.hk;https://www.ntu.edu.sg", "aff_unique_abbr": "HKUST;CUHK;NTU", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Hong Kong SAR;", "aff_country_unique_index": "0;0;1;0;1", "aff_country_unique": "China;Singapore" }, { "id": "1hhja8ZxcP", "title": "Turbulent Flow Simulation using Autoregressive Conditional Diffusion Models", "track": "main", "status": "Reject", "tldr": "", "abstract": "Simulating turbulent flows is crucial for a wide range of applications, and machine learning-based solvers are gaining increasing relevance. However, achieving stability when generalizing to longer rollout horizons remains a persistent challenge for learned PDE solvers. We address this challenge by introducing a fully data-driven fluid solver that utilizes an autoregressive rollout based on conditional diffusion models. We show that this approach offers clear advantages in terms of rollout stability compared to other learned baselines. Remarkably, these improvements in stability are achieved without compromising the quality of generated samples, and our model successfully generalizes to flow parameters beyond the training regime. Additionally, the probabilistic nature of the diffusion approach allows for inferring predictions that align with the statistics of the underlying physics. 
We quantitatively and qualitatively evaluate the performance of our method on a range of challenging scenarios, including incompressible and transonic flows, as well as isotropic turbulence.", "keywords": "turbulent flow;PDEs;numerical simulation;diffusion models;autoregressive models", "primary_area": "applications to physical sciences (physics, chemistry, biology, etc.)", "supplementary_material": "/attachment/00bf9b95aea315c609939fe20bbf16083220ea6c.zip", "author": "Georg Kohl;Liwei Chen;Nils Thuerey", "authorids": "~Georg_Kohl1;~Liwei_Chen2;~Nils_Thuerey1", "gender": "M;M;M", "homepage": "https://ge.in.tum.de/about/georg-kohl/;;https://ge.in.tum.de", "dblp": "259/1567;;42/478", "google_scholar": "https://scholar.google.de/citations?user=9gVgWocAAAAJ;;https://scholar.google.com.tw/citations?user=GEehwv8AAAAJ", "orcid": "0000-0002-9661-575X;0000-0002-0309-2284;", "linkedin": ";liwei-chen-46557017/;", "or_profile": "~Georg_Kohl1;~Liwei_Chen2;~Nils_Thuerey1", "aff": "Technische Universit\u00e4t M\u00fcnchen;Technical University Munich;Technical University Munich", "aff_domain": "tum.de;tum.de;tum.de", "position": "PhD student;Postdoc;Associate Professor", "bibtex": "@misc{\nkohl2024turbulent,\ntitle={Turbulent Flow Simulation using Autoregressive Conditional Diffusion Models},\nauthor={Georg Kohl and Liwei Chen and Nils Thuerey},\nyear={2024},\nurl={https://openreview.net/forum?id=1hhja8ZxcP}\n}", "github": "", "project": "", "reviewers": "1NQ6;ySpT;wsiC;JT77", "site": "https://openreview.net/forum?id=1hhja8ZxcP", "pdf_size": 16314951, "rating": "5;5;5;5", "confidence": "5;4;5;3", "soundness": "2;2;2;3", "contribution": "2;2;2;1", "presentation": "3;2;3;3", "wc_summary": "48;57;75;49", "wc_strengths": "33;72;247;61", "wc_weaknesses": "55;284;772;348", "wc_questions": "209;120;221;120", "wc_review": "345;533;1315;578", "wc_reply_reviewers": "0;69;0;0", "wc_reply_authors": "1070;716;1585;904", "reply_reviewers": "0;1;0;0", "reply_authors": "2;1;3;2", "rating_avg": [ 5.0, 0.0 ], "confidence_avg": [ 4.25, 0.82915619758885 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 57.25, 10.825317547305483 ], "wc_strengths_avg": [ 103.25, 84.20325112488234 ], "wc_weaknesses_avg": [ 364.75, 259.1325674244748 ], "wc_questions_avg": [ 167.5, 47.68909728648677 ], "wc_review_avg": [ 692.75, 369.73394150388737 ], "wc_reply_reviewers_avg": [ 17.25, 29.877876430563134 ], "wc_reply_authors_avg": [ 1068.75, 323.29968682323215 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 2.0, 0.7071067811865476 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 27, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=2514720713749392884&as_sdt=40005&sciodt=0,10&hl=en", "gs_version_total": 0, "aff_unique_index": "0;1;1", "aff_unique_norm": "Technische Universit\u00e4t M\u00fcnchen;Technical University of Munich", "aff_unique_dep": ";", "aff_unique_url": "https://www.tum.de;https://www.tum.de", "aff_unique_abbr": "TUM;TUM", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "Germany" }, { "title": "Sample-Efficient Learning of POMDPs with Multiple Observations In Hindsight", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19578", "id": "1hsVvgW0rU", "author_site": "Jiacheng Guo, Minshuo Chen, Huan Wang, Caiming Xiong, Mengdi 
Wang, Yu Bai", "tldr": "", "abstract": "This paper studies the sample-efficiency of learning in Partially Observable Markov Decision Processes (POMDPs), a challenging problem in reinforcement learning that is known to be exponentially hard in the worst-case. Motivated by real-world settings such as loading in game playing, we propose an enhanced feedback model called ``multiple observations in hindsight'', where after each episode of interaction with the POMDP, the learner may collect multiple additional observations emitted from the encountered latent states, but may not observe the latent states themselves. We show that sample-efficient learning under this feedback model is possible for two new subclasses of POMDPs: \\emph{multi-observation revealing POMDPs} and \\emph{distinguishable POMDPs}. Both subclasses generalize and substantially relax \\emph{revealing POMDPs}---a widely studied subclass for which sample-efficient learning is possible under standard trajectory feedback. Notably, distinguishable POMDPs only require the emission distributions from different latent states to be \\emph{different} instead of \\emph{linearly independent} as required in revealing POMDPs.", "keywords": "reinforcement learning theory;POMDPs;partially observable reinforcement learning", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Jiacheng Guo;Minshuo Chen;Huan Wang;Caiming Xiong;Mengdi Wang;Yu Bai", "authorids": "~Jiacheng_Guo1;~Minshuo_Chen1;~Huan_Wang1;~Caiming_Xiong1;~Mengdi_Wang1;~Yu_Bai1", "gender": ";M;M;M;F;", "homepage": "http://;https://minshuochen.github.io;http://www.cs.yale.edu/homes/wang-huan/;http://cmxiong.com/;http://mwang.princeton.edu;https://yubai.org", "dblp": ";217/1509;70/6155-16.html;80/7282;;03/6325-17.html", "google_scholar": ";qU9WvTgAAAAJ;7NpTttkAAAAJ;vaSdahkAAAAJ;;owqhKD8AAAAJ", "orcid": ";;;;;", "linkedin": ";;huanwangyale/;caiming-xiong-150a1417;;", "or_profile": "~Jiacheng_Guo1;~Minshuo_Chen1;~Huan_Wang1;~Caiming_Xiong1;~Mengdi_Wang1;~Yu_Bai1", "aff": "Princeton University;Princeton University;Salesforce.com;Salesforce Research;Princeton University;Salesforce Research", "aff_domain": "princeton.edu;princeton.edu;salesforce.com;salesforce.com;princeton.edu;salesforce.com", "position": "PhD student;Postdoc;Researcher;Research Scientist;Full Professor;Research Scientist", "bibtex": "@inproceedings{\nguo2024sampleefficient,\ntitle={Sample-Efficient Learning of {POMDP}s with Multiple Observations In Hindsight},\nauthor={Jiacheng Guo and Minshuo Chen and Huan Wang and Caiming Xiong and Mengdi Wang and Yu Bai},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=1hsVvgW0rU}\n}", "github": "", "project": "", "reviewers": "jqb5;q33U;se9m;FWjL", "pdf_size": 481945, "rating": "6;6;6;6", "confidence": "4;3;3;4", "soundness": "3;4;2;4", "contribution": "2;3;3;3", "presentation": "3;4;2;3", "wc_summary": "170;35;89;164", "wc_strengths": "111;78;34;54", "wc_weaknesses": "70;102;24;233", "wc_questions": "96;60;61;150", "wc_review": "447;275;208;601", "wc_reply_reviewers": "0;0;56;0", "wc_reply_authors": "282;458;433;1224", "reply_reviewers": "0;0;1;0", "reply_authors": "1;1;2;2", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 3.25, 0.82915619758885 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 114.5, 55.90393546075267 ], "wc_strengths_avg": [ 69.25, 28.699956445959984 
], "wc_weaknesses_avg": [ 107.25, 77.71542639656556 ], "wc_questions_avg": [ 91.75, 36.62222685747004 ], "wc_review_avg": [ 382.75, 153.22267293060776 ], "wc_reply_reviewers_avg": [ 14.0, 24.24871130596428 ], "wc_reply_authors_avg": [ 599.25, 366.9300853023638 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 8, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=15402953603063387946&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=1hsVvgW0rU", "pdf": "https://openreview.net/pdf?id=1hsVvgW0rU", "email": "princeton.edu;princeton.edu;salesforce.com;salesforce.com;princeton.edu;salesforce.com", "author_num": 6, "aff_unique_index": "0;0;1;1;0;1", "aff_unique_norm": "Princeton University;Salesforce", "aff_unique_dep": ";", "aff_unique_url": "https://www.princeton.edu;https://www.salesforce.com", "aff_unique_abbr": "Princeton;Salesforce", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "1iKydVG6pL", "title": "Discovering Mathematical Formulas from Data via LSTM-guided Monte Carlo Tree Search", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Finding a concise and interpretable mathematical formula that accurately describes the relationship between each variable and the predicted value in the data is a crucial task in scientific research, as well as a significant challenge in artificial intelligence. This problem is commonly referred to as symbolic regression, which poses an NP-hard combinatorial optimization problem. Traditional symbolic regression algorithms typically rely on genetic algorithms; however, these approaches are sensitive to hyperparameters and often struggle to fully recover the target expression. To address these limitations, a novel symbolic regression algorithm based on Monte Carlo Tree Search (MCTS) was proposed this year. While this algorithm has shown considerable improvement in recovering target expressions compared to previous methods, it still faces challenges when dealing with complex expressions due to the vast search space involved. Moreover, the lack of guidance during the MCTS expansion process severely hampers its search efficiency. In order to overcome these issues, we propose AlphaSymbol - a new symbolic regression algorithm that combines MCTS with a Long Short-Term Memory network (LSTM). By leveraging LSTM's ability to guide the MCTS expansion process effectively, we enhance the overall search efficiency of MCTS significantly. Next, we utilize the MCTS results to further refine the LSTM network, enhancing its capabilities and providing more accurate guidance for the MCTS process. MCTS and LSTM hand in hand advance together, win-win cooperation until the target expression is successfully determined. We conducted extensive evaluations of AlphaSymbol using 222 expressions sourced from over 10 different symbolic regression datasets. 
The experimental results demonstrate that AlphaSymbol outperforms existing state-of-the-art algorithms in accurately recovering symbolic expressions both with and without added noise.", "keywords": "Symbolic Regression;Long Short-Term Memory network;Monte Carlo Tree Search;Reinforcement learning.", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/d1f08fa871ba306251908079d750099dbef4b664.pdf", "author": "Yanjie Li;Weijun Li;Lina Yu;Min Wu;Linjun Sun;Jingyi Liu;Wenqiang Li;Meilan Hao", "authorids": "~Yanjie_Li4;~Weijun_Li1;~Lina_Yu1;~Min_Wu5;~Linjun_Sun1;~Jingyi_Liu2;~Wenqiang_Li2;~Meilan_Hao1", "gender": ";M;F;M;M;F;M;", "homepage": ";;;http://lab.semi.ac.cn/ailab/;;;https://github.com/AILWQ;", "dblp": ";;;16/0;;;;", "google_scholar": ";HrzfypUAAAAJ;I8Uc918AAAAJ;wvvyr8UAAAAJ;50WznDAAAAAJ;;b-MGt8gAAAAJ;", "orcid": ";0000-0001-9668-2883;;0000-0001-9475-3975;0000-0002-9287-9467;0000-0002-9710-5006;0000-0003-3286-7445;", "linkedin": ";;;;;;;", "or_profile": "~Yanjie_Li4;~Weijun_Li1;~Lina_Yu1;~Min_Wu5;~Linjun_Sun1;~Jingyi_Liu2;~Wenqiang_Li2;~Meilan_Hao1", "aff": ";Institute of Semiconductors Chinese Academy of Sciences;Institute of Semiconductors, Chinese Academy of Sciences;Institute of Semiconductors, Chinese Academy of Sciences;Institute of Semiconductors, Chinese Academy of Sciences;University of Chinese Academy of Sciences;University of Chinese Academy of Sciences;", "aff_domain": ";ucac.ac.cn;semi.ac.cn;semi.ac.cn;semi.ac.cn;ucas.edu;ucas.ac.cn;", "position": ";Full Professor;Associate Professor;Assistant Professor;Postdoc;PhD student;MS student;", "bibtex": "@misc{\nli2024discovering,\ntitle={Discovering Mathematical Formulas from Data via {LSTM}-guided Monte Carlo Tree Search},\nauthor={Yanjie Li and Weijun Li and Lina Yu and Min Wu and Linjun Sun and Jingyi Liu and Wenqiang Li and Meilan Hao},\nyear={2024},\nurl={https://openreview.net/forum?id=1iKydVG6pL}\n}", "github": "", "project": "", "reviewers": "SBg1;YgjN;27mA;Fmza", "site": "https://openreview.net/forum?id=1iKydVG6pL", "pdf_size": 1317617, "rating": "3;3;5;6", "confidence": "4;4;3;5", "soundness": "1;2;3;3", "contribution": "1;2;3;2", "presentation": "1;1;2;3", "wc_summary": "20;18;77;43", "wc_strengths": "16;21;57;18", "wc_weaknesses": "105;321;342;21", "wc_questions": "263;40;4;51", "wc_review": "404;400;480;133", "wc_reply_reviewers": "287;26;56;22", "wc_reply_authors": "2163;658;735;243", "reply_reviewers": "2;1;1;1", "reply_authors": "4;3;2;2", "rating_avg": [ 4.25, 1.299038105676658 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.25, 0.82915619758885 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 1.75, 0.82915619758885 ], "wc_summary_avg": [ 39.5, 23.77498685593748 ], "wc_strengths_avg": [ 28.0, 16.837458240482736 ], "wc_weaknesses_avg": [ 197.25, 137.69599667383218 ], "wc_questions_avg": [ 89.5, 101.66734972448135 ], "wc_review_avg": [ 354.25, 131.65556387787035 ], "wc_reply_reviewers_avg": [ 97.75, 110.05084052382335 ], "wc_reply_authors_avg": [ 949.75, 725.0356456754384 ], "reply_reviewers_avg": [ 1.25, 0.4330127018922193 ], "reply_authors_avg": [ 2.75, 0.82915619758885 ], "replies_avg": [ 23, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": 0.2721655269759087, "gs_citation": 11, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=15681812717127003335&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "aff_unique_index": "0;0;0;0;1;1", "aff_unique_norm": "Chinese Academy of Sciences;University of Chinese Academy of 
Sciences", "aff_unique_dep": "Institute of Semiconductors;", "aff_unique_url": "http://www.semi.ac.cn;http://www.ucas.ac.cn", "aff_unique_abbr": "CAS;UCAS", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "China" }, { "title": "Simple Minimax Optimal Byzantine Robust Algorithm for Nonconvex Objectives with Uniform Gradient Heterogeneity", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19577", "id": "1ii8idH4tH", "author_site": "Tomoya Murata, Kenta Niwa, Takumi Fukami, Iifan Tyou", "tldr": "", "abstract": "In this study, we consider nonconvex federated learning problems with the existence of Byzantine workers. We propose a new simple Byzantine robust algorithm called Momentum Screening. The algorithm is adaptive to the Byzantine fraction, i.e., all its hyperparameters do not depend on the number of Byzantine workers. We show that our method achieves the best optimization error of $O(\\delta^2\\zeta_\\mathrm{max}^2)$ for nonconvex smooth local objectives satisfying $\\zeta_\\mathrm{max}$-uniform gradient heterogeneity condition under $\\delta$-Byzantine fraction, which can be better than the best known error rate of $O(\\delta\\zeta_\\mathrm{mean}^2)$ for local objectives satisfying $\\zeta_\\mathrm{mean}$-mean heterogeneity condition when $\\delta \\leq (\\zeta_\\mathrm{max}/\\zeta_\\mathrm{mean})^2$. Furthermore, we derive an algorithm independent lower bound for local objectives satisfying $\\zeta_\\mathrm{max}$-uniform gradient heterogeneity condition and show the minimax optimality of our proposed method on this class. In numerical experiments, we validate the superiority of our method over the existing robust aggregation algorithms and verify our theoretical results.", "keywords": "Byzantine Robustness;Nonconvex Optimization;Federated Learning", "primary_area": "optimization", "supplementary_material": "", "author": "Tomoya Murata;Kenta Niwa;Takumi Fukami;Iifan Tyou", "authorids": "~Tomoya_Murata1;~Kenta_Niwa1;~Takumi_Fukami1;~Iifan_Tyou1", "gender": "M;M;;M", "homepage": ";http://www.kecl.ntt.co.jp/icl/ls/members/niwa/index.html;;", "dblp": "151/5035;64/1008.html;;234/8871.html", "google_scholar": "hH5pbMIAAAAJ;Btla06EAAAAJ;;", "orcid": ";0000-0002-6911-0238;;", "linkedin": ";;http://www.linkedin.com/in/takumi-fukami-8a4a40238;tyou-iifan-354b132b/", "or_profile": "~Tomoya_Murata1;~Kenta_Niwa1;~Takumi_Fukami1;~Iifan_Tyou1", "aff": "The University of Tokyo;NTT Corporation;NTT Corporation;NTT", "aff_domain": "tokyo.ac.jp;ntt.co.jp;ntt.co.jp;ntt.co.jp", "position": "PhD student;Researcher;Researcher;Researcher", "bibtex": "@inproceedings{\nmurata2024simple,\ntitle={Simple Minimax Optimal Byzantine Robust Algorithm for Nonconvex Objectives with Uniform Gradient Heterogeneity},\nauthor={Tomoya Murata and Kenta Niwa and Takumi Fukami and Iifan Tyou},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=1ii8idH4tH}\n}", "github": "", "project": "", "reviewers": "p51w;uTUe;BeSt", "pdf_size": 5418301, "rating": "3;6;6", "confidence": "2;3;3", "soundness": "3;3;3", "contribution": "2;3;3", "presentation": "2;2;3", "wc_summary": "65;123;108", "wc_strengths": "43;107;69", "wc_weaknesses": "213;255;47", "wc_questions": "3;18;26", "wc_review": "324;503;250", "wc_reply_reviewers": "0;23;16", "wc_reply_authors": "430;551;310", "reply_reviewers": "0;1;1", "reply_authors": "1;1;1", "rating_avg": [ 5.0, 
1.4142135623730951 ], "confidence_avg": [ 2.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 98.66666666666667, 24.580932086115496 ], "wc_strengths_avg": [ 73.0, 26.280537792569366 ], "wc_weaknesses_avg": [ 171.66666666666666, 89.80472642845079 ], "wc_questions_avg": [ 15.666666666666666, 9.533566430716728 ], "wc_review_avg": [ 359.0, 106.21048284734735 ], "wc_reply_reviewers_avg": [ 13.0, 9.626352718795768 ], "wc_reply_authors_avg": [ 430.3333333333333, 98.38812033077073 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 1.0, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11224376210352366179&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 2, "openreview": "https://openreview.net/forum?id=1ii8idH4tH", "pdf": "https://openreview.net/pdf?id=1ii8idH4tH", "email": "tokyo.ac.jp;ntt.co.jp;ntt.co.jp;ntt.co.jp", "author_num": 4, "aff_unique_index": "0;1;1;1", "aff_unique_norm": "University of Tokyo;NTT Corporation", "aff_unique_dep": ";", "aff_unique_url": "https://www.u-tokyo.ac.jp;https://www.ntt.co.jp", "aff_unique_abbr": "UTokyo;NTT", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "Japan" }, { "title": "Towards Few-Shot Adaptation of Foundation Models via Multitask Finetuning", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19576", "id": "1jbh2e0b2K", "author_site": "Zhuoyan Xu, Zhenmei Shi, Junyi Wei, Fangzhou Mu, Yin Li, Yingyu Liang", "tldr": "", "abstract": "Foundation models have emerged as a powerful tool for many AI problems. Despite the tremendous success of foundation models, effective adaptation to new tasks, particularly those with limited labels, remains an open question and lacks theoretical understanding. \n An emerging solution with recent success in vision and NLP involves finetuning a foundation model on a selection of relevant tasks, before its adaptation to a target task with limited labeled samples. In this paper, we study the theoretical justification of this multitask finetuning approach. \nOur theoretical analysis reveals that with a diverse set of related tasks, this multitask finetuning leads to reduced error in the target task, in comparison to directly adapting the same pretrained model. 
We quantify the relationship between finetuning tasks and target tasks by diversity and consistency metrics, and further propose a practical task selection algorithm.\n We substantiate our theoretical claims with extensive empirical evidence.\nFurther, we present results affirming our task selection algorithm adeptly chooses related finetuning tasks, providing advantages to the model performance on target tasks.\n We believe our study shed new light on the effective adaptation of foundation models to new tasks that lack abundant labels.\n Our code is available at https://github.com/OliverXUZY/Foudation-Model_Multitask.", "keywords": "Foundation model;Multitask finetuning;Few-Shot learning", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "/attachment/4f14dfd2bb204fa615bc528f7d20255cb50796b4.zip", "author": "Zhuoyan Xu;Zhenmei Shi;Junyi Wei;Fangzhou Mu;Yin Li;Yingyu Liang", "authorids": "~Zhuoyan_Xu1;~Zhenmei_Shi1;~Junyi_Wei1;~Fangzhou_Mu1;~Yin_Li3;~Yingyu_Liang1", "gender": "M;M;F;M;M;", "homepage": "https://pages.cs.wisc.edu/~zxu444/;http://zhmeishi.github.io/;;https://fmu2.github.io/;https://www.biostat.wisc.edu/~yli/;", "dblp": "126/2019;246/5216;166/6146;262/6282;49/5981-3;", "google_scholar": "uufndFAAAAAJ;0oeNnzMAAAAJ;Kb1GL40AAAAJ;OOymFJsAAAAJ;_y-8nrcAAAAJ;", "orcid": ";;;0000-0001-5580-2404;;", "linkedin": "zhuoyan-xu-0702301a2/;zhenmei-shi-56408a113/;Junyi-Jenny-Wei-04ba979b/;;;", "or_profile": "~Zhuoyan_Xu1;~Zhenmei_Shi1;~Junyi_Wei1;~Fangzhou_Mu1;~Yin_Li3;~Yingyu_Liang1", "aff": "University of Wisconsin - Madison;University of Wisconsin - Madison;University of Wisconsin, Madison;NVIDIA;University of Wisconsin, Madison;", "aff_domain": "wisc.edu;wisc.edu;wisc.edu;nvidia.com;wisc.edu;", "position": "PhD student;PhD student;PhD student;Researcher;Assistant Professor;", "bibtex": "@inproceedings{\nxu2024towards,\ntitle={Towards Few-Shot Adaptation of Foundation Models via Multitask Finetuning},\nauthor={Zhuoyan Xu and Zhenmei Shi and Junyi Wei and Fangzhou Mu and Yin Li and Yingyu Liang},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=1jbh2e0b2K}\n}", "github": "", "project": "", "reviewers": "1yNr;72L9;AgCa;mX1E", "pdf_size": 922639, "rating": "5;5;6;8", "confidence": "4;5;3;3", "soundness": "3;3;3;3", "contribution": "2;3;2;3", "presentation": "2;2;3;3", "wc_summary": "135;44;44;210", "wc_strengths": "34;54;74;150", "wc_weaknesses": "157;97;78;41", "wc_questions": "72;97;2;91", "wc_review": "398;292;198;492", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "851;475;626;338", "reply_reviewers": "0;0;0;0", "reply_authors": "2;2;3;1", "rating_avg": [ 6.0, 1.224744871391589 ], "confidence_avg": [ 3.75, 0.82915619758885 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 108.25, 69.50674427708437 ], "wc_strengths_avg": [ 78.0, 43.9089968002003 ], "wc_weaknesses_avg": [ 93.25, 41.95458854523543 ], "wc_questions_avg": [ 65.5, 37.80542289143186 ], "wc_review_avg": [ 345.0, 110.4943437466371 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 572.5, 190.34245453918052 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 2.0, 0.7071067811865476 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.7385489458759963, "gs_citation": 32, "gs_cited_by_link": 
"https://scholar.google.com/scholar?cites=1704557995012034903&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=1jbh2e0b2K", "pdf": "https://openreview.net/pdf?id=1jbh2e0b2K", "email": "wisc.edu;wisc.edu;wisc.edu;nvidia.com;wisc.edu;", "author_num": 6, "aff_unique_index": "0;0;1;2;1", "aff_unique_norm": "University of Wisconsin-Madison;University of Wisconsin;NVIDIA", "aff_unique_dep": ";;NVIDIA Corporation", "aff_unique_url": "https://www.wisc.edu;https://www.wisc.edu;https://www.nvidia.com", "aff_unique_abbr": "UW-Madison;UW;NVIDIA", "aff_campus_unique_index": "0;0;0;0", "aff_campus_unique": "Madison;", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "United States" }, { "title": "InstaFlow: One Step is Enough for High-Quality Diffusion-Based Text-to-Image Generation", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19575", "id": "1k4yZbbDqX", "author_site": "Xingchao Liu, Xiwen Zhang, Jianzhu Ma, Jian Peng, Qiang Liu", "tldr": "", "abstract": "Diffusion models have revolutionized text-to-image generation with its exceptional quality and creativity. However, its multi-step sampling process is known to be slow, often requiring tens of inference steps to obtain satisfactory results. Previous attempts to improve its sampling speed and reduce computational costs through distillation have been unsuccessful in achieving a functional one-step model.\nIn this paper, we explore a recent method called Rectified Flow, which, thus far, has only been applied to small datasets. The core of Rectified Flow lies in its \\emph{reflow} procedure, which straightens the trajectories of probability flows, refines the coupling between noises and images, and facilitates the distillation process with student models. We propose a novel text-conditioned pipeline to turn Stable Diffusion (SD) into an ultra-fast one-step model, in which we find reflow plays a critical role in improving the assignment between noise and images. Leveraging our new pipeline, we create, to the best of our knowledge, the first one-step diffusion-based text-to-image generator with SD-level image quality, achieving an FID (Fr\u00e9chet Inception Distance) of $23.3$ on MS COCO 2017-5k, surpassing the previous state-of-the-art technique, progressive distillation, by a significant margin ($37.2$ $\\rightarrow$ $23.3$ in FID). By utilizing an expanded network with 1.7B parameters, we further improve the FID to $22.4$. We call our one-step models \\emph{InstaFlow}. On MS COCO 2014-30k, InstaFlow yields an FID of $13.1$ in just $0.09$ second, the best in $\\leq 0.1$ second regime, outperforming the recent StyleGAN-T ($13.9$ in $0.1$ second). Notably, the training of InstaFlow only costs 199 A100 GPU days. 
Codes and pre-trained models are available at \\url{github.com/gnobitab/InstaFlow}.", "keywords": "Diffusion Models;Generative Models;Acceleration", "primary_area": "generative models", "supplementary_material": "/attachment/26c516ba81ea09b09c94825008b1320432bf0439.pdf", "author": "Xingchao Liu;Xiwen Zhang;Jianzhu Ma;Jian Peng;qiang liu", "authorids": "~Xingchao_Liu1;~Xiwen_Zhang2;~Jianzhu_Ma2;~Jian_Peng1;~qiang_liu4", "gender": "M;M;M;M;M", "homepage": ";https://xiwen1995.github.io/;https://majianzhu.com/;http://jianpeng.web.engr.illinois.edu/;https://www.cs.utexas.edu/~lqiang/", "dblp": "228/7309;;24/9080.html;29/4181-1;61/3234-1", "google_scholar": "VOTVE0UAAAAJ;9ArsuzwAAAAJ;;https://scholar.google.com.tw/citations?user=4wcAVXAAAAAJ;https://scholar.google.com.tw/citations?user=2qDh4WUAAAAJ", "orcid": ";;;;", "linkedin": ";;;;", "or_profile": "~Xingchao_Liu1;~Xiwen_Zhang2;~Jianzhu_Ma2;~Jian_Peng1;~Qiang_Liu1", "aff": "University of Texas, Austin;Helixon Research;Tsinghua University;University of Illinois, Urbana Champaign;University of Texas, Austin", "aff_domain": "utexas.edu;helixon.com;tsinghua.edu.cn;illinois.edu;utexas.edu", "position": "PhD student;Researcher;Associate Professor;Assistant Professor;Assistant Professor", "bibtex": "@inproceedings{\nliu2024instaflow,\ntitle={InstaFlow: One Step is Enough for High-Quality Diffusion-Based Text-to-Image Generation},\nauthor={Xingchao Liu and Xiwen Zhang and Jianzhu Ma and Jian Peng and qiang liu},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=1k4yZbbDqX}\n}", "github": "", "project": "", "reviewers": "ZDe9;VVpt;mwbp;W54n", "pdf_size": 50159880, "rating": "6;6;8;8", "confidence": "5;4;4;3", "soundness": "3;4;3;3", "contribution": "2;2;3;3", "presentation": "3;3;3;3", "wc_summary": "158;47;61;62", "wc_strengths": "92;53;43;27", "wc_weaknesses": "168;85;167;74", "wc_questions": "85;54;33;45", "wc_review": "503;239;304;208", "wc_reply_reviewers": "127;257;93;58", "wc_reply_authors": "802;734;661;128", "reply_reviewers": "2;2;1;1", "reply_authors": "2;3;2;2", "rating_avg": [ 7.0, 1.0 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 82.0, 44.27753380666091 ], "wc_strengths_avg": [ 53.75, 23.951774464536026 ], "wc_weaknesses_avg": [ 123.5, 44.17295552710957 ], "wc_questions_avg": [ 54.25, 19.253246479490155 ], "wc_review_avg": [ 313.5, 114.7617096421973 ], "wc_reply_reviewers_avg": [ 133.75, 75.22424808530823 ], "wc_reply_authors_avg": [ 581.25, 266.3919809228498 ], "reply_reviewers_avg": [ 1.5, 0.5 ], "reply_authors_avg": [ 2.25, 0.4330127018922193 ], "replies_avg": [ 25, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.7071067811865475, "gs_citation": 217, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=40660508850029294&as_sdt=80000005&sciodt=0,23&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=1k4yZbbDqX", "pdf": "https://openreview.net/pdf?id=1k4yZbbDqX", "email": "utexas.edu;helixon.com;tsinghua.edu.cn;illinois.edu;utexas.edu", "author_num": 5, "aff_unique_index": "0;1;2;3;0", "aff_unique_norm": "University of Texas at Austin;Helixon Research;Tsinghua University;University of Illinois Urbana-Champaign", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.utexas.edu;;https://www.tsinghua.edu.cn;https://illinois.edu", "aff_unique_abbr": "UT Austin;;THU;UIUC", 
"aff_campus_unique_index": "0;2;0", "aff_campus_unique": "Austin;;Urbana-Champaign", "aff_country_unique_index": "0;0;1;0;0", "aff_country_unique": "United States;China" }, { "title": "Domain constraints improve risk prediction when outcome data is missing", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19574", "id": "1mNFsbvo2P", "author_site": "Sidhika Balachandar, Nikhil Garg, Emma Pierson", "tldr": "", "abstract": "Machine learning models are often trained to predict the outcome resulting from a human decision. For example, if a doctor decides to test a patient for disease, will the patient test positive? A challenge is that historical decision-making determines whether the outcome is observed: we only observe test outcomes for patients doctors historically tested. Untested patients, for whom outcomes are unobserved, may differ from tested patients along observed and unobserved dimensions. We propose a Bayesian model class which captures this setting. The purpose of the model is to accurately estimate risk for both tested and untested patients. Estimating this model is challenging due to the wide range of possibilities for untested patients. To address this, we propose two domain constraints which are plausible in health settings: a prevalence constraint, where the overall disease prevalence is known, and an expertise constraint, where the human decision-maker deviates from purely risk-based decision-making only along a constrained feature set. We show theoretically and on synthetic data that domain constraints improve parameter inference. We apply our model to a case study of cancer risk prediction, showing that the model's inferred risk predicts cancer diagnoses, its inferred testing policy captures known public health policies, and it can identify suboptimalities in test allocation. 
Though our case study is in healthcare, our analysis reveals a general class of domain constraints which can improve model estimation in many settings.", "keywords": "Bayesian model;health;selective labels;distribution shift;domain constraint;biomedicine", "primary_area": "probabilistic methods (Bayesian methods, variational inference, sampling, UQ, etc.)", "supplementary_material": "/attachment/115822eb773a6a547c0fc7d1eb1a2d2bb90f953f.pdf", "author": "Sidhika Balachandar;Nikhil Garg;Emma Pierson", "authorids": "~Sidhika_Balachandar1;~Nikhil_Garg2;~Emma_Pierson1", "gender": "F;;F", "homepage": "https://sidhikabalachandar.github.io/;https://gargnikhil.com/;https://people.eecs.berkeley.edu/~emmapierson/", "dblp": "280/2938;83/6058-1;159/0572", "google_scholar": "4x_agk4AAAAJ;8qSK3noAAAAJ;xGORWi0AAAAJ", "orcid": "0000-0001-6739-2027;0000-0002-1988-792X;", "linkedin": "sidhikab/;;", "or_profile": "~Sidhika_Balachandar1;~Nikhil_Garg2;~Emma_Pierson1", "aff": "Department of Computer Science, Cornell University;Cornell University;Cornell Tech", "aff_domain": "cs.cornell.edu;cornell.edu;cornell.edu", "position": "PhD student;Assistant Professor;Assistant Professor", "bibtex": "@inproceedings{\nbalachandar2024domain,\ntitle={Domain constraints improve risk prediction when outcome data is missing},\nauthor={Sidhika Balachandar and Nikhil Garg and Emma Pierson},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=1mNFsbvo2P}\n}", "github": "", "project": "", "reviewers": "uugS;KKGr;6mUm;26qi", "pdf_size": 495306, "rating": "5;8;8;8", "confidence": "3;4;4;2", "soundness": "2;4;3;3", "contribution": "2;4;3;3", "presentation": "3;4;4;4", "wc_summary": "82;64;65;38", "wc_strengths": "91;64;92;23", "wc_weaknesses": "143;151;50;134", "wc_questions": "38;2;46;32", "wc_review": "354;281;253;227", "wc_reply_reviewers": "0;0;25;12", "wc_reply_authors": "674;412;432;1052", "reply_reviewers": "0;0;1;1", "reply_authors": "1;1;1;2", "rating_avg": [ 7.25, 1.299038105676658 ], "confidence_avg": [ 3.25, 0.82915619758885 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 3.0, 0.7071067811865476 ], "presentation_avg": [ 3.75, 0.4330127018922193 ], "wc_summary_avg": [ 62.25, 15.722197683530124 ], "wc_strengths_avg": [ 67.5, 28.040149785619906 ], "wc_weaknesses_avg": [ 119.5, 40.574006457336694 ], "wc_questions_avg": [ 29.5, 16.635804759614125 ], "wc_review_avg": [ 278.75, 47.457217575412066 ], "wc_reply_reviewers_avg": [ 9.25, 10.328964130056798 ], "wc_reply_authors_avg": [ 642.5, 257.93555396648986 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.17407765595569782, "gs_citation": 8, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6485419293618097691&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=1mNFsbvo2P", "pdf": "https://openreview.net/pdf?id=1mNFsbvo2P", "email": "cs.cornell.edu;cornell.edu;cornell.edu", "author_num": 3, "aff_unique_index": "0;0;0", "aff_unique_norm": "Cornell University", "aff_unique_dep": "Department of Computer Science", "aff_unique_url": "https://www.cornell.edu", "aff_unique_abbr": "Cornell", "aff_campus_unique_index": "1", "aff_campus_unique": ";New York City", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "1mOeklnLf4", "title": "FroSSL: Frobenius Norm Minimization for 
Self-Supervised Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "Self-supervised learning (SSL) is an increasingly popular paradigm for representation learning. Recent methods can be classified as sample-contrastive, dimension-contrastive, or asymmetric network-based, with each family having its own approach to avoiding informational collapse. While dimension-contrastive methods converge to similar solutions as sample-contrastive methods, it can be empirically shown that some methods require more epochs of training to converge. Motivated by closing this divide, we present the objective function FroSSL which is both sample- and dimension-contrastive up to embedding normalization. FroSSL works by minimizing covariance Frobenius norms for avoiding collapse and minimizing mean-squared error for augmentation invariance. We show that FroSSL converges more quickly than a variety of other SSL methods and provide theoretical and empirical support that this faster convergence is due to how FroSSL affects the eigenvalues of the embedding covariance matrices. We also show that FroSSL learns competitive representations on linear probe evaluation when used to train a ResNet18 on the CIFAR-10, CIFAR-100, STL-10, and ImageNet datasets.", "keywords": "self-supervised learning;representation learning;information theory;computer vision", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/e3ac395c7817f32cf7e7b4ac509117b560b6a5f5.zip", "author": "Oscar Skean;Aayush Dhakal;Nathan Jacobs;Luis Gonzalo Sanchez Giraldo", "authorids": "~Oscar_Skean1;a.dhakal@wustl.edu;~Nathan_Jacobs1;~Luis_Gonzalo_Sanchez_Giraldo2", "gender": "M;;M;", "homepage": ";;https://jacobsn.github.io/;", "dblp": ";;82/3140;", "google_scholar": "XO1nKsUAAAAJ;;ZBgGyh8AAAAJ;", "orcid": "0000-0002-4160-8392;;0000-0002-4242-8967;", "linkedin": ";;jacobsn/;", "or_profile": "~Oscar_Skean1;a.dhakal@wustl.edu;~Nathan_Jacobs1;~Luis_Gonzalo_Sanchez_Giraldo2", "aff": "University of Kentucky;;Washington University, Saint Louis;", "aff_domain": "uky.edu;;wustl.edu;", "position": "PhD student;;Full Professor;", "bibtex": "@misc{\nskean2024frossl,\ntitle={Fro{SSL}: Frobenius Norm Minimization for Self-Supervised Learning},\nauthor={Oscar Skean and Aayush Dhakal and Nathan Jacobs and Luis Gonzalo Sanchez Giraldo},\nyear={2024},\nurl={https://openreview.net/forum?id=1mOeklnLf4}\n}", "github": "", "project": "", "reviewers": "tbwD;dD2L;ZCeH;rGwc", "site": "https://openreview.net/forum?id=1mOeklnLf4", "pdf_size": 9901764, "rating": "3;3;3;5", "confidence": "5;3;4;3", "soundness": "1;2;3;3", "contribution": "1;1;2;2", "presentation": "1;3;3;3", "wc_summary": "63;49;41;20", "wc_strengths": "11;133;25;39", "wc_weaknesses": "209;261;3;58", "wc_questions": "159;56;94;25", "wc_review": "442;499;163;142", "wc_reply_reviewers": "0;0;0;39", "wc_reply_authors": "716;114;214;162", "reply_reviewers": "0;0;0;1", "reply_authors": "1;1;1;1", "rating_avg": [ 3.5, 0.8660254037844386 ], "confidence_avg": [ 3.75, 0.82915619758885 ], "soundness_avg": [ 2.25, 0.82915619758885 ], "contribution_avg": [ 1.5, 0.5 ], "presentation_avg": [ 2.5, 0.8660254037844386 ], "wc_summary_avg": [ 43.25, 15.562374497485916 ], "wc_strengths_avg": [ 52.0, 47.80167361086848 ], "wc_weaknesses_avg": [ 132.75, 105.69383851483491 ], "wc_questions_avg": [ 83.5, 49.97249243333776 ], "wc_review_avg": [ 311.5, 160.4439154346465 ], "wc_reply_reviewers_avg": [ 9.75, 16.887495373796554 ], 
"wc_reply_authors_avg": [ 301.5, 241.9106239915891 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.5222329678670935, "gs_citation": -1, "gs_cited_by_link": "", "gs_version_total": -1, "aff_unique_index": "0;1", "aff_unique_norm": "University of Kentucky;Washington University in St. Louis", "aff_unique_dep": ";", "aff_unique_url": "https://www.uky.edu;https://wustl.edu", "aff_unique_abbr": "UK;WUSTL", "aff_campus_unique_index": "1", "aff_campus_unique": ";Saint Louis", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "id": "1mjbfedaye", "title": "Learning Equi-angular Representations for Online Continual Learning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Online continual learning suffers from an underfitted solution for prompt model update due to the constraint of single-epoch learning. We confront this challenge by proposing an efficient online continual learning method with the notion of neural collapse. In particular, we induce neural collapse to form a simplex equiangular tight frame (ETF) structure in the representation space so that the learned model with single epoch can better fit the streamed data by proposing preparatory data training and residual correction in the representation space. With an extensive set of empirical validations using CIFAR10/100, TinyImageNet, and ImageNet-200, we show that our proposed method outperforms state-of-the-art methods by a noticeable margin in various online continual learning scenarios, including Disjoint and Gaussian scheduled setups.", "keywords": "Online continual learning;Neural collapse", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "", "author": "Minhyuk Seo;Hyunseo Koh;Wonje Jeung;Min Jae Lee;San Kim;Hankook Lee;Sungjun Cho;Sungik Choi;Hyunwoo Kim;Jonghyun Choi", "authorids": "~Minhyuk_Seo1;~Hyunseo_Koh1;~Wonje_Jeung1;~Min_Jae_Lee2;~San_Kim2;~Hankook_Lee1;~Sungjun_Cho1;~Sungik_Choi1;~Hyunwoo_Kim5;~Jonghyun_Choi1", "gender": "M;M;M;M;M;M;M;M;M;M", "homepage": "https://dbd05088.github.io/;;https://github.com/cryingInitial;https://98minjae.github.io/;https://mounkim.github.io/;https://hankook.github.io;https://sc782.github.io/;https://ppolon.github.io/;https://sites.google.com/view/hyunwookim/home;", "dblp": "350/4104;304/4369;374/6621;;;223/4393;254/8021;21/11103;https://dblp.org/rec/conf/cvpr/HanHOPKKK22;184/4055.html", "google_scholar": "ayDPR-gAAAAJ;Mi4cMxgAAAAJ;;YWWOFx0AAAAJ;;CgqswXUAAAAJ;https://scholar.google.com/citations?hl=en;uiGWnm4AAAAJ;5DfOhKwAAAAJ;H0QB0PwAAAAJ", "orcid": ";0000-0002-2576-1581;;;;;;0000-0002-7934-8434;;", "linkedin": "minhyuk-seo-59ba11247/;%ED%98%84%EC%84%9C-%EA%B3%A0-66298a221/;;;san-kim-1b4495316?utm_source=share&utm_campaign=share_via&utm_content=profile&utm_medium=android_app;;sungjun-cho-46982411a/;jonghyun-choi-459bb615/;hyunwoo-k-b16460193/;", "or_profile": "~Minhyuk_Seo1;~Hyunseo_Koh1;~Wonje_Jeung1;~Min_Jae_Lee2;~San_Kim2;~Hankook_Lee1;~Sungjun_Cho1;~Jonghyun_Choi1;~Hyunwoo_Eugene_Kim1;~Choi_sungik1", "aff": "Yonsei University;Gwangju Institute of Science and Technology;Yonsei University;Seoul National University;Seoul National University;LG AI Research;LG AI Research;Yonsei University;Zhejiang Lab;LG AI Research", "aff_domain": "yonsei.ac.kr;gist.ac.kr;yonsei.ac.kr;snu.ac.kr;snu.ac.kr;lgresearch.ai;lgresearch.ai;yonsei.ac.kr;zhejianglab.com;lgresearch.ai", "position": "MS 
student;PhD student;Undergrad student;PhD student;MS student;Researcher;Researcher;Associate Professor;Principal Researcher;Researcher", "bibtex": "@misc{\nseo2024learning,\ntitle={Learning Equi-angular Representations for Online Continual Learning},\nauthor={Minhyuk Seo and Hyunseo Koh and Wonje Jeung and Min Jae Lee and San Kim and Hankook Lee and Sungjun Cho and Sungik Choi and Hyunwoo Kim and Jonghyun Choi},\nyear={2024},\nurl={https://openreview.net/forum?id=1mjbfedaye}\n}", "github": "", "project": "", "reviewers": "ubjn;Ff4L;Dzox;2VjM", "site": "https://openreview.net/forum?id=1mjbfedaye", "pdf_size": 1080551, "rating": "3;3;5;6", "confidence": "5;4;5;3", "soundness": "2;2;2;3", "contribution": "2;2;2;3", "presentation": "2;3;2;3", "wc_summary": "28;55;91;73", "wc_strengths": "38;25;52;53", "wc_weaknesses": "256;181;881;38", "wc_questions": "5;104;24;36", "wc_review": "327;365;1048;200", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.25, 1.299038105676658 ], "confidence_avg": [ 4.25, 0.82915619758885 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 61.75, 23.27418097377435 ], "wc_strengths_avg": [ 42.0, 11.467344941179714 ], "wc_weaknesses_avg": [ 339.0, 322.57479752764317 ], "wc_questions_avg": [ 42.25, 37.325426990189946 ], "wc_review_avg": [ 485.0, 330.7408350960008 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 10, 0 ], "corr_rating_confidence": -0.5222329678670935, "gs_citation": 13, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=9436547253272062366&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 8, "aff_unique_index": "0;1;0;2;2;3;3;0;4;3", "aff_unique_norm": "Yonsei University;Gwangju Institute of Science and Technology;Seoul National University;LG;Zhejiang Lab", "aff_unique_dep": ";;;LG AI Research;", "aff_unique_url": "https://www.yonsei.ac.kr;https://www.gist.ac.kr;https://www.snu.ac.kr;https://www.lgaires.com;http://www.zhejianglab.com", "aff_unique_abbr": "Yonsei;GIST;SNU;LG AI;", "aff_campus_unique_index": "1", "aff_campus_unique": ";Gwangju", "aff_country_unique_index": "0;0;0;0;0;0;0;0;1;0", "aff_country_unique": "South Korea;China" }, { "title": "Unsupervised Pretraining for Fact Verification by Language Model Distillation", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19573", "id": "1mjsP8RYAw", "author_site": "Adrian Bazaga, Pietro Lio, Gos Micklem", "tldr": "", "abstract": "Fact verification aims to verify a claim using evidence from a trustworthy knowledge base. To address this challenge, algorithms must produce features for every claim that are both semantically meaningful, and compact enough to find a semantic alignment with the source information. In contrast to previous work, which tackled the alignment problem by learning over annotated corpora of claims and their corresponding labels, we propose SFAVEL ($\\underline{S}$elf-supervised $\\underline{Fa}$ct $\\underline{Ve}$rification via $\\underline{L}$anguage Model Distillation), a novel unsupervised pretraining framework that leverages pre-trained language models to distil self-supervised features into high-quality claim-fact alignments without the need for annotations. 
This is enabled by a novel contrastive loss function that encourages features to attain high-quality claim and evidence alignments whilst preserving the semantic relationships across the corpora. Notably, we present results that achieve a new state-of-the-art on FB15k-237 (+5.3\\% Hits@1) and FEVER (+8\\% accuracy) with linear evaluation.", "keywords": "Unsupervised Learning;Self-supervised Learning;Deep Features;Contrastive Learning;Large Language Models;Knowledge Distillation;Multimodality;Fact Verification", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Adri\u00e1n Bazaga;Pietro Lio;Gos Micklem", "authorids": "~Adri\u00e1n_Bazaga1;~Pietro_Lio1;~Gos_Micklem1", "gender": ";M;M", "homepage": "https://bazaga.ai/;https://www.cst.cam.ac.uk/people/pl219;http://www.micklemlab.org/", "dblp": "218/5717;l/PietroLio.html;", "google_scholar": "lrOLKgQAAAAJ;https://scholar.google.co.uk/citations?user=3YrWf7EAAAAJ;", "orcid": "0000-0002-1508-285X;0000-0002-0540-5053;0000-0002-6883-6168", "linkedin": "adrianbazaga/;;gosmicklem/", "or_profile": "~Adri\u00e1n_Bazaga1;~Pietro_Lio1;~Gos_Micklem1", "aff": "Amazon;University of Cambridge;University of Cambridge", "aff_domain": "amazon.com;cam.ac.uk;cam.ac.uk", "position": "Researcher;Full Professor;Principal Researcher", "bibtex": "@inproceedings{\nbazaga2024unsupervised,\ntitle={Unsupervised Pretraining for Fact Verification by Language Model Distillation},\nauthor={Adri{\\'a}n Bazaga and Pietro Lio and Gos Micklem},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=1mjsP8RYAw}\n}", "github": "", "project": "", "reviewers": "6mXX;bggr;kcpN;GMHM;1Hnq", "pdf_size": 857262, "rating": "5;5;6;6;8", "confidence": "3;5;4;3;3", "soundness": "3;3;3;3;4", "contribution": "3;2;2;3;3", "presentation": "3;3;2;2;4", "wc_summary": "340;93;54;82;30", "wc_strengths": "22;59;31;11;65", "wc_weaknesses": "22;231;215;225;80", "wc_questions": "3;32;34;79;16", "wc_review": "387;415;334;397;191", "wc_reply_reviewers": "0;77;0;141;31", "wc_reply_authors": "731;648;651;1436;274", "reply_reviewers": "0;1;0;1;1", "reply_authors": "2;2;2;4;2", "rating_avg": [ 6.0, 1.0954451150103321 ], "confidence_avg": [ 3.6, 0.8 ], "soundness_avg": [ 3.2, 0.39999999999999997 ], "contribution_avg": [ 2.6, 0.4898979485566356 ], "presentation_avg": [ 2.8, 0.7483314773547882 ], "wc_summary_avg": [ 119.8, 112.27537575087423 ], "wc_strengths_avg": [ 37.6, 20.99142682144308 ], "wc_weaknesses_avg": [ 154.6, 86.70547848896285 ], "wc_questions_avg": [ 32.8, 25.716920499935444 ], "wc_review_avg": [ 344.8, 81.49208550528083 ], "wc_reply_reviewers_avg": [ 49.8, 53.61119286119271 ], "wc_reply_authors_avg": [ 748.0, 378.87148216776626 ], "reply_reviewers_avg": [ 0.6, 0.48989794855663565 ], "reply_authors_avg": [ 2.4, 0.8 ], "replies_avg": [ 25, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.4564354645876385, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=18104602432207369171&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 7, "openreview": "https://openreview.net/forum?id=1mjsP8RYAw", "pdf": "https://openreview.net/pdf?id=1mjsP8RYAw", "email": "amazon.com;cam.ac.uk;cam.ac.uk", "author_num": 3, "aff_unique_index": "0;1;1", "aff_unique_norm": "Amazon;University of Cambridge", "aff_unique_dep": "Amazon.com, Inc.;", "aff_unique_url": "https://www.amazon.com;https://www.cam.ac.uk", 
"aff_unique_abbr": "Amazon;Cambridge", "aff_campus_unique_index": "1;1", "aff_campus_unique": ";Cambridge", "aff_country_unique_index": "0;1;1", "aff_country_unique": "United States;United Kingdom" }, { "title": "Dynamic Sparse No Training: Training-Free Fine-tuning for Sparse LLMs", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19572", "id": "1ndDmZdT4g", "author_site": "Yuxin Zhang, Lirui Zhao, Mingbao Lin, Sun Yunyun, Yiwu Yao, Xingjia Han, Jared Tanner, Shiwei Liu, Rongrong Ji", "tldr": "", "abstract": "The ever-increasing large language models (LLMs), though opening a potential path for the upcoming artificial general intelligence, sadly drops a daunting obstacle on the way towards their on-device deployment. As one of the most well-established pre-LLMs approaches in reducing model complexity, network pruning appears to lag behind in the era of LLMs, due mostly to its costly fine-tuning (or re-training) necessity under the massive volumes of model parameter and training data. To close this industry-academia gap, we introduce Dynamic Sparse No Training ($\\texttt{DSNT}$), a training-free fine-tuning approach that slightly updates sparse LLMs without the expensive backpropagation and any weight updates. Inspired by the Dynamic Sparse Training, $\\texttt{DSNT}$ minimizes the reconstruction error between the dense and sparse LLMs, in the fashion of performing iterative weight pruning-and-growing on top of sparse LLMs. To accomplish this purpose, $\\texttt{DSNT}$ particularly takes into account the anticipated reduction in reconstruction error for pruning and growing, as well as the variance w.r.t. different input data for growing each weight. This practice can be executed efficiently in linear time since its obviates the need of backpropagation for fine-tuning LLMs. Extensive experiments on LLaMA-V1/V2, Vicuna, and OPT across various benchmarks demonstrate the effectiveness of $\\texttt{DSNT}$ in enhancing the performance of sparse LLMs, especially at high sparsity levels. For instance, $\\texttt{DSNT}$ is able to outperform the state-of-the-art Wanda by 26.79 perplexity at 70% sparsity with LLaMA-7B. Our paper offers fresh insights into how to fine-tune sparse LLMs in an efficient training-free manner and open new venues to scale the great potential of sparsity to LLMs. 
Codes are available at https://github.com/zyxxmu/DSnoT.", "keywords": "Large Language Models;Network Sparsity", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/3090439d99611546cd406d681bd91e7b43574421.zip", "author": "Yuxin Zhang;Lirui Zhao;Mingbao Lin;Sun Yunyun;Yiwu Yao;Xingjia Han;Jared Tanner;Shiwei Liu;Rongrong Ji", "authorids": "~Yuxin_Zhang3;~Lirui_Zhao1;~Mingbao_Lin1;~Sun_Yunyun1;~Yiwu_Yao1;~Xingjia_Han1;~Jared_Tanner1;~Shiwei_Liu2;~Rongrong_Ji5", "gender": ";M;M;;M;M;;M;M", "homepage": ";https://github.com/Lirui-Zhao;http://lmb.bjbxit.cn/;https://scholar.google.com/;https://blog.csdn.net/nature553863/article/details/80568658;;http://people.maths.ox.ac.uk/tanner/publications.shtml;https://shiweiliuiiiiiii.github.io/;http://mac.xmu.edu.cn/rrji-en.html", "dblp": "03/7346-2;;211/5903;;133/4368;;85/1256;234/8697-3.html;86/5681", "google_scholar": "6IeJLJoAAAAJ;;Dp3L1bsAAAAJ;;4tYZsLgAAAAJ;https://scholar.google.com/citations?hl=zh-CN;https://scholar.google.co.uk/citations?user=J7248tkAAAAJ;73IbXtsAAAAJ;", "orcid": "0000-0002-4409-7030;;0000-0003-1764-1894;;;;;;", "linkedin": ";;mingbao-lin-890444105/;;;;;;", "or_profile": "~Yuxin_Zhang3;~Lirui_Zhao1;~Mingbao_Lin1;~Sun_Yunyun1;~Yiwu_Yao1;~Xingjia_Han1;~Jared_Tanner1;~Shiwei_Liu2;~Rongrong_Ji5", "aff": "Xiamen University;Xiamen University;Xiamen University;;Huawei Technologies Ltd.;;University of Oxford;University of Oxford;Xiamen University", "aff_domain": "xmu.edu.cn;xmu.edu.cn;xmu.edu.cn;;huawei.com;;ox.ac.uk;ox.ac.uk;xmu.edu.cn", "position": "PhD student;MS student;PhD student;;Researcher;;Full Professor;Postdoc;Full Professor", "bibtex": "@inproceedings{\nzhang2024dynamic,\ntitle={Dynamic Sparse No Training: Training-Free Fine-tuning for Sparse {LLM}s},\nauthor={Yuxin Zhang and Lirui Zhao and Mingbao Lin and Sun Yunyun and Yiwu Yao and Xingjia Han and Jared Tanner and Shiwei Liu and Rongrong Ji},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=1ndDmZdT4g}\n}", "github": "", "project": "", "reviewers": "nrCN;s71w;CfsK", "pdf_size": 524223, "rating": "6;6;6", "confidence": "5;4;2", "soundness": "3;3;3", "contribution": "3;2;3", "presentation": "3;3;3", "wc_summary": "93;79;105", "wc_strengths": "59;82;120", "wc_weaknesses": "90;244;61", "wc_questions": "131;55;3", "wc_review": "373;460;289", "wc_reply_reviewers": "0;122;0", "wc_reply_authors": "559;1437;628", "reply_reviewers": "0;2;0", "reply_authors": "2;5;2", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 3.6666666666666665, 1.247219128924647 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 92.33333333333333, 10.624918300339486 ], "wc_strengths_avg": [ 87.0, 25.152865973217974 ], "wc_weaknesses_avg": [ 131.66666666666666, 80.30912498312726 ], "wc_questions_avg": [ 63.0, 52.56107558513873 ], "wc_review_avg": [ 374.0, 69.81403870282824 ], "wc_reply_reviewers_avg": [ 40.666666666666664, 57.51135153650587 ], "wc_reply_authors_avg": [ 874.6666666666666, 398.62625213210544 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.9428090415820634 ], "reply_authors_avg": [ 3.0, 1.4142135623730951 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 9, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 55, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6652760928495592428&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "openreview": 
"https://openreview.net/forum?id=1ndDmZdT4g", "pdf": "https://openreview.net/pdf?id=1ndDmZdT4g", "email": "xmu.edu.cn;xmu.edu.cn;xmu.edu.cn;;huawei.com;;ox.ac.uk;ox.ac.uk;xmu.edu.cn", "author_num": 9, "aff_unique_index": "0;0;0;1;2;2;0", "aff_unique_norm": "Xiamen University;Huawei;University of Oxford", "aff_unique_dep": ";Huawei Technologies;", "aff_unique_url": "https://www.xmu.edu.cn;https://www.huawei.com;https://www.ox.ac.uk", "aff_unique_abbr": "XMU;Huawei;Oxford", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;1;1;0", "aff_country_unique": "China;United Kingdom" }, { "id": "1nfqABOIwQ", "title": "RIME: Robust Preference-based Reinforcement Learning with Noisy Human Preferences", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Designing an effective reward function remains a significant challenge in numerous reinforcement learning (RL) applications. Preference-based Reinforcement Learning (PbRL) presents a novel framework that circumvents the need for reward engineering by harnessing human preferences as the reward signal. However, current PbRL algorithms primarily focus on feedback efficiency, which heavily depends on high-quality feedback from domain experts. This over-reliance results in a lack of robustness, leading to a severe performance degradation under noisy feedback conditions, thereby limiting the broad applicability of PbRL. In this paper, we present RIME, a robust PbRL algorithm for effective reward learning from noisy human preferences. Our method incorporates a sample selection-based discriminator to dynamically filter denoised preferences for robust training. To mitigate the accumulated error caused by incorrect selection, we propose to warm start the reward model for a good initialization, which additionally bridges the performance gap during transition from pre-training to online training in PbRL. Our experiments on robotic manipulation and locomotion tasks demonstrate that RIME significantly enhances the robustness of the current state-of-the-art PbRL method. 
Ablation studies further demonstrate that the warm start is crucial for both robustness and feedback-efficiency in limited-feedback cases.", "keywords": "preference-based reinforcement learning;human-in-the-loop reinforcement learning;deep reinforcement learning", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/dd3275fefb31a0dff17fa8bd0b3ea43339f41ec3.zip", "author": "Jie Cheng;Gang Xiong;Xingyuan Dai;Qinghai Miao;Yisheng Lv;Fei-Yue Wang", "authorids": "~Jie_Cheng4;~Gang_Xiong2;~Xingyuan_Dai1;~Qinghai_Miao1;~Yisheng_Lv1;~Fei-Yue_Wang2", "gender": "M;;M;M;M;M", "homepage": ";;;https://people.ucas.edu.cn/~lvyisheng;http://www.ia.cas.cn/sourcedb_ia_cas/en/iaexpert/200908/t20090804_2310468.html;https://teacher.ucas.ac.cn/~gxiong", "dblp": ";203/8062;33/1250;;;96/372-1", "google_scholar": ";R4Rn7dMAAAAJ;;RRKqjKAAAAAJ;;", "orcid": "0009-0008-5373-7563;;0000-0003-1213-1123;;;", "linkedin": ";;;;;", "or_profile": "~Jie_Cheng4;~Xingyuan_Dai1;~Qinghai_Miao1;~Yisheng_Lv1;~Fei-Yue_Wang2;~Xiong_Gang1", "aff": "University of Chinese Academy of Sciences;Institute of Automation, Chinese Academy of Sciences;University of Chinese Academy of Sciences;University of Chinese Academy of Sciences;Institute of Automation, Chinese Academy of Sciences;Institute of Automation, Chinese Academy of Science", "aff_domain": "ucas.ac.cn;ia.ac.cn;ucas.ac.cn;ucas.ac.cn;ia.ac.cn;ia.ac.cn", "position": "PhD student;Assistant Professor;Associate Professor;Full Professor;Full Professor;Full Professor", "bibtex": "@misc{\nanonymous2024rime,\ntitle={{RIME}: Robust Preference-based Reinforcement Learning with Noisy Human Preferences},\nauthor={Anonymous},\nyear={2024},\nurl={https://openreview.net/forum?id=1nfqABOIwQ}\n}", "github": "", "project": "", "reviewers": "dSpC;vzpZ;z4ZA", "site": "https://openreview.net/forum?id=1nfqABOIwQ", "pdf_size": 21682849, "rating": "3;6;8", "confidence": "5;3;4", "soundness": "1;3;3", "contribution": "2;2;2", "presentation": "2;3;3", "wc_summary": "86;15;68", "wc_strengths": "90;36;95", "wc_weaknesses": "586;99;163", "wc_questions": "226;4;379", "wc_review": "988;154;705", "wc_reply_reviewers": "716;0;946", "wc_reply_authors": "2483;239;2327", "reply_reviewers": "1;0;2", "reply_authors": "6;1;6", "rating_avg": [ 5.666666666666667, 2.0548046676563256 ], "confidence_avg": [ 4.0, 0.816496580927726 ], "soundness_avg": [ 2.3333333333333335, 0.9428090415820634 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 56.333333333333336, 30.136725472788548 ], "wc_strengths_avg": [ 73.66666666666667, 26.71246067953223 ], "wc_weaknesses_avg": [ 282.6666666666667, 216.0745756034759 ], "wc_questions_avg": [ 203.0, 153.95453874439687 ], "wc_review_avg": [ 615.6666666666666, 346.2892175945163 ], "wc_reply_reviewers_avg": [ 554.0, 402.8332988553288 ], "wc_reply_authors_avg": [ 1683.0, 1023.0464310088765 ], "reply_reviewers_avg": [ 1.0, 0.816496580927726 ], "reply_authors_avg": [ 4.333333333333333, 2.357022603955158 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.5960395606792698, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=13128103223629693214&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 0, "aff_unique_index": "0;1;0;0;1;1", "aff_unique_norm": "University of Chinese Academy of Sciences;Chinese Academy of Sciences", "aff_unique_dep": ";Institute of Automation", "aff_unique_url": "http://www.ucas.ac.cn;http://www.ia.cas.cn", 
"aff_unique_abbr": "UCAS;CAS", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "China" }, { "title": "Self-Alignment with Instruction Backtranslation", "status": "Oral", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19571", "id": "1oijHJBRsT", "author_site": "Xian Li, Ping Yu, Chunting Zhou, Timo Schick, Omer Levy, Luke Zettlemoyer, Jason E Weston, Mike Lewis", "tldr": "", "abstract": "We present a scalable method to build a high quality instruction following language model by automatically labelling human-written text with corresponding instructions. Our approach, named instruction backtranslation, starts with a language model finetuned on a small amount of seed data, and a given web corpus. The seed model is used to construct training examples by generating instruction prompts for web documents (self-augmentation), and then selecting high quality examples from among these candidates (self-curation). This data is then used to finetune a stronger model. Finetuning LLaMa on two iterations of our approach yields a model that outperforms all other LLaMa-based models on the Alpaca leaderboard not relying on distillation data, demonstrating highly effective self-alignment.", "keywords": "large language models;self-supervised learning;data augmentation", "primary_area": "generative models", "supplementary_material": "", "author": "Xian Li;Ping Yu;Chunting Zhou;Timo Schick;Omer Levy;Luke Zettlemoyer;Jason E Weston;Mike Lewis", "authorids": "~Xian_Li1;~Ping_Yu2;~Chunting_Zhou1;~Timo_Schick1;~Omer_Levy1;~Luke_Zettlemoyer1;~Jason_E_Weston1;~Mike_Lewis1", "gender": ";F;F;;M;M;;M", "homepage": ";https://yuping1.wixsite.com/mysite;https://violet-zct.github.io/;http://timoschick.com;;https://www.cs.washington.edu/people/faculty/lsz/;;", "dblp": "82/1763-3.html;;161/2679;203/9176;117/4866;21/6793;;19/6214", "google_scholar": "v_sIgawAAAAJ;-V7TJhwAAAAJ;mR5W7EgAAAAJ;;PZVd2h8AAAAJ;https://scholar.google.com.tw/citations?user=UjpbO6IAAAAJ;;SnQnQicAAAAJ", "orcid": ";;;;0000-0001-7300-8191;;;", "linkedin": ";ping-yu-05ba8212b/;;;;luke-zettlemoyer-a0109b226/;;", "or_profile": "~Xian_Li1;~Ping_Yu2;~Chunting_Zhou1;~Timo_Schick1;~Omer_Levy1;~Luke_Zettlemoyer1;~Jason_E_Weston1;~Mike_Lewis1", "aff": "Facebook AI;Meta Facebook;Meta AI;Meta Facebook;Tel Aviv University;Meta;;Facebook AI Research", "aff_domain": "fb.com;fb.com;meta.com;fb.com;tau.ac.il;meta.com;;fb.com", "position": "Principal Researcher;Researcher;Researcher;Researcher;Senior Lecturer;Researcher;;Research Scientist", "bibtex": "@inproceedings{\nli2024selfalignment,\ntitle={Self-Alignment with Instruction Backtranslation},\nauthor={Xian Li and Ping Yu and Chunting Zhou and Timo Schick and Omer Levy and Luke Zettlemoyer and Jason E Weston and Mike Lewis},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=1oijHJBRsT}\n}", "github": "", "project": "", "reviewers": "Fnnk;XACc;bTHF;HdQC", "pdf_size": 1785904, "rating": "8;8;8;8", "confidence": "4;4;5;4", "soundness": "4;3;4;4", "contribution": "3;4;3;4", "presentation": "4;4;4;4", "wc_summary": "179;89;81;101", "wc_strengths": "22;101;70;66", "wc_weaknesses": "4;154;17;88", "wc_questions": "97;47;52;127", "wc_review": "302;391;220;382", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "240;200;186;778", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 8.0, 0.0 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], 
"soundness_avg": [ 3.75, 0.4330127018922193 ], "contribution_avg": [ 3.5, 0.5 ], "presentation_avg": [ 4.0, 0.0 ], "wc_summary_avg": [ 112.5, 39.04804732633887 ], "wc_strengths_avg": [ 64.75, 28.154706533721853 ], "wc_weaknesses_avg": [ 65.75, 60.15137155543504 ], "wc_questions_avg": [ 80.75, 33.04826016600571 ], "wc_review_avg": [ 323.75, 69.19673041408821 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 351.0, 247.3236745643247 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 230, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14196853842712224571&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=1oijHJBRsT", "pdf": "https://openreview.net/pdf?id=1oijHJBRsT", "email": "fb.com;fb.com;meta.com;fb.com;tau.ac.il;meta.com;;fb.com", "author_num": 8, "aff_unique_index": "0;0;0;0;1;0;0", "aff_unique_norm": "Meta;Tel Aviv University", "aff_unique_dep": "Facebook AI;", "aff_unique_url": "https://www.facebook.com;https://www.tau.ac.il", "aff_unique_abbr": "Facebook AI;TAU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;1;0;0", "aff_country_unique": "United States;Israel" }, { "title": "Theoretical Analysis of Robust Overfitting for Wide DNNs: An NTK Approach", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19570", "id": "1op5YGZu8X", "author_site": "Shaopeng Fu, Di Wang", "tldr": "", "abstract": "Adversarial training (AT) is a canonical method for enhancing the robustness of deep neural networks (DNNs). However, recent studies empirically demonstrated that it suffers from robust overfitting, i.e., a long time AT can be detrimental to the robustness of DNNs. This paper presents a theoretical explanation of robust overfitting for DNNs. Specifically, we non-trivially extend the neural tangent kernel (NTK) theory to AT and prove that an adversarially trained wide DNN can be well approximated by a linearized DNN. Moreover, for squared loss, closed-form AT dynamics for the linearized DNN can be derived, which reveals a new AT degeneration phenomenon: a long-term AT will result in a wide DNN degenerates to that obtained without AT and thus cause robust overfitting. Based on our theoretical results, we further design a method namely Adv-NTK, the first AT algorithm for infinite-width DNNs. Experiments on real-world datasets show that Adv-NTK can help infinite-width DNNs enhance comparable robustness to that of their finite-width counterparts, which in turn justifies our theoretical findings. 
The code is available at https://github.com/fshp971/adv-ntk.", "keywords": "NTK;neural tangent kernels;adversarial training;robust overfitting", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/ab6939d672fe71286dded0968cc514e328a5cd05.zip", "author": "Shaopeng Fu;Di Wang", "authorids": "~Shaopeng_Fu1;~Di_Wang1", "gender": ";", "homepage": "https://shaopengfu.me;", "dblp": "278/8181;", "google_scholar": "i7cWm4gAAAAJ;", "orcid": ";", "linkedin": ";", "or_profile": "~Shaopeng_Fu1;~Di_Wang1", "aff": "King Abdullah University of Science and Technology;", "aff_domain": "kaust.edu.sa;", "position": "PhD student;", "bibtex": "@inproceedings{\nfu2024theoretical,\ntitle={Theoretical Analysis of Robust Overfitting for Wide {DNN}s: An {NTK} Approach},\nauthor={Shaopeng Fu and Di Wang},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=1op5YGZu8X}\n}", "github": "", "project": "", "reviewers": "edb8;s7R7;gmGK;S6eo;4ePw", "pdf_size": 878700, "rating": "6;6;6;6;8", "confidence": "3;4;3;2;3", "soundness": "3;3;3;3;4", "contribution": "2;2;3;2;3", "presentation": "3;3;2;3;3", "wc_summary": "49;136;96;81;75", "wc_strengths": "18;30;67;52;36", "wc_weaknesses": "347;86;40;176;161", "wc_questions": "20;37;26;6;31", "wc_review": "434;289;229;315;303", "wc_reply_reviewers": "32;97;0;64;27", "wc_reply_authors": "2212;792;702;1316;668", "reply_reviewers": "1;2;0;2;1", "reply_authors": "6;4;3;5;2", "rating_avg": [ 6.4, 0.7999999999999999 ], "confidence_avg": [ 3.0, 0.6324555320336759 ], "soundness_avg": [ 3.2, 0.39999999999999997 ], "contribution_avg": [ 2.4, 0.4898979485566356 ], "presentation_avg": [ 2.8, 0.39999999999999997 ], "wc_summary_avg": [ 87.4, 28.653795560099887 ], "wc_strengths_avg": [ 40.6, 17.153425313913253 ], "wc_weaknesses_avg": [ 162.0, 104.95903962975271 ], "wc_questions_avg": [ 24.0, 10.601886624558858 ], "wc_review_avg": [ 314.0, 66.89095604040952 ], "wc_reply_reviewers_avg": [ 44.0, 33.40059879702758 ], "wc_reply_authors_avg": [ 1138.0, 585.8108909878682 ], "reply_reviewers_avg": [ 1.2, 0.7483314773547883 ], "reply_authors_avg": [ 4.0, 1.4142135623730951 ], "replies_avg": [ 33, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=18088651160665427077&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=1op5YGZu8X", "pdf": "https://openreview.net/pdf?id=1op5YGZu8X", "email": "kaust.edu.sa;", "author_num": 2, "aff_unique_index": "0", "aff_unique_norm": "King Abdullah University of Science and Technology", "aff_unique_dep": "", "aff_unique_url": "https://www.kast.kau.edu.sa", "aff_unique_abbr": "KAUST", "aff_country_unique_index": "0", "aff_country_unique": "Saudi Arabia" }, { "title": "Convolutional Deep Kernel Machines", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19569", "id": "1oqedRt6Z7", "author_site": "Edward Milsom, Ben Anson, Laurence Aitchison", "tldr": "", "abstract": "Standard infinite-width limits of neural networks sacrifice the ability for intermediate layers to learn representations from data. Recent work (\u201cA theory of representation learning gives a deep generalisation of kernel methods\u201d, Yang et al. 2023) modified the Neural Network Gaussian Process (NNGP) limit of Bayesian neural networks so that representation learning is retained. 
Furthermore, they found that applying this modified limit to a deep Gaussian process gives a practical learning algorithm which they dubbed the \u201cdeep kernel machine\u201d (DKM). However, they only considered the simplest possible setting: regression in small, fully connected networks with e.g. 10 input features. Here, we introduce convolutional deep kernel machines. This required us to develop a novel inter-domain inducing point approximation, as well as introducing and experimentally assessing a number of techniques not previously seen in DKMs, including analogues to batch normalisation, different likelihoods, and different types of top-layer. The resulting model trains in roughly 77 GPU hours, achieving around 99\\% test accuracy on MNIST, 72\\% on CIFAR-100, and 92.7\\% on CIFAR-10, which is SOTA for kernel methods.", "keywords": "Gaussian process;infinite-width neural network;NNGP;Bayesian deep learning", "primary_area": "probabilistic methods (Bayesian methods, variational inference, sampling, UQ, etc.)", "supplementary_material": "", "author": "Edward Milsom;Ben Anson;Laurence Aitchison", "authorids": "~Edward_Milsom1;~Ben_Anson1;~Laurence_Aitchison1", "gender": "M;M;", "homepage": ";;http://www.gatsby.ucl.ac.uk/~laurence/", "dblp": "348/6212;;155/1918.html", "google_scholar": ";https://scholar.google.com/citations?hl=en;", "orcid": "0000-0003-0404-4564;;", "linkedin": ";ben-anson-7b7519183/;", "or_profile": "~Edward_Milsom1;~Ben_Anson1;~Laurence_Aitchison1", "aff": "University of Bristol;University of Bristol;University of Bristol", "aff_domain": "bristol.ac.uk;bristol.ac.uk;bristol.ac.uk", "position": "PhD student;PhD student;Assistant Professor", "bibtex": "@inproceedings{\nmilsom2024convolutional,\ntitle={Convolutional Deep Kernel Machines},\nauthor={Edward Milsom and Ben Anson and Laurence Aitchison},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=1oqedRt6Z7}\n}", "github": "", "project": "", "reviewers": "hjfZ;3QEZ;5yKS;jw8S", "pdf_size": 405912, "rating": "5;5;5;8", "confidence": "4;3;4;3", "soundness": "3;2;3;3", "contribution": "2;3;2;3", "presentation": "3;1;2;4", "wc_summary": "106;49;89;119", "wc_strengths": "42;32;47;46", "wc_weaknesses": "23;139;225;75", "wc_questions": "538;17;4;101", "wc_review": "709;237;365;341", "wc_reply_reviewers": "250;0;0;62", "wc_reply_authors": "1102;445;448;680", "reply_reviewers": "1;0;0;1", "reply_authors": "2;1;1;2", "rating_avg": [ 5.75, 1.299038105676658 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.5, 1.118033988749895 ], "wc_summary_avg": [ 90.75, 26.34743820563965 ], "wc_strengths_avg": [ 41.75, 5.931905258852336 ], "wc_weaknesses_avg": [ 115.5, 75.39728111808807 ], "wc_questions_avg": [ 165.0, 218.5463337601434 ], "wc_review_avg": [ 413.0, 177.53872816937718 ], "wc_reply_reviewers_avg": [ 78.0, 102.4792661956554 ], "wc_reply_authors_avg": [ 668.75, 267.6876678145633 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=7905167758364695693&as_sdt=80000005&sciodt=0,23&hl=en", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=1oqedRt6Z7", "pdf": "https://openreview.net/pdf?id=1oqedRt6Z7", "email": 
"bristol.ac.uk;bristol.ac.uk;bristol.ac.uk", "author_num": 3, "aff_unique_index": "0;0;0", "aff_unique_norm": "University of Bristol", "aff_unique_dep": "", "aff_unique_url": "https://www.bristol.ac.uk", "aff_unique_abbr": "Bristol", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United Kingdom" }, { "id": "1p4q1cXOX9", "title": "Attribute-Enhanced Similarity Ranking for Sparse Link Prediction", "track": "main", "status": "Reject", "tldr": "", "abstract": "Link prediction is a fundamental problem in graph data. In its most realistic setting, the problem consists of predicting missing or future links between random pairs of nodes from the set of disconnected pairs. Graph Neural Networks (GNNs) have become the predominant framework for link prediction. GNN-based methods treat link prediction as a binary classification problem and handle the extreme class imbalance---real graphs are very sparse---by sampling (uniformly at random) a balanced number of disconnected pairs not only for training but also for evaluation. However, we show that the reported performance of GNNs for link prediction in the balanced setting does not translate to the more realistic imbalanced setting and that simpler topology-based approaches are often better at handling sparsity. These findings motivate Gelato, a similarity-based link-prediction method that applies (1) graph learning based on node attributes to enhance a topological heuristic, (2) a ranking loss for addressing class imbalance, and (3) a negative sampling scheme that efficiently selects hard training pairs via graph partitioning. Experiments show that Gelato is more accurate and faster than GNN-based alternatives.", "keywords": "Link Prediction;Graph Neural Networks;Graph Learning;Network Science", "primary_area": "learning on graphs and other geometries & topologies", "supplementary_material": "", "author": "Zexi Huang;Joao Pedro Rodrigues Mattos;Mert Kosan;Arlei Lopes da Silva;Ambuj Singh", "authorids": "~Zexi_Huang1;~Joao_Pedro_Rodrigues_Mattos1;~Mert_Kosan1;~Arlei_Lopes_da_Silva1;~Ambuj_Singh1", "gender": "M;M;M;M;", "homepage": "https://zexihuang.com/;https://joaopedromattos.github.io/;https://www.mertkosan.com;https://cs.rice.edu/~al110/index.html;", "dblp": "299/4829;249/6600;304/8019;19/2546;", "google_scholar": "56TmFA4AAAAJ;4fBin7kAAAAJ;12lDpTAAAAAJ;atGtis4AAAAJ;", "orcid": "0000-0002-1480-4494;0000-0002-6877-1608;0000-0002-8092-5024;0000-0003-1792-0076;", "linkedin": "zexihuang/;joaopedromattos/;https://linkedin.com/in/mertkosan;;", "or_profile": "~Zexi_Huang1;~Joao_Pedro_Rodrigues_Mattos1;~Mert_Kosan1;~Arlei_Lopes_da_Silva1;~Ambuj_Singh1", "aff": "UC Santa Barbara;Rice University;VISA;Rice University;", "aff_domain": "ucsb.edu;rice.edu;visa.com;rice.edu;", "position": "PhD student;PhD student;Researcher;Assistant Professor;", "bibtex": "@misc{\nhuang2024attributeenhanced,\ntitle={Attribute-Enhanced Similarity Ranking for Sparse Link Prediction},\nauthor={Zexi Huang and Joao Pedro Rodrigues Mattos and Mert Kosan and Arlei Lopes da Silva and Ambuj Singh},\nyear={2024},\nurl={https://openreview.net/forum?id=1p4q1cXOX9}\n}", "github": "", "project": "", "reviewers": "554z;6oyf;LQFc;4LRj", "site": "https://openreview.net/forum?id=1p4q1cXOX9", "pdf_size": 3036908, "rating": "3;3;3;5", "confidence": "4;4;4;4", "soundness": "2;1;2;3", "contribution": "2;1;2;2", "presentation": "3;2;3;3", "wc_summary": "58;32;158;86", "wc_strengths": "22;1;67;409", "wc_weaknesses": "146;157;146;131", 
"wc_questions": "3;1;120;110", "wc_review": "229;191;491;736", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "481;426;422;500", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 3.5, 0.8660254037844386 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.0, 0.7071067811865476 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 83.5, 47.06113045816048 ], "wc_strengths_avg": [ 124.75, 165.83481992633514 ], "wc_weaknesses_avg": [ 145.0, 9.246621004453464 ], "wc_questions_avg": [ 58.5, 56.61492736019362 ], "wc_review_avg": [ 411.75, 219.96974223742683 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 457.25, 33.9512518178638 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:1DqsmIPgAvMJ:scholar.google.com/&scioq=Attribute-Enhanced+Similarity+Ranking+for+Sparse+Link+Prediction&hl=en&as_sdt=0,24", "gs_version_total": 3, "aff_unique_index": "0;1;2;1", "aff_unique_norm": "University of California, Santa Barbara;Rice University;VISA", "aff_unique_dep": ";;", "aff_unique_url": "https://www.ucsb.edu;https://www.rice.edu;https://www.visa.com", "aff_unique_abbr": "UCSB;Rice;VISA", "aff_campus_unique_index": "0", "aff_campus_unique": "Santa Barbara;", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "title": "ConjNorm: Tractable Density Estimation for Out-of-Distribution Detection", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19568", "id": "1pSL2cXWoz", "author_site": "Bo Peng, Yadan Luo, Yonggang Zhang, Yixuan Li, Zhen Fang", "tldr": "", "abstract": "Post-hoc out-of-distribution (OOD) detection has garnered intensive attention in reliable machine learning. Many efforts have been dedicated to deriving score functions based on logits, distances, or rigorous data distribution assumptions to identify low-scoring OOD samples. Nevertheless, these estimate scores may fail to accurately reflect the true data density or impose impractical constraints. To provide a unified perspective on density-based score design, we propose a novel theoretical framework grounded in Bregman divergence, which extends distribution considerations to encompass an exponential family of distributions. Leveraging the conjugation constraint revealed in our theorem, we introduce a \\textsc{ConjNorm} method, reframing density function design as a search for the optimal norm coefficient $p$ against the given dataset. In light of the computational challenges of normalization, we devise an unbiased and analytically tractable estimator of the partition function using the Monte Carlo-based importance sampling technique. 
Extensive experiments across OOD detection benchmarks empirically demonstrate that our proposed \\textsc{ConjNorm} has established a new state-of-the-art in a variety of OOD detection setups, outperforming the current best method by up to 13.25\\% and 28.19\\% (FPR95) on CIFAR-100 and ImageNet-1K, respectively.", "keywords": "Density-based OOD;Importance Sampling;Tractable density estimation", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/1fcdd42748538b321b841769b27d2f20625a614e.zip", "author": "Bo Peng;Yadan Luo;Yonggang Zhang;Yixuan Li;Zhen Fang", "authorids": "~Bo_Peng24;~Yadan_Luo1;~Yonggang_Zhang1;~Yixuan_Li1;~Zhen_Fang2", "gender": ";F;M;F;M", "homepage": ";https://sites.google.com/view/yadanluo/home;https://yonggangzhangben.github.io/index.html;http://pages.cs.wisc.edu/~sharonli/;https://fang-zhen.github.io/index.html", "dblp": ";182/2414;27/6859-3;144/6087-1;", "google_scholar": ";3IfL11AAAAAJ;XSbEr98AAAAJ;https://scholar.google.com/citations?hl=en;OzD6WJcAAAAJ", "orcid": ";0000-0001-6272-2971;0000-0002-4080-7592;;0000-0003-0602-6255", "linkedin": ";;;liyixuan;", "or_profile": "~Bo_Peng24;~Yadan_Luo1;~Yonggang_Zhang1;~Yixuan_Li1;~Zhen_Fang2", "aff": ";The University of Queensland;Hong Kong Baptist University;Cornell University;University of Technology Sydney", "aff_domain": ";uq.edu.au;hkbu.edu.hk;cornell.edu;uts.edu.au", "position": ";Assistant Professor;Postdoc;Graduate Student;Assistant Professor", "bibtex": "@inproceedings{\npeng2024conjnorm,\ntitle={ConjNorm: Tractable Density Estimation for Out-of-Distribution Detection},\nauthor={Bo Peng and Yadan Luo and Yonggang Zhang and Yixuan Li and Zhen Fang},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=1pSL2cXWoz}\n}", "github": "", "project": "", "reviewers": "MqR8;LYsh;EBSh;WvTp", "pdf_size": 2561923, "rating": "5;6;6;8", "confidence": "4;3;2;4", "soundness": "3;3;2;3", "contribution": "2;2;2;3", "presentation": "3;3;3;3", "wc_summary": "138;69;76;88", "wc_strengths": "59;143;60;54", "wc_weaknesses": "58;171;44;280", "wc_questions": "84;68;4;96", "wc_review": "339;451;184;518", "wc_reply_reviewers": "142;0;0;0", "wc_reply_authors": "976;1015;378;783", "reply_reviewers": "1;0;0;0", "reply_authors": "4;4;3;3", "rating_avg": [ 6.25, 1.0897247358851685 ], "confidence_avg": [ 3.25, 0.82915619758885 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 92.75, 26.994212342648563 ], "wc_strengths_avg": [ 79.0, 37.02026472082554 ], "wc_weaknesses_avg": [ 138.25, 95.51014344036973 ], "wc_questions_avg": [ 63.0, 35.482389998420345 ], "wc_review_avg": [ 373.0, 126.47727068528954 ], "wc_reply_reviewers_avg": [ 35.5, 61.48780366869514 ], "wc_reply_authors_avg": [ 788.0, 252.4866333095675 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 3.5, 0.5 ], "replies_avg": [ 22, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.20751433915982243, "gs_citation": 11, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14808389682740397945&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=1pSL2cXWoz", "pdf": "https://openreview.net/pdf?id=1pSL2cXWoz", "email": ";uq.edu.au;hkbu.edu.hk;cornell.edu;uts.edu.au", "author_num": 5, "aff_unique_index": "0;1;2;3", "aff_unique_norm": "University of Queensland;Hong 
Kong Baptist University;Cornell University;University of Technology Sydney", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.uq.edu.au;https://www.hkbu.edu.hk;https://www.cornell.edu;https://www.uts.edu.au", "aff_unique_abbr": "UQ;HKBU;Cornell;UTS", "aff_campus_unique_index": "1", "aff_campus_unique": ";Hong Kong SAR", "aff_country_unique_index": "0;1;2;0", "aff_country_unique": "Australia;China;United States" }, { "id": "1pTlvxIfuV", "title": "A Reparameterized Discrete Diffusion Model for Text Generation", "track": "main", "status": "Reject", "tldr": "", "abstract": "This work studies discrete diffusion probabilistic models with applications to natural language generation. We derive an alternative yet equivalent formulation of the sampling from discrete diffusion processes and leverage this insight to develop a family of reparameterized discrete diffusion models. The derived generic framework is highly flexible, offers a fresh perspective of the generation process in discrete diffusion models, and features more effective training and decoding techniques. We conduct extensive experiments to evaluate the text generation capability of our model, demonstrating significant improvements over existing diffusion models.", "keywords": "discrete diffusion;text generation;non-autoregressive generation", "primary_area": "generative models", "supplementary_material": "", "author": "Lin Zheng;Jianbo Yuan;Lei Yu;Lingpeng Kong", "authorids": "~Lin_Zheng1;~Jianbo_Yuan1;~Lei_Yu4;~Lingpeng_Kong1", "gender": "M;M;F;M", "homepage": "https://lzhengisme.github.io/;;;https://ikekonglp.github.io/", "dblp": ";134/6790;https://dblp.uni-trier.de/pid/01/2775-0008;144/7656", "google_scholar": "3NXH0t8AAAAJ;https://scholar.google.com/citations?hl=en;https://scholar.google.co.uk/citations?user=gX5JBc4AAAAJ;f1hBi5wAAAAJ", "orcid": ";;;", "linkedin": ";;;", "or_profile": "~Lin_Zheng1;~Jianbo_Yuan1;~Lei_Yu4;~Lingpeng_Kong1", "aff": "The University of Hong Kong;Bytedance;Google DeepMind;Department of Computer Science, The University of Hong Kong", "aff_domain": "hku.hk;bytedance.com;deepmind.com;cs.hku.hk", "position": "PhD student;Researcher;Research Scientist;Assistant Professor", "bibtex": "@misc{\nzheng2024a,\ntitle={A Reparameterized Discrete Diffusion Model for Text Generation},\nauthor={Lin Zheng and Jianbo Yuan and Lei Yu and Lingpeng Kong},\nyear={2024},\nurl={https://openreview.net/forum?id=1pTlvxIfuV}\n}", "github": "", "project": "", "reviewers": "7X9e;shFm;uT11;Z8Rn", "site": "https://openreview.net/forum?id=1pTlvxIfuV", "pdf_size": 552481, "rating": "3;5;6;8", "confidence": "4;4;5;4", "soundness": "3;3;4;4", "contribution": "2;2;3;4", "presentation": "2;3;4;4", "wc_summary": "69;58;166;171", "wc_strengths": "31;49;84;47", "wc_weaknesses": "119;402;190;35", "wc_questions": "90;7;100;32", "wc_review": "309;516;540;285", "wc_reply_reviewers": "0;195;0;0", "wc_reply_authors": "215;909;603;307", "reply_reviewers": "0;1;0;0", "reply_authors": "1;2;1;1", "rating_avg": [ 5.5, 1.8027756377319946 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 3.5, 0.5 ], "contribution_avg": [ 2.75, 0.82915619758885 ], "presentation_avg": [ 3.25, 0.82915619758885 ], "wc_summary_avg": [ 116.0, 52.673522760491345 ], "wc_strengths_avg": [ 52.75, 19.343926695477318 ], "wc_weaknesses_avg": [ 186.5, 135.9788586508947 ], "wc_questions_avg": [ 57.25, 38.931831449342326 ], "wc_review_avg": [ 412.5, 116.12170339777143 ], "wc_reply_reviewers_avg": [ 48.75, 84.43747686898277 ], "wc_reply_authors_avg": [ 508.5, 
272.06387117733954 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.16012815380508713, "gs_citation": 57, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=7982020371199540857&as_sdt=80005&sciodt=0,11&hl=en", "gs_version_total": 4, "aff_unique_index": "0;1;2;0", "aff_unique_norm": "University of Hong Kong;ByteDance;Google", "aff_unique_dep": ";;Google DeepMind", "aff_unique_url": "https://www.hku.hk;https://www.bytedance.com;https://deepmind.com", "aff_unique_abbr": "HKU;Bytedance;DeepMind", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Hong Kong SAR;", "aff_country_unique_index": "0;0;1;0", "aff_country_unique": "China;United Kingdom" }, { "id": "1qDRwhe379", "title": "Refining Corpora from a Model Calibration Perspective for Chinese Spelling Correction", "track": "main", "status": "Reject", "tldr": "", "abstract": "Chinese Spelling Correction (CSC) commonly lacks large-scale high-quality corpora, due to the labor-intensive labeling of spelling errors in real-life human writing or typing scenarios. Two data augmentation methods are widely adopted: (1) Random Replacement with the guidance of confusion sets and (2) OCR/ASR-based Generation that simulates character misusing. However, both methods inevitably introduce noisy data (e.g., false spelling errors), potentially leading to over-correction. By carefully analyzing the two types of corpora, we find that though the latter achieves more robust generalization performance, the former yields better-calibrated CSC models. We then provide a theoretical analysis of this empirical observation, based on which a corpus refining strategy is proposed. Specifically, OCR/ASR-based data samples are fed into a well-calibrated CSC model trained on random replacement-based corpora and then filtered based on prediction confidence. 
By learning a simple BERT-based model on the refined OCR/ASR-based corpus, we set up state-of-the-art performance on three widely-used benchmarks, while significantly alleviating over-correction (e.g., lowering false positive predictions).", "keywords": "Chinese Spelling Correction;Data Augmentation;Model Calibration;Corpus Refining Strategy.", "primary_area": "probabilistic methods (Bayesian methods, variational inference, sampling, UQ, etc.)", "supplementary_material": "", "author": "Yang An;Dingyao Yu;Wei Ye;xiongfeng xiao;Shaoguang Mao;Tao Ge;Shikun Zhang", "authorids": "~Yang_An4;~Dingyao_Yu1;~Wei_Ye2;~xiongfeng_xiao1;~Shaoguang_Mao1;~Tao_Ge1;~Shikun_Zhang2", "gender": "M;M;M;M;M;M;M", "homepage": "https://github.com/Anychnn;;https://se.pku.edu.cn/kcl/weiye/;https://github.com/xiaoxiongfeng;https://www.linkedin.com/in/shaoguang-mao-929733120/;https://getao.github.io/;", "dblp": ";337/0563.html;09/5394-4;;214/0365;136/7923;83/3715.html", "google_scholar": ";Loc17FgAAAAJ;RgLGFMIAAAAJ;;S6XnZsQAAAAJ;LYbs7Q8AAAAJ;uiklLscAAAAJ", "orcid": ";;;;;;", "linkedin": ";;;;;;", "or_profile": "~Yang_An4;~Dingyao_Yu1;~Wei_Ye2;~xiongfeng_xiao1;~Shaoguang_Mao1;~Tao_Ge1;~Shikun_Zhang2", "aff": ";Peking University;Peking University;;Microsoft;Tencent AI Lab;Peking University", "aff_domain": ";pku.edu.cn;pku.edu.cn;;microsoft.com;tencent.com;pku.edu.cn", "position": ";MS student;Associate Professor;;Researcher;Principal Researcher;Full Professor", "bibtex": "@misc{\nan2024refining,\ntitle={Refining Corpora from a Model Calibration Perspective for Chinese Spelling Correction},\nauthor={Yang An and Dingyao Yu and Wei Ye and xiongfeng xiao and Shaoguang Mao and Tao Ge and Shikun Zhang},\nyear={2024},\nurl={https://openreview.net/forum?id=1qDRwhe379}\n}", "github": "", "project": "", "reviewers": "DKJd;65Mo;7Y3U", "site": "https://openreview.net/forum?id=1qDRwhe379", "pdf_size": 555516, "rating": "5;6;6", "confidence": "2;4;2", "soundness": "3;3;3", "contribution": "2;3;2", "presentation": "3;3;3", "wc_summary": "26;120;123", "wc_strengths": "10;107;157", "wc_weaknesses": "305;82;150", "wc_questions": "49;51;53", "wc_review": "390;360;483", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "432;176;433", "reply_reviewers": "0;0;0", "reply_authors": "1;1;1", "rating_avg": [ 5.666666666666667, 0.4714045207910317 ], "confidence_avg": [ 2.6666666666666665, 0.9428090415820634 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 89.66666666666667, 45.03578823804711 ], "wc_strengths_avg": [ 91.33333333333333, 61.02640594220032 ], "wc_weaknesses_avg": [ 179.0, 93.32023717643814 ], "wc_questions_avg": [ 51.0, 1.632993161855452 ], "wc_review_avg": [ 411.0, 52.364109846344185 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 347.0, 120.91594876883143 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 8, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": 0.4999999999999999, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=132761082016325069&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "aff_unique_index": "0;0;1;2;0", "aff_unique_norm": "Peking University;Microsoft;Tencent", "aff_unique_dep": ";Microsoft Corporation;Tencent AI Lab", "aff_unique_url": "http://www.pku.edu.cn;https://www.microsoft.com;https://ai.tencent.com", "aff_unique_abbr": "Peking U;Microsoft;Tencent AI Lab", "aff_campus_unique_index": "", 
"aff_campus_unique": "", "aff_country_unique_index": "0;0;1;0;0", "aff_country_unique": "China;United States" }, { "id": "1qzUPE5QDZ", "title": "Rectifying Group Irregularities in Explanations for Distribution Shift", "track": "main", "status": "Reject", "tldr": "", "abstract": "It is well-known that real-world changes constituting distribution shift adversely affect model performance.\nHow to characterize those changes in an interpretable manner is poorly understood.\nExisting techniques take the form of shift explanations that elucidate how samples map from the original distribution toward the shifted one by reducing the disparity between the two distributions.\nHowever, these methods can introduce group irregularities, leading to explanations that are less feasible and robust. \nTo address these issues, we propose Group-aware Shift Explanations (GSE), an explanation method that leverages worst-group optimization to rectify group irregularities.\nWe demonstrate that GSE not only maintains group structures, but can improve feasibility and robustness over a variety of domains by up to 20% and 25% respectively.", "keywords": "explainability;distribution shift;group robust", "primary_area": "visualization or interpretation of learned representations", "supplementary_material": "/attachment/9e67dcd2c921a5ce2db0b0031ee9d132423b5ff2.zip", "author": "Adam Stein;Yinjun Wu;Eric Wong;Mayur Naik", "authorids": "~Adam_Stein2;~Yinjun_Wu1;~Eric_Wong1;~Mayur_Naik1", "gender": "M;M;M;M", "homepage": "https://www.seas.upenn.edu/~steinad/;https://wuyinjun-1993.github.io/;http://riceric22.github.io/;http://www.cis.upenn.edu/~mhnaik/", "dblp": "217/4482;169/1054;64/1811-1.html;92/6794", "google_scholar": "https://scholar.google.com/citations?hl=en;https://scholar.google.com/citations?hl=en;pWnTMRkAAAAJ;https://scholar.google.com.tw/citations?user=fmsV6nEAAAAJ", "orcid": "0000-0003-1887-100X;;;", "linkedin": "adam-stein-086135241/;;;ai4code/", "or_profile": "~Adam_Stein2;~Yinjun_Wu1;~Eric_Wong1;~Mayur_Naik1", "aff": "University of Pennsylvania;University of Pennsylvania;University of Pennsylvania;University of Pennsylvania", "aff_domain": "seas.upenn.edu;seas.upenn.edu;upenn.edu;upenn.edu", "position": "PhD student;Postdoc;Assistant Professor;Professor", "bibtex": "@misc{\nstein2024rectifying,\ntitle={Rectifying Group Irregularities in Explanations for Distribution Shift},\nauthor={Adam Stein and Yinjun Wu and Eric Wong and Mayur Naik},\nyear={2024},\nurl={https://openreview.net/forum?id=1qzUPE5QDZ}\n}", "github": "", "project": "", "reviewers": "AAG5;LTxx;3qo2;XuMW", "site": "https://openreview.net/forum?id=1qzUPE5QDZ", "pdf_size": 11872203, "rating": "5;5;5;6", "confidence": "2;4;2;3", "soundness": "3;2;3;2", "contribution": "2;2;2;3", "presentation": "2;3;3;2", "wc_summary": "37;74;58;98", "wc_strengths": "9;56;36;141", "wc_weaknesses": "89;212;155;310", "wc_questions": "4;12;75;141", "wc_review": "139;354;324;690", "wc_reply_reviewers": "0;0;375;18", "wc_reply_authors": "474;379;1916;1138", "reply_reviewers": "0;0;3;1", "reply_authors": "2;2;5;3", "rating_avg": [ 5.25, 0.4330127018922193 ], "confidence_avg": [ 2.75, 0.82915619758885 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 66.75, 22.30891077574161 ], "wc_strengths_avg": [ 60.5, 49.378639106399035 ], "wc_weaknesses_avg": [ 191.5, 81.08791525252083 ], "wc_questions_avg": [ 58.0, 55.24943438624508 ], "wc_review_avg": [ 376.75, 198.71509127391408 ], 
"wc_reply_reviewers_avg": [ 98.25, 159.9505783046751 ], "wc_reply_authors_avg": [ 976.75, 616.0874024844202 ], "reply_reviewers_avg": [ 1.0, 1.224744871391589 ], "reply_authors_avg": [ 3.0, 1.224744871391589 ], "replies_avg": [ 24, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.17407765595569782, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11382361820116394572&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "University of Pennsylvania", "aff_unique_dep": "", "aff_unique_url": "https://www.upenn.edu", "aff_unique_abbr": "UPenn", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "id": "1rgMkDWfYV", "title": "Cleaning label noise with vision-language models", "track": "main", "status": "Reject", "tldr": "", "abstract": "Current mainstream methods for learning with noisy labels often rely on sample selection, such as the common 'small-loss' strategy that considers samples with smaller losses as clean. Following this, most research focuses on developing more robust sample selection strategies. However, they are still influenced by problems such as the 'self-confirmation bias', which stems from their reliance on the in-training model. Furthermore, relying solely on visual information for sample selection can introduce biases and challenges, such as the common issue of 'hard noise', where samples are erroneously labeled as semantically similar categories.\nTo address these challenges, this paper proposes using the popular vision-language model CLIP for sample selection. Leveraging CLIP, a pre-trained model, can effectively mitigate self-confirmation bias. Additionally, CLIP's distinctive language modality supplements potential biases introduced by relying solely on visual information for sample selection.\nSpecifically, we introduce the \\textit{CLIPSelector}, which utilizes both the CLIP's zero-shot classifier and an easily-inducible classifier based on its vision encoder and noisy labels for sample selection. We theoretically and empirically demonstrate the unique advantages of the \\textit{CLIPSelector}.\nTo evaluate its effectiveness on existing benchmarks, we further introduce a semi-supervised learning method called \\textit{MixFix}, tailored for noisy datasets. \\textit{MixFix} leverages the subset selected by the \\textit{CLIPSelector} and gradually introduces missing clean samples and re-labeled noisy samples based on different thresholds.\nIn comparison to current hybrid methods involving iterative sample selection and multiple off-the-shelf techniques like model co-training, our approach simplifies the process. \nNonetheless, our approach achieves competitive or superior performance across various benchmarks, including datasets with synthetic and real-world noise. 
\nCode will be released upon acceptance.", "keywords": "Label noise;Sample selection", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/37b4a7fe849b3293f918e12b6df4a60700f12576.zip", "author": "Chen Feng;Ioannis Patras", "authorids": "~Chen_Feng3;~Ioannis_Patras2", "gender": "M;M", "homepage": "https://mrchenfeng.github.io/;http://www.eecs.qmul.ac.uk/~ioannisp/", "dblp": ";18/1556", "google_scholar": "https://scholar.google.com/citations?hl=en;https://scholar.google.com.tw/citations?user=OBYLxRkAAAAJ", "orcid": "0000-0001-9199-559X;0000-0003-3913-4738", "linkedin": "drchenfeng/;ioannis-patras-1053767/", "or_profile": "~Chen_Feng3;~Ioannis_Patras2", "aff": "Queen Mary University London;Queen Mary, University of London", "aff_domain": "qmul.ac.uk;qmul.ac.uk", "position": "PhD student;Full Professor", "bibtex": "@misc{\nfeng2024cleaning,\ntitle={Cleaning label noise with vision-language models},\nauthor={Chen Feng and Ioannis Patras},\nyear={2024},\nurl={https://openreview.net/forum?id=1rgMkDWfYV}\n}", "github": "", "project": "", "reviewers": "GWvS;tEQg;Vnif;s2nG", "site": "https://openreview.net/forum?id=1rgMkDWfYV", "pdf_size": 2218801, "rating": "3;5;5;5", "confidence": "3;5;4;4", "soundness": "2;3;3;3", "contribution": "3;3;2;3", "presentation": "1;3;3;4", "wc_summary": "100;95;53;40", "wc_strengths": "83;56;21;19", "wc_weaknesses": "250;152;57;56", "wc_questions": "209;5;42;9", "wc_review": "642;308;173;124", "wc_reply_reviewers": "0;270;0;27", "wc_reply_authors": "652;1926;457;521", "reply_reviewers": "0;4;0;1", "reply_authors": "2;6;2;2", "rating_avg": [ 4.5, 0.8660254037844386 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 2.75, 1.0897247358851685 ], "wc_summary_avg": [ 72.0, 25.971137826441105 ], "wc_strengths_avg": [ 44.75, 26.536531423680827 ], "wc_weaknesses_avg": [ 128.75, 80.12919255801846 ], "wc_questions_avg": [ 66.25, 83.65815859795146 ], "wc_review_avg": [ 311.75, 202.22558567105202 ], "wc_reply_reviewers_avg": [ 74.25, 113.55257592850987 ], "wc_reply_authors_avg": [ 889.0, 602.8237719267547 ], "reply_reviewers_avg": [ 1.25, 1.6393596310755 ], "reply_authors_avg": [ 3.0, 1.7320508075688772 ], "replies_avg": [ 25, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.816496580927726, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:1HbnjG1wCfMJ:scholar.google.com/&scioq=Cleaning+label+noise+with+vision-language+models&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1", "aff_unique_norm": "Queen Mary University of London;Queen Mary, University of London", "aff_unique_dep": ";", "aff_unique_url": "https://www.qmul.ac.uk;https://www.qmul.ac.uk", "aff_unique_abbr": "QMUL;QMUL", "aff_campus_unique_index": "0;0", "aff_campus_unique": "London", "aff_country_unique_index": "0;0", "aff_country_unique": "United Kingdom" }, { "id": "1tDoI2WBGE", "title": "A Neural Sandbox Framework for Discovering Spurious Concpets in LLM Decisions", "track": "main", "status": "Reject", "tldr": "", "abstract": "We introduce a neural sandbox framework for text classification via self-referencing defined label concepts from an Large Language Model(LLM). 
The framework draws inspiration from the define-optimize alignment problem, in which the motivations of a model are described initially and then the model is optimized to align with these predefined objectives. In our case, we design our framework to perform text classification. We take a frozen LLM as a vector embedding generator for text and provide our framework with defined concept words based on the labels along with the input text. We then optimize an operator to classify the input text based on the relevance scores to the concept operator words(cop-words). In our experiments with multiple text classification datasets and LLM models, we find, incorporating our sandbox network generally improves the accuracy by a range of 0.12\\% to 6.31\\% in accuracy and 0.3\\% to 8.82\\% in macro f1 when compared to a baseline. The framework, not only serves as a classification tool but also as a descriptive tool for the model's decision of its prediction, based on the provided cop-words. Through further evaluations involving the injection of \"foreign\" cop-words, we showcase the sandbox framework's capacity to exhibit a coherent understanding of learned concepts and construct methodologies to discover potential spurious behaviors and biases within it. Despite witnessing results confirming our network's ability to capture domain knowledge, we show evidence that the model's secondary incentives do not match human decisions.", "keywords": "Large Language Model;Spurious Corelation;NLP;AI Alignment", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/54f58403f7233d3d325631cb6ae2508c996b3119.zip", "author": "Mostafa Mushsharat;Nabeel Mohammed;Mohammad Ruhul Amin", "authorids": "~Mostafa_Mushsharat1;~Nabeel_Mohammed1;~Mohammad_Ruhul_Amin1", "gender": "M;M;M", "homepage": ";http://ece.northsouth.edu/people/dr-nabeel-mohammed/;https://ruhulsbu.github.io", "dblp": ";127/2798;193/0290.html", "google_scholar": ";https://scholar.google.com.au/citations?hl=en;N_yWGjIAAAAJ", "orcid": ";0000-0002-7661-3570;0000-0001-6540-3415", "linkedin": "mostafa-mushsharat-81965a146/;;shajibsust/", "or_profile": "~Mostafa_Mushsharat1;~Nabeel_Mohammed1;~Mohammad_Ruhul_Amin1", "aff": ";North South University;Fordham University", "aff_domain": ";northsouth.edu;fordham.edu", "position": ";Associate Professor;Assistant Professor", "bibtex": "@misc{\nmushsharat2024a,\ntitle={A Neural Sandbox Framework for Discovering Spurious Concpets in {LLM} Decisions},\nauthor={Mostafa Mushsharat and Nabeel Mohammed and Mohammad Ruhul Amin},\nyear={2024},\nurl={https://openreview.net/forum?id=1tDoI2WBGE}\n}", "github": "", "project": "", "reviewers": "cfUj;57Af;1xDE;hACj", "site": "https://openreview.net/forum?id=1tDoI2WBGE", "pdf_size": 807818, "rating": "1;1;3;3", "confidence": "4;3;3;4", "soundness": "1;1;3;2", "contribution": "2;1;3;1", "presentation": "1;1;3;1", "wc_summary": "109;264;152;72", "wc_strengths": "61;80;57;23", "wc_weaknesses": "220;215;81;84", "wc_questions": "9;20;4;4", "wc_review": "399;579;294;183", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 2.0, 1.0 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 1.75, 0.82915619758885 ], "contribution_avg": [ 1.75, 0.82915619758885 ], "presentation_avg": [ 1.5, 0.8660254037844386 ], "wc_summary_avg": [ 149.25, 72.04642600434806 ], "wc_strengths_avg": [ 55.25, 20.54720175595694 ], "wc_weaknesses_avg": [ 150.0, 67.53147414354288 ], 
"wc_questions_avg": [ 9.25, 6.53356717268599 ], "wc_review_avg": [ 363.75, 145.86873379857659 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 6, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:QlfjTFyS9-IJ:scholar.google.com/&scioq=A+Neural+Sandbox+Framework+for+Discovering+Spurious+Concpets+in+LLM+Decisions&hl=en&as_sdt=0,10", "gs_version_total": 0, "aff_unique_index": "0;1", "aff_unique_norm": "North South University;Fordham University", "aff_unique_dep": ";", "aff_unique_url": "https://www.northsouth.edu/;https://www.fordham.edu", "aff_unique_abbr": "NSU;Fordham", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1", "aff_country_unique": "Bangladesh;United States" }, { "title": "MiniGPT-4: Enhancing Vision-Language Understanding with Advanced Large Language Models", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19567", "id": "1tZbq88f27", "author_site": "Deyao Zhu, jun chen, Xiaoqian Shen, Xiang Li, Mohamed Elhoseiny", "tldr": "", "abstract": "The recent GPT-4 has demonstrated extraordinary multi-modal abilities, such as directly generating websites from handwritten text and identifying humorous elements within images. These features are rarely observed in previous vision-language models. However, the technical details behind GPT-4 continue to remain undisclosed.\nWe believe that the enhanced multi-modal generation capabilities of GPT-4 stem from the utilization of sophisticated large language models (LLM). \nTo examine this phenomenon, we present MiniGPT-4, which aligns a frozen visual encoder with a frozen advanced LLM, Vicuna, using one projection layer. \nOur work, for the first time, uncovers that properly aligning the visual features with an advanced large language model can possess numerous advanced multi-modal abilities demonstrated by GPT-4, \nsuch as detailed image description generation and website creation from hand-drawn drafts.\nFurthermore, we also observe other emerging capabilities in MiniGPT-4, including writing stories and poems inspired by given images, teaching users how to cook based on food photos, and so on. \nIn our experiment, we found that the model trained on short image caption pairs could produce unnatural language outputs (e.g., repetition and fragmentation). 
To address this problem, we curate a detailed image description dataset in the second stage to finetune the model, which consequently improves the model's generation reliability and overall usability.", "keywords": "large language models;vision language models", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Deyao Zhu;Jun Chen;Xiaoqian Shen;Xiang Li;Mohamed Elhoseiny", "authorids": "~Deyao_Zhu1;~Jun_Chen11;~Xiaoqian_Shen3;~Xiang_Li18;~Mohamed_Elhoseiny1", "gender": "M;M;F;M;M", "homepage": "https://tsutikgiau.github.io/;https://junchen14.github.io/;https://xiaoqian-shen.github.io;http://xiangli.ac.cn;http://www.mohamed-elhoseiny.com", "dblp": "251/6017;85/5901-21;197/6114;40/1491-46;125/2894", "google_scholar": "dENNKrsAAAAJ;9G2OQmkAAAAJ;uToGtIwAAAAJ;4Apl5FgAAAAJ;iRBUTOAAAAAJ", "orcid": ";0000-0001-8883-0970;;0000-0002-9946-7000;0000-0001-9659-1551", "linkedin": "deyao-zhu-205774154/;;xiaoqian-shen-759991264;;mohamed-elhoseiny-8a836215/", "or_profile": "~Deyao_Zhu1;~Jun_Chen11;~Xiaoqian_Shen3;~Xiang_Li18;~Mohamed_Elhoseiny1", "aff": "ByteDance Inc.;KAUST;Meta Facebook;King Abdullah University of Science and Technology;KAUST", "aff_domain": "bytedance.com;kaust.edu.sa;meta.com;kaust.edu.sa;kaust.edu.sa", "position": "Researcher;PhD student;Intern;Postdoc;Associate Professor", "bibtex": "@inproceedings{\nzhu2024minigpt,\ntitle={Mini{GPT}-4: Enhancing Vision-Language Understanding with Advanced Large Language Models},\nauthor={Deyao Zhu and Jun Chen and Xiaoqian Shen and Xiang Li and Mohamed Elhoseiny},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=1tZbq88f27}\n}", "github": "", "project": "", "reviewers": "TFFX;7oDs;auSX;A8a5", "pdf_size": 3623133, "rating": "5;5;6;6", "confidence": "4;4;4;4", "soundness": "3;2;3;2", "contribution": "4;3;2;3", "presentation": "2;3;3;3", "wc_summary": "81;110;108;85", "wc_strengths": "67;41;81;72", "wc_weaknesses": "92;396;466;84", "wc_questions": "63;61;55;97", "wc_review": "303;608;710;338", "wc_reply_reviewers": "95;0;121;20", "wc_reply_authors": "189;226;1024;474", "reply_reviewers": "1;0;1;1", "reply_authors": "2;1;3;2", "rating_avg": [ 5.5, 0.5 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 3.0, 0.7071067811865476 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 96.0, 13.095800853708795 ], "wc_strengths_avg": [ 65.25, 14.872373717735847 ], "wc_weaknesses_avg": [ 259.5, 173.29959607569776 ], "wc_questions_avg": [ 69.0, 16.431676725154983 ], "wc_review_avg": [ 489.75, 173.49117412710078 ], "wc_reply_reviewers_avg": [ 59.0, 50.35374861914453 ], "wc_reply_authors_avg": [ 478.25, 333.60034097704397 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 2.0, 0.7071067811865476 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 2918, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=1879282532294332322&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 10, "openreview": "https://openreview.net/forum?id=1tZbq88f27", "pdf": "https://openreview.net/pdf?id=1tZbq88f27", "email": "bytedance.com;kaust.edu.sa;meta.com;kaust.edu.sa;kaust.edu.sa", "author_num": 5, "aff_unique_index": "0;1;2;1;1", "aff_unique_norm": "ByteDance;King Abdullah University of Science and Technology;Meta", "aff_unique_dep": ";;Meta Platforms, Inc.", "aff_unique_url": 
"https://www.bytedance.com;https://www.kaust.edu.sa;https://meta.com", "aff_unique_abbr": "ByteDance;KAUST;Meta", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;2;1;1", "aff_country_unique": "China;Saudi Arabia;United States" }, { "id": "1uHTIjXjkk", "title": "Potential Based Diffusion Motion Planning", "track": "main", "status": "Reject", "tldr": "", "abstract": "Effective motion planning in high dimensional spaces is a long-standing open problem in robotics. One class of traditional motion planning algorithms corresponds to potential-based motion planning. An advantage of potential based motion planning is composability -- different motion constraints can easily combined by adding corresponding potentials. However, constructing motion paths from potentials requires solving a global optimization across configuration space potential landscape, which is often prone to local minima, causing these approaches to fall out of favor in recent years. We propose a new approach towards learning potential based motion planning, where we train a neural networks to capture and learn an easily optimizable potentials over motion planning trajectories. We illustrate the effectiveness of such approach, significantly outperforming both classical and recent learned motion planning approaches, and illustrate its inherent composability, enabling us to generalize to a multitude of different motion constraints.", "keywords": "Motion Planning;Diffusion Model;Energy-based Model;Compositionality", "primary_area": "generative models", "supplementary_material": "", "author": "Yunhao Luo;Chen Sun;Joshua B. Tenenbaum;Yilun Du", "authorids": "~Yunhao_Luo1;~Chen_Sun1;~Joshua_B._Tenenbaum1;~Yilun_Du1", "gender": "M;M;;", "homepage": "https://devinluo27.github.io/;https://chensun.me;;https://yilundu.github.io", "dblp": ";01/6072-2;t/JoshuaBTenenbaum;204/4379", "google_scholar": ";vQa7heEAAAAJ;;", "orcid": ";;;", "linkedin": ";;;", "or_profile": "~Yunhao_Luo1;~Chen_Sun1;~Joshua_B._Tenenbaum1;~Yilun_Du1", "aff": "Brown University;Google;Massachusetts Institute of Technology;Massachusetts Institute of Technology", "aff_domain": "brown.edu;google.com;mit.edu;mit.edu", "position": "MS student;Research Scientist;Professor;PhD student", "bibtex": "@misc{\nluo2024potential,\ntitle={Potential Based Diffusion Motion Planning},\nauthor={Yunhao Luo and Chen Sun and Joshua B. 
Tenenbaum and Yilun Du},\nyear={2024},\nurl={https://openreview.net/forum?id=1uHTIjXjkk}\n}", "github": "", "project": "", "reviewers": "tz1K;PtS9;i3W8;jxc2", "site": "https://openreview.net/forum?id=1uHTIjXjkk", "pdf_size": 8601846, "rating": "1;5;5;5", "confidence": "5;5;3;4", "soundness": "1;2;2;3", "contribution": "1;2;2;2", "presentation": "2;2;2;3", "wc_summary": "323;68;62;53", "wc_strengths": "2;116;13;53", "wc_weaknesses": "2;432;73;183", "wc_questions": "2;71;443;158", "wc_review": "329;687;591;447", "wc_reply_reviewers": "0;11;672;75", "wc_reply_authors": "352;532;1420;1021", "reply_reviewers": "0;1;2;1", "reply_authors": "1;2;3;3", "rating_avg": [ 4.0, 1.7320508075688772 ], "confidence_avg": [ 4.25, 0.82915619758885 ], "soundness_avg": [ 2.0, 0.7071067811865476 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 126.5, 113.57486517711567 ], "wc_strengths_avg": [ 46.0, 44.64862819841165 ], "wc_weaknesses_avg": [ 172.5, 163.11115841658412 ], "wc_questions_avg": [ 168.5, 167.84591147835565 ], "wc_review_avg": [ 513.5, 136.53845612134333 ], "wc_reply_reviewers_avg": [ 189.5, 280.0397293242514 ], "wc_reply_authors_avg": [ 831.25, 418.8862464918131 ], "reply_reviewers_avg": [ 1.0, 0.7071067811865476 ], "reply_authors_avg": [ 2.25, 0.82915619758885 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.5222329678670935, "gs_citation": 10, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6157278685220882083&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 6, "aff_unique_index": "0;1;2;2", "aff_unique_norm": "Brown University;Google;Massachusetts Institute of Technology", "aff_unique_dep": ";Google;", "aff_unique_url": "https://www.brown.edu;https://www.google.com;https://web.mit.edu", "aff_unique_abbr": "Brown;Google;MIT", "aff_campus_unique_index": "1", "aff_campus_unique": ";Mountain View", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "title": "Unified Human-Scene Interaction via Prompted Chain-of-Contacts", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19566", "id": "1vCnDyQkjg", "author_site": "Zeqi Xiao, Tai Wang, Jingbo Wang, Jinkun Cao, Wenwei Zhang, Bo DAI, Dahua Lin, Jiangmiao Pang", "tldr": "", "abstract": "Human-Scene Interaction (HSI) is a vital component of fields like embodied AI and virtual reality. Despite advancements in motion quality and physical plausibility, two pivotal factors, versatile interaction control and the development of a user-friendly interface, require further exploration before the practical application of HSI. This paper presents a unified HSI framework, UniHSI, which supports unified control of diverse interactions through language commands. The framework defines interaction as ``Chain of Contacts (CoC)\", representing steps involving human joint-object part pairs. This concept is inspired by the strong correlation between interaction types and corresponding contact regions. Based on the definition, UniHSI constitutes a Large Language Model (LLM) Planner to translate language prompts into task plans in the form of CoC, and a Unified Controller that turns CoC into uniform task execution. To facilitate training and evaluation, we collect a new dataset named ScenePlan that encompasses thousands of task plans generated by LLMs based on diverse scenarios. 
Comprehensive experiments demonstrate the effectiveness of our framework in versatile task execution and generalizability to real scanned scenes.", "keywords": "Human-Scene Interaction;Chain-of-Contacts;Unified;LLM", "primary_area": "applications to robotics, autonomy, planning", "supplementary_material": "/attachment/108d0d7943fd3252782328d667d2c70d8078786b.pdf", "author": "Zeqi Xiao;Tai Wang;Jingbo Wang;Jinkun Cao;Wenwei Zhang;Bo Dai;Dahua Lin;Jiangmiao Pang", "authorids": "~Zeqi_Xiao2;~Tai_Wang2;~Jingbo_Wang3;~Jinkun_Cao1;~Wenwei_Zhang1;~Bo_Dai2;~Dahua_Lin1;~Jiangmiao_Pang1", "gender": "M;M;M;M;M;M;M;M", "homepage": "https://github.com/xizaoqu;https://scholar.google.com/citations?user=GStTsxAAAAAJ&hl=en;https://www.jinkuncao.com;https://zhangwenwei.cn;http://daibo.info/;http://dahua.site;https://oceanpang.github.io/;https://tai-wang.github.io/", "dblp": "344/1615;10/1491-3.html;224/0126;;64/2903-2;53/6088;231/7630;", "google_scholar": ";GStTsxAAAAAJ;xDtTbmQAAAAJ;QDXADSEAAAAJ;https://scholar.google.com.hk/citations?user=KNWTvgEAAAAJ;GMzzRRUAAAAJ;https://scholar.google.com/citations?authuser=0;JmbbZWIAAAAJ", "orcid": ";;;0000-0002-2748-4514;0000-0003-0777-9232;;0000-0002-6711-9319;", "linkedin": ";;;wenweizhang-b9769a124/;;;;%E6%B3%B0-%E7%8E%8B-2b2738147/", "or_profile": "~Zeqi_Xiao2;~Jingbo_Wang3;~Jinkun_Cao1;~Wenwei_Zhang1;~Bo_Dai2;~Dahua_Lin1;~Jiangmiao_Pang1;~Tai_WANG1", "aff": "Nanyang Technological University;Shanghai Artificial Intelligence Laboratory;Carnegie Mellon University;Shanghai AI Laboratory;Shanghai AI Laboratory;The Chinese University of Hong Kong;Shanghai AI Laboratory ;Shanghai AI Laboratory", "aff_domain": "ntu.edu.sg;pjlab.org.cn;andrew.cmu.edu;pjlab.org.cn;pjlab.org.cn;cuhk.edu.hk;pjlab.org.cn;pjlab.org.cn", "position": "PhD student;Researcher;PhD student;Researcher;Scientist;Associate Professor;Research Scientist;Research Scientist", "bibtex": "@inproceedings{\nxiao2024unified,\ntitle={Unified Human-Scene Interaction via Prompted Chain-of-Contacts},\nauthor={Zeqi Xiao and Tai Wang and Jingbo Wang and Jinkun Cao and Wenwei Zhang and Bo Dai and Dahua Lin and Jiangmiao Pang},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=1vCnDyQkjg}\n}", "github": "", "project": "", "reviewers": "YGEs;gSqi;tgmd;JJQ3", "pdf_size": 1428992, "rating": "5;6;8;10", "confidence": "2;3;4;4", "soundness": "2;2;3;3", "contribution": "3;3;3;4", "presentation": "2;4;3;3", "wc_summary": "95;66;157;103", "wc_strengths": "272;43;89;71", "wc_weaknesses": "3;159;379;38", "wc_questions": "292;65;65;148", "wc_review": "662;333;690;360", "wc_reply_reviewers": "0;0;0;29", "wc_reply_authors": "738;471;1090;348", "reply_reviewers": "0;0;0;1", "reply_authors": "1;1;2;2", "rating_avg": [ 7.25, 1.920286436967152 ], "confidence_avg": [ 3.25, 0.82915619758885 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 3.25, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 105.25, 32.89661836724255 ], "wc_strengths_avg": [ 118.75, 89.98437364342767 ], "wc_weaknesses_avg": [ 144.75, 147.10944055362322 ], "wc_questions_avg": [ 142.5, 92.726749107256 ], "wc_review_avg": [ 511.25, 165.32297934649011 ], "wc_reply_reviewers_avg": [ 7.25, 12.55736835487436 ], "wc_reply_authors_avg": [ 661.75, 284.6211297497078 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": 0.9028289727756884, 
"gs_citation": 66, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=15514585984236712669&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=1vCnDyQkjg", "pdf": "https://openreview.net/pdf?id=1vCnDyQkjg", "email": "ntu.edu.sg;pjlab.org.cn;andrew.cmu.edu;pjlab.org.cn;pjlab.org.cn;cuhk.edu.hk;pjlab.org.cn;pjlab.org.cn", "author_num": 8, "aff_unique_index": "0;1;2;3;3;4;3;3", "aff_unique_norm": "Nanyang Technological University;Shanghai Artificial Intelligence Laboratory;Carnegie Mellon University;Shanghai AI Laboratory;Chinese University of Hong Kong", "aff_unique_dep": ";;;;", "aff_unique_url": "https://www.ntu.edu.sg;http://www.shailab.org/;https://www.cmu.edu;https://www.shanghai-ai-lab.com;https://www.cuhk.edu.hk", "aff_unique_abbr": "NTU;Shanghai AI Lab;CMU;SAIL;CUHK", "aff_campus_unique_index": "1", "aff_campus_unique": ";Hong Kong SAR", "aff_country_unique_index": "0;1;2;1;1;1;1;1", "aff_country_unique": "Singapore;China;United States" }, { "title": "Mastering Memory Tasks with World Models", "status": "Oral", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19565", "id": "1vDArHJ68h", "author_site": "Mohammad Reza Samsami, Artem Zholus, Janarthanan Rajendran, Sarath Chandar", "tldr": "", "abstract": "Current model-based reinforcement learning (MBRL) agents struggle with long-term dependencies. This limits their ability to effectively solve tasks involving extended time gaps between actions and outcomes, or tasks demanding the recalling of distant observations to inform current actions. To improve temporal coherence, we integrate a new family of state space models (SSMs) in world models of MBRL agents to present a new method, Recall to Imagine (R2I). This integration aims to enhance both long-term memory and long-horizon credit assignment. Through a diverse set of illustrative tasks, we systematically demonstrate that R2I not only establishes a new state-of-the-art for challenging memory and credit assignment RL tasks, such as BSuite and POPGym, but also showcases superhuman performance in the complex memory domain of Memory Maze. At the same time, it upholds comparable performance in classic RL tasks, such as Atari and DMC, suggesting the generality of our method. 
We also show that R2I is faster than the state-of-the-art MBRL method, DreamerV3, resulting in faster wall-time convergence.", "keywords": "model-based reinforcement learning;state space models;memory in reinforcement learning", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Mohammad Reza Samsami;Artem Zholus;Janarthanan Rajendran;Sarath Chandar", "authorids": "~Mohammad_Reza_Samsami1;~Artem_Zholus1;~Janarthanan_Rajendran1;~Sarath_Chandar1", "gender": "M;M;;M", "homepage": "https://mrsamsami.github.io;https://artemzholus.github.io/;;http://sarathchandar.in/", "dblp": ";;;45/8542", "google_scholar": "0_tOLp8AAAAJ;zRhDoycAAAAJ;;https://scholar.google.co.in/citations?user=yxWtZLAAAAAJ", "orcid": ";0000-0003-3167-3585;;", "linkedin": "https://linkedin.com/in/mohammadrezasamsami;azholus/;;", "or_profile": "~Mohammad_Reza_Samsami1;~Artem_Zholus1;~Janarthanan_Rajendran1;~Sarath_Chandar1", "aff": "Universit\u00e9 de Montr\u00e9al;\u00c9cole Polytechnique de Montr\u00e9al, Universit\u00e9 de Montr\u00e9al;;\u00c9cole Polytechnique de Montr\u00e9al", "aff_domain": "umontreal.ca;polymtl.ca;;polymtl.ca", "position": "MS student;PhD student;;Assistant Professor", "bibtex": "@inproceedings{\nsamsami2024mastering,\ntitle={Mastering Memory Tasks with World Models},\nauthor={Mohammad Reza Samsami and Artem Zholus and Janarthanan Rajendran and Sarath Chandar},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=1vDArHJ68h}\n}", "github": "", "project": "", "reviewers": "fFhp;pPqM;Emy3", "pdf_size": 2564812, "rating": "6;8;10", "confidence": "5;4;4", "soundness": "3;3;4", "contribution": "2;3;4", "presentation": "4;3;4", "wc_summary": "71;108;52", "wc_strengths": "44;120;139", "wc_weaknesses": "218;489;134", "wc_questions": "64;335;58", "wc_review": "397;1052;383", "wc_reply_reviewers": "156;34;208", "wc_reply_authors": "2099;1657;1009", "reply_reviewers": "1;1;2", "reply_authors": "3;3;4", "rating_avg": [ 8.0, 1.632993161855452 ], "confidence_avg": [ 4.333333333333333, 0.4714045207910317 ], "soundness_avg": [ 3.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 3.0, 0.816496580927726 ], "presentation_avg": [ 3.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 77.0, 23.25224003546038 ], "wc_strengths_avg": [ 101.0, 41.04469108991645 ], "wc_weaknesses_avg": [ 280.3333333333333, 151.4823055306754 ], "wc_questions_avg": [ 152.33333333333334, 129.18806274403047 ], "wc_review_avg": [ 610.6666666666666, 312.1221270948637 ], "wc_reply_reviewers_avg": [ 132.66666666666666, 72.92614224146388 ], "wc_reply_authors_avg": [ 1588.3333333333333, 447.6317931316119 ], "reply_reviewers_avg": [ 1.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 3.3333333333333335, 0.4714045207910317 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.8660254037844385, "gs_citation": 25, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=9099273719990278443&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=1vDArHJ68h", "pdf": "https://openreview.net/pdf?id=1vDArHJ68h", "email": "umontreal.ca;polymtl.ca;;polymtl.ca", "author_num": 4, "aff_unique_index": "0;1;1", "aff_unique_norm": "Universit\u00e9 de Montr\u00e9al;\u00c9cole Polytechnique de Montr\u00e9al", "aff_unique_dep": ";", "aff_unique_url": "https://www.umontreal.ca;https://www.polymtl.ca", "aff_unique_abbr": "UdeM;Polytechnique Montr\u00e9al", 
"aff_campus_unique_index": "1;1", "aff_campus_unique": ";Montr\u00e9al", "aff_country_unique_index": "0;0;0", "aff_country_unique": "Canada" }, { "id": "1vI5fqwpRU", "title": "RayE-Sub: Countering Subgraph Degradation via Perfect Reconstruction", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Subgraph learning has dominated most practices of improving the expressive power of Message passing neural networks (MPNNs). Existing subgraph discovery policies can be classified into node-based and partition-based, which both achieve impressive performance in most scenarios. Unfortunately, we observe that there exists a subgraph degradation trap in these two mainstream solutions. This means extracted subgraphs fail to achieve better expression. In this work, we start with an intuitive observation and theoretical analysis to explore subgraph degeneration. We then summarize the limitations of these two subgraph strategies from the perspective of reconstruction ability. To this end, we propose perfect reconstruction principle to realize high-quality subgraph extraction. To achieve this, two affiliated questions should be well-addressed. \\emph{(i) how to ensure the subgraphs possessing with 'perfect' information? (ii) how to guarantee the 'reconstruction' power of obtained subgraphs?} Firstly, we propose a subgraph partition strategy \\emph{Rayleigh-resistance} to extract non-overlap subgraphs by leveraging the graph spectral theory. Secondly, we put forward the Query mechanism to achieve subgraph-level equivariant learning, which guarantees subgraph reconstruction ability. These two parts, \\emph{perfect subgraph partition} and \\emph{equivariant subgraph learning} are seamlessly unified as a novel \\emph{\\underline{Ray}leigh-resistance \\underline{E}quivariant \\underline{Sub}graph learning} architecture (\\emph{\\textbf{RayE-Sub}}). 
A series of experiments on both synthetic and real datasets demonstrate that our approach can consistently outperform previous MPNNs architectures.", "keywords": "Graph Nerual Network;Subgraph Learning;Reconstruction ability;Expressive power", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/646a29411bb0625757457e4a8d32a566ce170f7b.zip", "author": "Kuo Yang;Zhengyang Zhou;Xu Wang;Pengkun Wang;Limin Li;Yang Wang", "authorids": "~Kuo_Yang2;~Zhengyang_Zhou1;~Xu_Wang16;~Pengkun_Wang1;~Limin_Li3;~Yang_Wang32", "gender": "M;M;M;M;M;M", "homepage": ";http://home.ustc.edu.cn/~zzy0929/Home/;http://home.ustc.edu.cn/~wx309/;http://home.ustc.edu.cn/~pengkun/index.html;http://di.ustc.edu.cn/;http://staff.ustc.edu.cn/~angyan/", "dblp": ";246/8238;181/2815-29;;;", "google_scholar": ";dPElQLUAAAAJ;7hYGPC8AAAAJ;https://scholar.google.com/citations?hl=zh-CN;;https://scholar.google.com/citations?hl=zh-CN", "orcid": "0000-0003-3346-5130;0000-0003-4728-7347;0000-0002-1492-3477;0000-0002-2680-4563;;0000-0002-6079-7053", "linkedin": "https://www.linkedin.cn/incareer/in/kuo-yang-440a241b4;;;;;", "or_profile": "~Kuo_Yang2;~Zhengyang_Zhou1;~Xu_Wang16;~Pengkun_Wang1;~Limin_Li3;~Yang_Wang32", "aff": "University of Science and Technology of China;University of Science and Technology of China;University of Science and Technology of China;University of Science and Technology of China;University of Science and Technology of China;University of Science and Technology of China", "aff_domain": "ustc.edu.cn;ustc.edu.cn;ustc.edu.cn;ustc.edu.cn;ustc.edu.cn;ustc.edu.cn", "position": "PhD student;Researcher;Associate Researcher;Researcher;PhD student;Associate Professor", "bibtex": "@misc{\nyang2024rayesub,\ntitle={RayE-Sub: Countering Subgraph Degradation via Perfect Reconstruction},\nauthor={Kuo Yang and Zhengyang Zhou and Xu Wang and Pengkun Wang and Limin Li and Yang Wang},\nyear={2024},\nurl={https://openreview.net/forum?id=1vI5fqwpRU}\n}", "github": "", "project": "", "reviewers": "7R4q;NoaS;h1tc", "site": "https://openreview.net/forum?id=1vI5fqwpRU", "pdf_size": 1079790, "rating": "3;3;6", "confidence": "4;4;3", "soundness": "2;1;3", "contribution": "2;2;3", "presentation": "1;1;3", "wc_summary": "86;50;68", "wc_strengths": "30;43;37", "wc_weaknesses": "246;84;169", "wc_questions": "5;614;10", "wc_review": "367;791;284", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 4.0, 1.4142135623730951 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.0, 0.816496580927726 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 1.6666666666666667, 0.9428090415820634 ], "wc_summary_avg": [ 68.0, 14.696938456699069 ], "wc_strengths_avg": [ 36.666666666666664, 5.312459150169743 ], "wc_weaknesses_avg": [ 166.33333333333334, 66.16309814054625 ], "wc_questions_avg": [ 209.66666666666666, 285.9141285226893 ], "wc_review_avg": [ 480.6666666666667, 222.03953601905124 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 3, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -1.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:utu08KkzN34J:scholar.google.com/&scioq=RayE-Sub:+Countering+Subgraph+Degradation+via+Perfect+Reconstruction&hl=en&as_sdt=0,22", "gs_version_total": 0, "aff_unique_index": 
"0;0;0;0;0;0", "aff_unique_norm": "University of Science and Technology of China", "aff_unique_dep": "", "aff_unique_url": "http://www.ustc.edu.cn", "aff_unique_abbr": "USTC", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "China" }, { "title": "Directly Fine-Tuning Diffusion Models on Differentiable Rewards", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19564", "id": "1vmSEVL19f", "author_site": "Kevin Clark, Paul Vicol, Kevin Swersky, David Fleet", "tldr": "", "abstract": "We present Direct Reward Fine-Tuning (DRaFT), a simple and effective method for fine-tuning diffusion models to maximize differentiable reward functions, such as scores from human preference models. We first show that it is possible to backpropagate the reward function gradient through the full sampling procedure, and that doing so achieves strong performance on a variety of rewards, outperforming reinforcement learning-based approaches. We then propose more efficient variants of DRaFT: DRaFT-K, which truncates backpropagation to only the last K steps of sampling, and DRaFT-LV, which obtains lower-variance gradient estimates for the case when K=1. We show that our methods work well for a variety of reward functions and can be used to substantially improve the aesthetic quality of images generated by Stable Diffusion 1.4. Finally, we draw connections between our approach and prior work, providing a unifying perspective on the design space of gradient-based fine-tuning algorithms.", "keywords": "diffusion models;preference-based learning", "primary_area": "generative models", "supplementary_material": "", "author": "Kevin Clark;Paul Vicol;Kevin Swersky;David J. Fleet", "authorids": "~Kevin_Clark1;~Paul_Vicol1;~Kevin_Swersky1;~David_J._Fleet1", "gender": "M;;M;M", "homepage": "http://cs.stanford.edu/~kevclark/;http://www.paulvicol.com;http://www.cs.toronto.edu/~kswersky;http://www.cs.toronto.edu/~fleet/index.html", "dblp": ";167/9924;35/9381;07/2099", "google_scholar": "Trk_R8wAAAAJ;https://scholar.google.com/citations?hl=en;https://scholar.google.ca/citations?user=IrixA8MAAAAJ;https://scholar.google.com.tw/citations?user=njOmQFsAAAAJ", "orcid": ";;;", "linkedin": ";;;", "or_profile": "~Kevin_Clark1;~Paul_Vicol1;~Kevin_Swersky1;~David_J._Fleet1", "aff": "Google;Google;Google Deepmind;Department of Computer Science, University of Toronto", "aff_domain": "google.com;google.com;google.com;cs.toronto.edu", "position": "Researcher;Researcher;Research Scientist;Full Professor", "bibtex": "@inproceedings{\nclark2024directly,\ntitle={Directly Fine-Tuning Diffusion Models on Differentiable Rewards},\nauthor={Kevin Clark and Paul Vicol and Kevin Swersky and David J. 
Fleet},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=1vmSEVL19f}\n}", "github": "", "project": "", "reviewers": "LgKe;tWnQ;m5FM;pZzS", "pdf_size": 28948707, "rating": "3;5;8;8", "confidence": "5;4;4;4", "soundness": "3;4;4;3", "contribution": "2;2;3;3", "presentation": "3;4;4;3", "wc_summary": "62;66;109;111", "wc_strengths": "80;138;125;123", "wc_weaknesses": "131;76;121;79", "wc_questions": "61;20;210;1", "wc_review": "334;300;565;314", "wc_reply_reviewers": "0;0;117;5", "wc_reply_authors": "636;371;793;94", "reply_reviewers": "0;0;1;1", "reply_authors": "1;1;2;2", "rating_avg": [ 6.0, 2.1213203435596424 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 3.5, 0.5 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.5, 0.5 ], "wc_summary_avg": [ 87.0, 23.054283766797006 ], "wc_strengths_avg": [ 116.5, 21.84605227495348 ], "wc_weaknesses_avg": [ 101.75, 24.529319191530774 ], "wc_questions_avg": [ 73.0, 82.01524248577212 ], "wc_review_avg": [ 378.25, 108.49510357615223 ], "wc_reply_reviewers_avg": [ 30.5, 49.98249693642766 ], "wc_reply_authors_avg": [ 473.5, 265.9948307768405 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.8164965809277261, "gs_citation": 135, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=4389730101296429648&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=1vmSEVL19f", "pdf": "https://openreview.net/pdf?id=1vmSEVL19f", "email": "google.com;google.com;google.com;cs.toronto.edu", "author_num": 4, "aff_unique_index": "0;0;1;2", "aff_unique_norm": "Google;DeepMind;University of Toronto", "aff_unique_dep": "Google;DeepMind;Department of Computer Science", "aff_unique_url": "https://www.google.com;https://deepmind.com;https://www.utoronto.ca", "aff_unique_abbr": "Google;DeepMind;U of T", "aff_campus_unique_index": "0;0;2", "aff_campus_unique": "Mountain View;;Toronto", "aff_country_unique_index": "0;0;1;2", "aff_country_unique": "United States;United Kingdom;Canada" }, { "id": "1vqHTUTod9", "title": "Can Language Models be Instructed to Protect Personal Information?", "track": "main", "status": "Reject", "tldr": "", "abstract": "Large multimodal language models have proven transformative in numerous applications. \nHowever, these models have been shown to memorize and leak pre-training data, raising serious user privacy and information security concerns.\nWhile data leaks should be prevented, it is also crucial to examine the trade-off between the privacy protection and model utility of proposed approaches.\nIn this paper, we introduce PrivQA --- a multimodal benchmark to assess this privacy/utility trade-off when a model is instructed to protect specific categories of personal information in a simulated scenario.\nWe also propose a technique to iteratively self-moderate responses, which significantly improves privacy.\nHowever, through a series of red-teaming experiments, we find that adversaries can also easily circumvent these protections with simple jailbreaking methods through textual and/or image inputs. \nWe believe PrivQA has the potential to support the development of new models with improved privacy protections, as well as the adversarial robustness of these protections. 
We release the entire PrivQA dataset at [URL removed for review].", "keywords": "large language model;privacy;safety;redteaming;natural language processing", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "Yang Chen;Ethan Adrian Mendes;Sauvik Das;Wei Xu;Alan Ritter", "authorids": "~Yang_Chen10;~Ethan_Adrian_Mendes1;~Sauvik_Das1;~Wei_Xu5;~Alan_Ritter1", "gender": ";;Not Specified;F;M", "homepage": "https://edchengg.github.io/;;https://sauvik.me;https://cocoxu.github.io/;http://aritter.github.io/", "dblp": "48/4792-13;;https://dblp.uni-trier.de/pid/83/8570.html;32/1213-4.html;47/3133", "google_scholar": "o-oBMWEAAAAJ;1SJ4uSgAAAAJ;;BfOdG-oAAAAJ;https://scholar.google.com/citations?hl=en", "orcid": ";;;;", "linkedin": ";;;;", "or_profile": "~Yang_Chen10;~Ethan_Adrian_Mendes1;~Sauvik_Das1;~Wei_Xu5;~Alan_Ritter1", "aff": "Georgia Institute of Technology;Georgia Institute of Technology;Carnegie Mellon University;Georgia Institute of Technology;Georgia Institute of Technology", "aff_domain": "gatech.edu;gatech.edu;cmu.edu;gatech.edu;gatech.edu", "position": "PhD student;MS student;Assistant Professor;Associate Professor;Associate Professor", "bibtex": "@misc{\nchen2024can,\ntitle={Can Language Models be Instructed to Protect Personal Information?},\nauthor={Yang Chen and Ethan Adrian Mendes and Sauvik Das and Wei Xu and Alan Ritter},\nyear={2024},\nurl={https://openreview.net/forum?id=1vqHTUTod9}\n}", "github": "", "project": "", "reviewers": "YNv6;VxoZ;unBh;yBLS", "site": "https://openreview.net/forum?id=1vqHTUTod9", "pdf_size": 11363621, "rating": "3;5;6;6", "confidence": "4;4;4;4", "soundness": "2;3;3;3", "contribution": "2;1;3;4", "presentation": "2;3;3;4", "wc_summary": "73;138;148;105", "wc_strengths": "83;49;38;51", "wc_weaknesses": "304;272;47;130", "wc_questions": "2;2;374;95", "wc_review": "462;461;607;381", "wc_reply_reviewers": "0;84;153;55", "wc_reply_authors": "932;983;779;616", "reply_reviewers": "0;1;2;1", "reply_authors": "3;3;2;3", "rating_avg": [ 5.0, 1.224744871391589 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 1.118033988749895 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 116.0, 29.487285395573462 ], "wc_strengths_avg": [ 55.25, 16.768646337734005 ], "wc_weaknesses_avg": [ 188.25, 104.59057079871015 ], "wc_questions_avg": [ 118.25, 152.46044569002152 ], "wc_review_avg": [ 477.75, 81.5394843005522 ], "wc_reply_reviewers_avg": [ 73.0, 55.16792546398677 ], "wc_reply_authors_avg": [ 827.5, 143.33963164456645 ], "reply_reviewers_avg": [ 1.0, 0.7071067811865476 ], "reply_authors_avg": [ 2.75, 0.4330127018922193 ], "replies_avg": [ 22, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 30, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=831180042438977110&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 3, "aff_unique_index": "0;0;1;0;0", "aff_unique_norm": "Georgia Institute of Technology;Carnegie Mellon University", "aff_unique_dep": ";", "aff_unique_url": "https://www.gatech.edu;https://www.cmu.edu", "aff_unique_abbr": "Georgia Tech;CMU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "United States" }, { "title": "MUFFIN: Curating Multi-Faceted Instructions for Improving Instruction Following", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19563", "id": "1vrS1zwekw", 
"author_site": "Renze Lou, Kai Zhang, Jian Xie, Yuxuan Sun, Jihyun Ahn, Hanzi XU, Yu Su, Wenpeng Yin", "tldr": "", "abstract": "In the realm of large language models (LLMs), enhancing instruction-following capability often involves curating expansive training data. This is achieved through two primary schemes: i) Scaling-Inputs: Amplifying (input, output) pairs per task instruction, aiming for better instruction adherence. ii) Scaling Input-Free Tasks: Enlarging tasks, each composed of an (instruction, output) pair (without requiring a separate input anymore). However, LLMs under Scaling-Inputs tend to be overly sensitive to inputs, leading to misinterpretation or non-compliance with instructions. Conversely, Scaling Input-Free Tasks demands a substantial number of tasks but is less effective in instruction following when dealing with instances in Scaling-Inputs. This work introduces MUFFIN, a new scheme of instruction-following dataset curation. Specifically, we automatically Scale Tasks per Input by diversifying these tasks with various input facets. Experimental results across four zero-shot benchmarks, spanning both Scaling-Inputs and Scaling Input-Free Tasks schemes, reveal that LLMs, at various scales, trained on MUFFIN generally demonstrate superior instruction-following capabilities compared to those trained on the two aforementioned schemes.", "keywords": "Instruction Tuning;Large Language Models;Automatic Data Generation", "primary_area": "datasets and benchmarks", "supplementary_material": "", "author": "Renze Lou;Kai Zhang;Jian Xie;Yuxuan Sun;Janice Ahn;Hanzi Xu;Yu Su;Wenpeng Yin", "authorids": "~Renze_Lou1;~Kai_Zhang10;~Jian_Xie3;~Yuxuan_Sun3;~Janice_Ahn1;~Hanzi_Xu1;~Yu_Su2;~Wenpeng_Yin1", "gender": "M;M;M;M;F;F;M;", "homepage": "https://renzelou.github.io/;https://drogozhang.github.io;;;;;http://ysu1989.github.io;http://wenpengyin.org/", "dblp": "296/4744;55/957-33;;;;229/0397;38/1070-1;117/7310-1", "google_scholar": "GVTbSPMAAAAJ;sDnAIsgAAAAJ;;https://scholar.google.com/citations?hl=en;;https://scholar.google.com/citations?hl=en;rIh5OqoAAAAJ;mRg16LkAAAAJ", "orcid": "0000-0002-3273-0097;;0009-0000-2867-4726;;;;;", "linkedin": "renze-lou-b681b51a0/;kai-zhang-43774b196/;;;jihyun-ahn-4b6037225;hanzixu/;;", "or_profile": "~Renze_Lou1;~Kai_Zhang10;~Jian_Xie3;~Yuxuan_Sun3;~Janice_Ahn1;~Hanzi_Xu1;~Yu_Su2;~Wenpeng_Yin1", "aff": "SalesForce.com;Google DeepMind;Fudan University;Zhejiang University;Pennsylvania State University;Temple University;Microsoft;Pennsylvania State University", "aff_domain": "salesforce.com;google.com;fudan.edu.cn;zju.edu.cn;psu.edu;temple.edu;microsoft.com;psu.edu", "position": "Intern;Student Researcher;MS student;PhD student;PhD student;PhD student;Senior Researcher;Assistant Professor", "bibtex": "@inproceedings{\nlou2024muffin,\ntitle={{MUFFIN}: Curating Multi-Faceted Instructions for Improving Instruction Following},\nauthor={Renze Lou and Kai Zhang and Jian Xie and Yuxuan Sun and Janice Ahn and Hanzi Xu and Yu Su and Wenpeng Yin},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=1vrS1zwekw}\n}", "github": "", "project": "", "reviewers": "cEte;od6V;j2qL;BsoU", "pdf_size": 1514572, "rating": "5;6;6;8", "confidence": "4;3;2;4", "soundness": "3;3;3;3", "contribution": "3;2;3;3", "presentation": "3;3;3;2", "wc_summary": "14;140;73;139", "wc_strengths": "28;97;82;56", "wc_weaknesses": "306;171;137;332", "wc_questions": "16;188;43;2", "wc_review": "364;596;335;529", 
"wc_reply_reviewers": "222;34;15;161", "wc_reply_authors": "2189;2071;917;947", "reply_reviewers": "1;1;1;1", "reply_authors": "5;5;3;4", "rating_avg": [ 6.25, 1.0897247358851685 ], "confidence_avg": [ 3.25, 0.82915619758885 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 91.5, 52.33784481615574 ], "wc_strengths_avg": [ 65.75, 26.271419832205492 ], "wc_weaknesses_avg": [ 236.5, 83.87639715676872 ], "wc_questions_avg": [ 62.25, 74.0823022050476 ], "wc_review_avg": [ 456.0, 109.58330164765069 ], "wc_reply_reviewers_avg": [ 108.0, 86.50144507463445 ], "wc_reply_authors_avg": [ 1531.0, 600.5447527037431 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 4.25, 0.82915619758885 ], "replies_avg": [ 27, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": 0.20751433915982243, "gs_citation": 21, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=1415875881970261133&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=1vrS1zwekw", "pdf": "https://openreview.net/pdf?id=1vrS1zwekw", "email": "salesforce.com;google.com;fudan.edu.cn;zju.edu.cn;psu.edu;temple.edu;microsoft.com;psu.edu", "author_num": 8, "aff_unique_index": "0;1;2;3;4;5;6;4", "aff_unique_norm": "Salesforce;Google;Fudan University;Zhejiang University;Pennsylvania State University;Temple University;Microsoft", "aff_unique_dep": ";Google DeepMind;;;;;Microsoft Corporation", "aff_unique_url": "https://www.salesforce.com;https://deepmind.com;https://www.fudan.edu.cn;https://www.zju.edu.cn;https://www.psu.edu;https://www.temple.edu;https://www.microsoft.com", "aff_unique_abbr": "Salesforce;DeepMind;Fudan;ZJU;PSU;Temple;Microsoft", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;2;2;0;0;0;0", "aff_country_unique": "United States;United Kingdom;China" }, { "id": "1xVDGGr6t6", "title": "Online Continual Learning via Pursuing Class-conditional Funtion", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Online continual learning is a challenging problem where models must learn from a non-stationary data stream while avoiding catastrophic forgetting. Inter-class imbalance during training has been identified as a major cause of forgetting, leading to model prediction bias towards recently learned classes. In this paper, we theoretically analyze that inter-class imbalance is entirely attributed to imbalanced class-priors, and the class-conditional function learned from intra-class distributions is the Bayes-optimal classifier. Accordingly, we present that a simple adjustment of model logits during training can effectively resist prior class bias and grasp the corresponding Bayes-optimum. Our method mitigates the impact of inter-class imbalance not only in class-incremental but also in realistic general setups by eliminating class-priors and pursuing class-conditionals, with minimal additional computational cost. We thoroughly evaluate our approach on various benchmarks and demonstrate significant performance improvements compared to prior arts. 
For example, our approach improves the best baseline by 4.6\\% on CIFAR10.", "keywords": "Online Continual Learning;Class-incremental Learning;Inter-class Imbalance", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "/attachment/62971f4229ab1e92724f38db5b1044f1a3397b71.zip", "author": "Zhehao Huang;Tao Li;Chenhe Yuan;Yingwen Wu;Xiaolin Huang", "authorids": "~Zhehao_Huang1;~Tao_Li12;~Chenhe_Yuan1;~Yingwen_Wu1;~Xiaolin_Huang1", "gender": "M;M;M;F;M", "homepage": "https://github.com/K1nght;https://nblt.github.io/;https://github.com/vernunft2;https://github.com/snowien;http://www.pami.sjtu.edu.cn/en/xiaolin", "dblp": "258/1555;;;236/4329;61/2227", "google_scholar": ";https://scholar.google.com/citations?hl=zh-CN;;https://scholar.google.com.hk/citations?user=PcJzfBEAAAAJ;DR-gBcEAAAAJ", "orcid": ";;;;", "linkedin": ";;;;", "or_profile": "~Zhehao_Huang1;~Tao_Li12;~Chenhe_Yuan1;~Yingwen_Wu1;~Xiaolin_Huang1", "aff": "Shanghai Jiaotong University;Shanghai Jiaotong University;Shanghai Jiaotong University;Shanghai Jiaotong University;Shanghai Jiaotong University", "aff_domain": "sjtu.edu.cn;sjtu.edu;sjtu.edu.cn;sjtu.edu;sjtu.edu.cn", "position": "PhD student;PhD student;Undergrad student;PhD student;Full Professor", "bibtex": "@misc{\nhuang2024online,\ntitle={Online Continual Learning via Pursuing Class-conditional Funtion},\nauthor={Zhehao Huang and Tao Li and Chenhe Yuan and Yingwen Wu and Xiaolin Huang},\nyear={2024},\nurl={https://openreview.net/forum?id=1xVDGGr6t6}\n}", "github": "", "project": "", "reviewers": "Y84H;6ngC;MqmM;3g12", "site": "https://openreview.net/forum?id=1xVDGGr6t6", "pdf_size": 2274700, "rating": "3;3;5;5", "confidence": "4;4;4;4", "soundness": "2;2;3;3", "contribution": "2;2;3;2", "presentation": "3;2;2;3", "wc_summary": "50;75;80;54", "wc_strengths": "48;29;50;25", "wc_weaknesses": "169;137;131;54", "wc_questions": "2;46;54;4", "wc_review": "269;287;315;137", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 64.75, 12.94942083646987 ], "wc_strengths_avg": [ 38.0, 11.113055385446435 ], "wc_weaknesses_avg": [ 122.75, 42.23964370114881 ], "wc_questions_avg": [ 26.5, 23.680160472429236 ], "wc_review_avg": [ 252.0, 68.38859554048467 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:7YiFW-lNX-AJ:scholar.google.com/&scioq=Online+Continual+Learning+via+Pursuing+Class-conditional+Funtion&hl=en&as_sdt=0,10", "gs_version_total": 0, "aff_unique_index": "0;0;0;0;0", "aff_unique_norm": "Shanghai Jiao Tong University", "aff_unique_dep": "", "aff_unique_url": "https://www.sjtu.edu.cn", "aff_unique_abbr": "SJTU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "China" }, { "id": "1xyar0Ko3E", "title": "Efficient Quantization-aware Training with Adaptive Coreset Selection", "track": "main", "status": "Reject", "tldr": "", "abstract": "The expanding model size and computation of deep neural networks (DNNs) have increased the demand for efficient model deployment 
methods. Quantization-aware training (QAT) is a representative model compression method to leverage redundancy in weights and activations. However, most existing QAT methods require end-to-end training on the entire dataset, which suffers from long training time and high energy costs. Coreset selection, aiming to improve data efficiency utilizing the redundancy of training data, has also been widely used for efficient training. In this work, we propose a new angle through the coreset selection to improve the training efficiency of quantization-aware training. Based on the characteristics of QAT, we propose two metrics: error vector score and disagreement score, to quantify the importance of each sample during training. Guided by these two metrics of importance, we proposed a quantization-aware adaptive coreset selection (ACS) method to select the data for the current training epoch. We evaluate our method on various networks (ResNet-18, MobileNetV2), datasets(CIFAR-100, ImageNet-1K), and under different quantization settings. Compared with previous coreset selection methods, our method significantly improves QAT performance with different dataset fractions. Our method can achieve an accuracy of 68.39\\% of 4-bit quantized ResNet-18 on the ImageNet-1K dataset with only a 10\\% subset, which has an absolute gain of 4.24\\% compared to the random baseline.", "keywords": "Model Compression;Quantization;Coreset Selection", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/cabb13438324c31be45bd5f73ba8d287223cedc8.zip", "author": "Xijie Huang;Zechun Liu;Shih-yang Liu;Kwang-Ting Cheng", "authorids": "~Xijie_Huang1;~Zechun_Liu1;~Shih-yang_Liu1;~Kwang-Ting_Cheng1", "gender": "M;;M;", "homepage": "https://huangowen.github.io/;;https://vsdl.hkust.edu.hk/people.html;", "dblp": "230/4412;;;", "google_scholar": "nFW2mqwAAAAJ;;eBXRoDgAAAAJ;", "orcid": ";;0000-0003-1997-0843;", "linkedin": "huang-xijie-4224371b8/;;;", "or_profile": "~Xijie_Huang1;~Zechun_Liu1;~Shih-yang_Liu1;~Kwang-Ting_Cheng1", "aff": "Microsoft Research;;NVIDIA;", "aff_domain": "microsoft.com;;nvidia.com;", "position": "Intern;;Intern;", "bibtex": "@misc{\nhuang2024efficient,\ntitle={Efficient Quantization-aware Training with Adaptive Coreset Selection},\nauthor={Xijie Huang and Zechun Liu and Shih-yang Liu and Kwang-Ting Cheng},\nyear={2024},\nurl={https://openreview.net/forum?id=1xyar0Ko3E}\n}", "github": "", "project": "", "reviewers": "ALc7;iCtg;NUL5", "site": "https://openreview.net/forum?id=1xyar0Ko3E", "pdf_size": 1010324, "rating": "3;3;6", "confidence": "3;5;4", "soundness": "2;2;3", "contribution": "2;1;3", "presentation": "2;3;3", "wc_summary": "50;133;64", "wc_strengths": "11;80;77", "wc_weaknesses": "38;59;176", "wc_questions": "15;37;2", "wc_review": "114;309;319", "wc_reply_reviewers": "624;0;0", "wc_reply_authors": "1693;1655;909", "reply_reviewers": "2;0;0", "reply_authors": "3;3;2", "rating_avg": [ 4.0, 1.4142135623730951 ], "confidence_avg": [ 4.0, 0.816496580927726 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.816496580927726 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 82.33333333333333, 36.279777042068794 ], "wc_strengths_avg": [ 56.0, 31.843366656181317 ], "wc_weaknesses_avg": [ 91.0, 60.71243694664216 ], "wc_questions_avg": [ 18.0, 14.445299120013633 ], "wc_review_avg": [ 247.33333333333334, 94.36925111261378 ], "wc_reply_reviewers_avg": [ 208.0, 294.15642097360376 ], 
"wc_reply_authors_avg": [ 1419.0, 360.95798462794346 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.9428090415820634 ], "reply_authors_avg": [ 2.6666666666666665, 0.4714045207910317 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 14, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14481123808402065885&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 2, "aff_unique_index": "0;1", "aff_unique_norm": "Microsoft;NVIDIA", "aff_unique_dep": "Microsoft Research;NVIDIA Corporation", "aff_unique_url": "https://www.microsoft.com/en-us/research;https://www.nvidia.com", "aff_unique_abbr": "MSR;NVIDIA", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "id": "1yll8U12GT", "title": "Enhancing Decision Tree Learning with Deep Networks", "track": "main", "status": "Reject", "tldr": "", "abstract": "Conventional approaches to (oblique) decision tree construction for classification are greedy in nature. They can fail spectacularly when the true labeling function corresponds to a decision tree whose root node is uncorrelated with the labels (e.g. if the label function is the product of the sign of a collection of linear functions of the input). We define a new figure of merit to capture the usefulness of a linear function/hyperplane in a decision tree that is applicable even in scenarios where greedy procedures fail. We devise a novel deep neural network architecture that is very effective at seeking out hyperplanes/half-spaces/features that score highly on this metric. We exploit this property in a subroutine for a new decision tree construction algorithm. The proposed algorithm outperforms all other decision tree construction procedures, especially in situations where the hyper-planes corresponding to the top levels of the true decision tree are not useful features by themselves for classification but are essential for getting to full accuracy. 
The properties of the deep architecture that we exploit to construct the decision tree are also of independent interest, as they reveal the inner workings of the feature learning mechanism at play in deep neural networks.", "keywords": "Deep Learning;feature learning;oblique decision trees", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/8c414d4e8eac00ddcfde2624a8649dd8f50c7184.pdf", "author": "Prithaj Banerjee;Mahesh Lorik Yadav;Harish Guruprasad Ramaswamy;Chandra Shekar Lakshminarayanan", "authorids": "~Prithaj_Banerjee1;~Mahesh_Lorik_Yadav1;~Harish_Guruprasad_Ramaswamy1;~Chandra_Shekar_Lakshminarayanan2", "gender": "M;M;M;M", "homepage": "https://www.cse.iitm.ac.in/profile.php?arg=Mjc4Mg==;;;https://iitpkd.ac.in/people/cnarayanan", "dblp": "206/7099.html;;126/1729;143/7535", "google_scholar": "rlr99eAAAAAJ;;;", "orcid": ";;;", "linkedin": "prithaj-banerjee-946a3a104/;mahesh-yadav-25779716a/;;", "or_profile": "~Prithaj_Banerjee1;~Mahesh_Lorik_Yadav1;~Harish_Guruprasad_Ramaswamy1;~Chandra_Shekar_Lakshminarayanan2", "aff": "Indian Institute of Technology, Madras;;Indian Institute of Technology Madras,;Indian Institute of Technology, Madras", "aff_domain": "iitm.ac.in;;iitm.ac.in;iitm.ac.in", "position": "MS student;;Assistant Professor;Assistant Professor", "bibtex": "@misc{\nbanerjee2024enhancing,\ntitle={Enhancing Decision Tree Learning with Deep Networks},\nauthor={Prithaj Banerjee and Mahesh Lorik Yadav and Harish Guruprasad Ramaswamy and Chandra Shekar Lakshminarayanan},\nyear={2024},\nurl={https://openreview.net/forum?id=1yll8U12GT}\n}", "github": "", "project": "", "reviewers": "ugFu;cuTu;67Vr", "site": "https://openreview.net/forum?id=1yll8U12GT", "pdf_size": 407376, "rating": "3;3;5", "confidence": "4;5;4", "soundness": "2;2;2", "contribution": "2;1;2", "presentation": "2;2;3", "wc_summary": "34;104;68", "wc_strengths": "34;18;33", "wc_weaknesses": "187;385;221", "wc_questions": "131;13;12", "wc_review": "386;520;334", "wc_reply_reviewers": "0;116;31", "wc_reply_authors": "382;176;209", "reply_reviewers": "0;1;1", "reply_authors": "1;1;1", "rating_avg": [ 3.6666666666666665, 0.9428090415820634 ], "confidence_avg": [ 4.333333333333333, 0.4714045207910317 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 1.6666666666666667, 0.4714045207910317 ], "presentation_avg": [ 2.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 68.66666666666667, 28.58126814696802 ], "wc_strengths_avg": [ 28.333333333333332, 7.3181661333667165 ], "wc_weaknesses_avg": [ 264.3333333333333, 86.44587259602906 ], "wc_questions_avg": [ 52.0, 55.86292748027682 ], "wc_review_avg": [ 413.3333333333333, 78.35531606442255 ], "wc_reply_reviewers_avg": [ 49.0, 49.03740069239668 ], "wc_reply_authors_avg": [ 255.66666666666666, 90.34132805950749 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.4999999999999999, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:cgGzNsKDZmMJ:scholar.google.com/&scioq=Enhancing+Decision+Tree+Learning+with+Deep+Networks&hl=en&as_sdt=0,23", "gs_version_total": 0, "aff_unique_index": "0;0;0", "aff_unique_norm": "Indian Institute of Technology Madras", "aff_unique_dep": "", "aff_unique_url": "https://www.iitm.ac.in", "aff_unique_abbr": "IIT Madras", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Madras", 
"aff_country_unique_index": "0;0;0", "aff_country_unique": "India" }, { "id": "1zhM0XkQh0", "title": "ProFeAT: Projected Feature Adversarial Training for Self-Supervised Learning of Robust Representations", "track": "main", "status": "Reject", "tldr": "", "abstract": "Supervised adversarial training has been the most successful approach for improving the robustness of Deep Neural Networks against adversarial attacks. While several recent works have attempted to overcome the need for supervision or labeled training data by integrating adversarial training with contrastive Self-Supervised Learning (SSL) approaches such as SimCLR, their performance has been sub-optimal due to the increased training complexity. A recent approach mitigates this by utilizing supervision from a standard self-supervised trained model in a teacher-student setting that mimics supervised adversarial training. However, we find that there is still a large gap in performance when compared to supervised training, specifically on larger capacity models. We show that this is a result of mismatch in training objectives of the teacher and student, and propose Projected Feature Adversarial Training (ProFeAT) to bridge this gap by using a projection head in the adversarial training step. We further propose appropriate attack and defense losses at the feature and projector spaces, coupled with a combination of weak and strong augmentations for the teacher and student respectively, to improve generalization without increasing the training complexity. We demonstrate significant improvements in performance when compared to existing SSL methods, and performance on par with TRADES, a popular supervised adversarial training method, on several benchmark datasets and models.", "keywords": "Self-supervised Adversarial Training;Adversarial Training;Adversarial Robustness;Contrastive Learning", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/62d78703af11ce5771c088defe34b375d99b2eb0.zip", "author": "Sravanti Addepalli;Priyam Dey;Venkatesh Babu Radhakrishnan", "authorids": "~Sravanti_Addepalli1;~Priyam_Dey1;~Venkatesh_Babu_Radhakrishnan2", "gender": "F;M;M", "homepage": ";;http://cds.iisc.ac.in/faculty/venky", "dblp": "127/7715;;20/6289", "google_scholar": "MOO12i0AAAAJ;YMu3SJ8AAAAJ;cVg7HrEAAAAJ", "orcid": ";0000-0001-5807-1379;0000-0002-1926-1804", "linkedin": "sravanti-addepalli/;priyam-dey33;venkatesh-babu-radhakrishnan-16568939", "or_profile": "~Sravanti_Addepalli1;~Priyam_Dey1;~Venkatesh_Babu_Radhakrishnan2", "aff": "Indian Institute of Science;Indian Institute of Science, Indian institute of science, Bangalore;Indian Institute of Science", "aff_domain": "iisc.ac.in;iisc.ac.in;iisc.ac.in", "position": "PhD student;PhD student;Full Professor", "bibtex": "@misc{\naddepalli2024profeat,\ntitle={ProFe{AT}: Projected Feature Adversarial Training for Self-Supervised Learning of Robust Representations},\nauthor={Sravanti Addepalli and Priyam Dey and Venkatesh Babu Radhakrishnan},\nyear={2024},\nurl={https://openreview.net/forum?id=1zhM0XkQh0}\n}", "github": "", "project": "", "reviewers": "e5nc;eRyw;s59e;q8j3", "site": "https://openreview.net/forum?id=1zhM0XkQh0", "pdf_size": 750361, "rating": "5;6;6;6", "confidence": "4;5;5;4", "soundness": "2;3;3;3", "contribution": "2;3;3;2", "presentation": "2;4;3;3", "wc_summary": "118;29;70;79", "wc_strengths": "42;64;28;31", "wc_weaknesses": "186;143;185;260", "wc_questions": "79;49;48;2", "wc_review": 
"425;285;331;372", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "2011;732;1355;1088", "reply_reviewers": "0;0;0;0", "reply_authors": "3;1;2;3", "rating_avg": [ 5.75, 0.4330127018922193 ], "confidence_avg": [ 4.5, 0.5 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 74.0, 31.63068130786942 ], "wc_strengths_avg": [ 41.25, 14.13108276106258 ], "wc_weaknesses_avg": [ 193.5, 42.13371571556442 ], "wc_questions_avg": [ 44.5, 27.518175811634027 ], "wc_review_avg": [ 353.25, 51.60608006814701 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 1296.5, 467.99172001222416 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 2.25, 0.82915619758885 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.5773502691896257, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:h4K-al4-3v0J:scholar.google.com/&scioq=ProFeAT:+Projected+Feature+Adversarial+Training+for+Self-Supervised+Learning+of+Robust+Representations&hl=en&as_sdt=0,33", "gs_version_total": 4, "aff_unique_index": "0;0;0", "aff_unique_norm": "Indian Institute of Science", "aff_unique_dep": "", "aff_unique_url": "https://www.iisc.ac.in", "aff_unique_abbr": "IISc", "aff_campus_unique_index": "1", "aff_campus_unique": ";Bangalore", "aff_country_unique_index": "0;0;0", "aff_country_unique": "India" }, { "id": "1zt8GWZ9sc", "title": "Quack: Automatic Jailbreaking Large Language Models via Role-playing", "track": "main", "status": "Reject", "tldr": "", "abstract": "Large Language Models (LLMs) excel in Natural Language Processing (NLP) with human-like text generation, but the misuse of them has raised public concern and prompted the need for safety measures. Proactive testing with jailbreaks, meticulously crafted prompts that bypass model constraints and policies, has become mainstream to ensure security and reliability upon model release. While researchers have made substantial efforts to explore jailbreaks against LLMs, existing methods still face the following disadvantages: (1) require human labor and expertise to design question prompts; (2) non-determination regarding reproducing jailbreak; (3) exhibit limited effectiveness on updated model versions and lack the ability for iterative reuse when invalid.\nTo address these challenges, we introduce Quack, an automated testing framework based on role-playing of LLMs. Quack translates testing guidelines into question prompts, instead of human expertise and labor. It systematically analyzes and consolidates successful jailbreaks into a paradigm featuring eight distinct characteristics. Based on it, we reconstruct and maintain existing jailbreaks through knowledge graphs, which serve as Quack's repository of playing scenarios. It assigns four distinct roles to LLMs, for automatically organizing, evaluating, and further updating jailbreaks. We empirically demonstrate the effectiveness of our method on three state-of-the-art open-sourced LLMs (Vicuna-13B, LongChat-7B, and LLaMa-7B), as well as one widely-used commercial LLM (ChatGPT). 
Our work addresses the pressing need for LLM security and contributes valuable insights for creating safer LLM-empowered applications.", "keywords": "Large Language Models;Jailbreak;Testing", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/d424cb020078cca423b6b77165b89290d0da9e65.pdf", "author": "Haibo Jin;Ruoxi Chen;Jinyin Chen;Haohan Wang", "authorids": "~Haibo_Jin2;~Ruoxi_Chen1;~Jinyin_Chen1;~Haohan_Wang1", "gender": "M;;F;M", "homepage": ";;;http://cs.cmu.edu/~haohanw", "dblp": ";;50/415.html;132/4066", "google_scholar": "https://scholar.google.com.hk/citations?user=tj0eV-sAAAAJ;;;nZxJGeUAAAAJ", "orcid": ";;0000-0002-7153-2755;", "linkedin": ";;;haohanwang/", "or_profile": "~Haibo_Jin2;~Ruoxi_Chen1;~Jinyin_Chen1;~Haohan_Wang1", "aff": "Zhejiang University of Technology;;Zhejiang University of Technology;University of Illinois, Urbana Champaign", "aff_domain": "zjut.edu.cn;;zjut.edu.cn;illinois.edu", "position": "PhD student;;Full Professor;Assistant Professor", "bibtex": "@misc{\njin2024quack,\ntitle={Quack: Automatic Jailbreaking Large Language Models via Role-playing},\nauthor={Haibo Jin and Ruoxi Chen and Jinyin Chen and Haohan Wang},\nyear={2024},\nurl={https://openreview.net/forum?id=1zt8GWZ9sc}\n}", "github": "", "project": "", "reviewers": "REtv;TsFJ;aN17", "site": "https://openreview.net/forum?id=1zt8GWZ9sc", "pdf_size": 1099076, "rating": "3;3;5", "confidence": "4;4;3", "soundness": "2;1;2", "contribution": "3;2;3", "presentation": "3;1;3", "wc_summary": "100;132;136", "wc_strengths": "57;88;57", "wc_weaknesses": "180;1140;368", "wc_questions": "215;25;164", "wc_review": "552;1385;725", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 3.6666666666666665, 0.9428090415820634 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 1.6666666666666667, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.3333333333333335, 0.9428090415820634 ], "wc_summary_avg": [ 122.66666666666667, 16.110727964792762 ], "wc_strengths_avg": [ 67.33333333333333, 14.613540144521982 ], "wc_weaknesses_avg": [ 562.6666666666666, 415.38843936194894 ], "wc_questions_avg": [ 134.66666666666666, 80.2925207531118 ], "wc_review_avg": [ 887.3333333333334, 358.9209136038498 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -1.0, "gs_citation": 4, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6587544533084629160&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 0, "aff_unique_index": "0;0;1", "aff_unique_norm": "Zhejiang University of Technology;University of Illinois Urbana-Champaign", "aff_unique_dep": ";", "aff_unique_url": "https://www.zjut.edu.cn;https://illinois.edu", "aff_unique_abbr": "ZJUT;UIUC", "aff_campus_unique_index": "1", "aff_campus_unique": ";Urbana-Champaign", "aff_country_unique_index": "0;0;1", "aff_country_unique": "China;United States" }, { "id": "20KYsQ8Q4Z", "title": "High-dimensional Bayesian Optimization with Group Testing", "track": "main", "status": "Reject", "tldr": "", "abstract": "Bayesian optimization is an effective method for optimizing expensive-to-evaluate black-box functions. 
\nHigh-dimensional problems are particularly challenging as the surrogate model of the objective suffers from the curse of dimensionality, which makes accurate modeling difficult. \nWe propose a group testing approach to identify active variables to facilitate efficient optimization in these domains. \nThe proposed algorithm, Group Testing Bayesian Optimization (GTBO), first runs a testing phase where groups of variables are systematically selected and tested on whether they influence the objective. \nTo that end, we extend the well-established theory of group testing to functions of continuous ranges.\nIn the second phase, GTBO guides optimization by placing more importance on the active dimensions.\nBy exploiting the axis-aligned subspace assumption, GTBO is competitive against state-of-the-art methods on several synthetic and real-world high-dimensional optimization tasks. \nFurthermore, GTBO aids in the discovery of active parameters in applications, thereby enhancing practitioners' understanding of the problem at hand.", "keywords": "Bayesian optimization;Gaussian process;group testing;high-dimensional", "primary_area": "probabilistic methods (Bayesian methods, variational inference, sampling, UQ, etc.)", "supplementary_material": "", "author": "Erik Orm Hellsten;Carl Hvarfner;Leonard Papenmeier;Luigi Nardi", "authorids": "~Erik_Orm_Hellsten1;~Carl_Hvarfner1;~Leonard_Papenmeier1;~Luigi_Nardi1", "gender": "M;M;M;M", "homepage": ";https://portal.research.lu.se/portal/sv/persons/carl-hvarfner(cd140b82-9fed-4e88-868e-1cf569dcbeb7).html;https://portal.research.lu.se/en/persons/leonard-papenmeier;", "dblp": ";319/3033;;60/7206", "google_scholar": "https://scholar.google.se/citations?user=mK5N-xQAAAAJ;https://scholar.google.se/citations?hl=en;85BUIRcAAAAJ;https://scholar.google.it/citations?user=Kgs3zQoAAAAJ", "orcid": ";;0000-0001-9338-1567;0000-0002-4601-2264", "linkedin": ";carl-hvarfner-a97421153/;leonard-papenmeier-a90a60135;nardiluigi/", "or_profile": "~Erik_Orm_Hellsten1;~Carl_Hvarfner1;~Leonard_Papenmeier1;~Luigi_Nardi1", "aff": "Lund University;Lund University;Lund University;Stanford University", "aff_domain": "lu.se;lu.se;lu.se;stanford.edu", "position": "Postdoc;PhD student;PhD student;Researcher", "bibtex": "@misc{\nhellsten2024highdimensional,\ntitle={High-dimensional Bayesian Optimization with Group Testing},\nauthor={Erik Orm Hellsten and Carl Hvarfner and Leonard Papenmeier and Luigi Nardi},\nyear={2024},\nurl={https://openreview.net/forum?id=20KYsQ8Q4Z}\n}", "github": "", "project": "", "reviewers": "fy4F;yfZG;JQFf;9ChC", "site": "https://openreview.net/forum?id=20KYsQ8Q4Z", "pdf_size": 2957796, "rating": "5;5;6;6", "confidence": "3;3;3;3", "soundness": "2;3;3;3", "contribution": "2;3;2;3", "presentation": "3;3;3;2", "wc_summary": "59;196;151;150", "wc_strengths": "25;35;59;115", "wc_weaknesses": "82;142;56;174", "wc_questions": "118;52;210;32", "wc_review": "284;425;476;471", "wc_reply_reviewers": "284;0;0;0", "wc_reply_authors": "955;651;394;756", "reply_reviewers": "2;0;0;0", "reply_authors": "2;1;1;1", "rating_avg": [ 5.5, 0.5 ], "confidence_avg": [ 3.0, 0.0 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 139.0, 49.78453575157651 ], "wc_strengths_avg": [ 58.5, 34.88194375317981 ], "wc_weaknesses_avg": [ 113.5, 46.82680856090878 ], "wc_questions_avg": [ 103.0, 69.49100661236676 ], "wc_review_avg": [ 414.0, 77.64341568993471 ], "wc_reply_reviewers_avg": [ 71.0, 
122.97560733739029 ], "wc_reply_authors_avg": [ 689.0, 202.30793360617375 ], "reply_reviewers_avg": [ 0.5, 0.8660254037844386 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 5, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10031675274478304412&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 2, "aff_unique_index": "0;0;0;1", "aff_unique_norm": "Lund University;Stanford University", "aff_unique_dep": ";", "aff_unique_url": "https://www.lunduniversity.lu.se;https://www.stanford.edu", "aff_unique_abbr": "LU;Stanford", "aff_campus_unique_index": "1", "aff_campus_unique": ";Stanford", "aff_country_unique_index": "0;0;0;1", "aff_country_unique": "Sweden;United States" }, { "id": "20L7txbIa8", "title": "UniPredict: Large Language Models are Universal Tabular Predictors", "track": "main", "status": "Reject", "tldr": "", "abstract": "Tabular data prediction is a fundamental machine learning task for many applications. Existing methods predominantly employ discriminative modeling and operate under the assumption of a fixed target column, necessitating re-training for every new predictive task. Inspired by the generative power of large language models (LLMs), this paper exploits the idea of building universal tabular data predictors based on generative modeling, namely UniPredict. Here, we show that scaling up an LLM to extensive tabular datasets with the capability of comprehending diverse tabular inputs and predicting for target variables following the input instructions. Specifically, we train a single LLM on an aggregation of 169 tabular datasets with diverse targets and compare its performance against baselines that are trained on each dataset separately. We observe this versatile UniPredict model demonstrates an advantage over other models, ranging from 5.4% to 13.4%, when compared with the best tree-boosting baseline and the best neural network baseline, respectively. We further test UniPredict in few-shot learning settings on another 62 tabular datasets. Our method achieves strong performance in quickly adapting to new tasks, where our method outperforms XGBoost over 100\\% on the low-resource setup and shows a significant margin over all baselines. 
We envision that UniPredict sheds light on developing a universal tabular data prediction system that learns from data at scale and serves a wide range of prediction tasks.", "keywords": "tabular prediction;large language model;AI for healthcare", "primary_area": "generative models", "supplementary_material": "/attachment/19ca4f07dc73c9fd88c32e596081afe059ceb7b4.zip", "author": "Ruiyu Wang;Zifeng Wang;Jimeng Sun", "authorids": "~Ruiyu_Wang2;~Zifeng_Wang3;~Jimeng_Sun3", "gender": "M;M;", "homepage": "https://www.cs.toronto.edu/~rwang;https://zifengwang.xyz;http://sunlab.org", "dblp": ";;", "google_scholar": "9ucHLzcAAAAJ;kMlWwTAAAAAJ;9jmmp5sAAAAJ", "orcid": "0009-0003-3541-238X;;0000-0003-1512-6426", "linkedin": "rui-yu-wang/;;jimengsun/", "or_profile": "~Ruiyu_Wang2;~Zifeng_Wang3;~Jimeng_Sun3", "aff": "University of Toronto;University of Illinois, Urbana Champaign;Georgia Institute of Technology", "aff_domain": "cs.toronto.edu;illinois.edu;gatech.edu", "position": "Undergrad student;PhD student;Associate Professor", "bibtex": "@misc{\nwang2024unipredict,\ntitle={UniPredict: Large Language Models are Universal Tabular Predictors},\nauthor={Ruiyu Wang and Zifeng Wang and Jimeng Sun},\nyear={2024},\nurl={https://openreview.net/forum?id=20L7txbIa8}\n}", "github": "", "project": "", "reviewers": "HUKy;Mbbo;qPUm;brjf;p7B3", "site": "https://openreview.net/forum?id=20L7txbIa8", "pdf_size": 1527791, "rating": "3;5;5;5;8", "confidence": "3;3;5;5;3", "soundness": "2;2;2;3;4", "contribution": "2;2;2;2;3", "presentation": "2;3;3;2;3", "wc_summary": "217;92;229;60;53", "wc_strengths": "97;92;139;87;31", "wc_weaknesses": "286;135;316;193;87", "wc_questions": "381;4;6;91;102", "wc_review": "981;323;690;431;273", "wc_reply_reviewers": "0;0;284;0;0", "wc_reply_authors": "686;511;731;369;329", "reply_reviewers": "0;0;1;0;0", "reply_authors": "1;1;2;1;1", "rating_avg": [ 5.2, 1.6 ], "confidence_avg": [ 3.8, 0.9797958971132712 ], "soundness_avg": [ 2.6, 0.8 ], "contribution_avg": [ 2.2, 0.39999999999999997 ], "presentation_avg": [ 2.6, 0.4898979485566356 ], "wc_summary_avg": [ 130.2, 76.99714280413268 ], "wc_strengths_avg": [ 89.2, 34.46969683649684 ], "wc_weaknesses_avg": [ 203.4, 86.99103402075411 ], "wc_questions_avg": [ 116.8, 138.3378473159099 ], "wc_review_avg": [ 539.6, 263.52958088229866 ], "wc_reply_reviewers_avg": [ 56.8, 113.6 ], "wc_reply_authors_avg": [ 525.2, 162.05233722473736 ], "reply_reviewers_avg": [ 0.2, 0.4000000000000001 ], "reply_authors_avg": [ 1.2, 0.4 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.10206207261596574, "gs_citation": -1, "gs_cited_by_link": "", "gs_version_total": -1, "aff_unique_index": "0;1;2", "aff_unique_norm": "University of Toronto;University of Illinois Urbana-Champaign;Georgia Institute of Technology", "aff_unique_dep": ";;", "aff_unique_url": "https://www.utoronto.ca;https://illinois.edu;https://www.gatech.edu", "aff_unique_abbr": "U of T;UIUC;Georgia Tech", "aff_campus_unique_index": "1", "aff_campus_unique": ";Urbana-Champaign", "aff_country_unique_index": "0;1;1", "aff_country_unique": "Canada;United States" }, { "id": "20oxNYWQl9", "title": "Sensitivity Sampling for Coreset-Based Data Selection", "track": "main", "status": "Reject", "tldr": "", "abstract": "Given the sustained growth in both training data and model \nparameters, the problem of finding the most useful training data \nhas become of primary importance for training state-of-the-art and\nnext generation models. 
\n\nWe work in the context of active learning and consider the problem \nof finding the best representative subset of a dataset to \ntrain a machine learning model. Assuming embedding representation of\nthe data (coming for example from either a pre-trained model or a \ngeneric all-purpose embedding) and that the model loss is Lipshitz\nwith respect to these embedding, we provide a new active learning\napproach based on k-means clustering and sensitivity sampling.\n\nWe prove that our new approach allows to select a set of ``typical'' \n$k$ \nelements whose average loss corresponds to the average loss of the \nwhole dataset, up to a multiplicative $(1\\pm\\epsilon)$ factor and an additive $\\epsilon \\lambda \\Phi_k$, where $\\Phi_k$ represents the $k$-means cost for the input data and $\\lambda$ is the Lipshitz constant. \nOur approach is particularly efficient since it only\nrequires very few inferences from the model ($O(k + 1/\\epsilon^2)$).\nWe furthermore demonstrate the performance of our approach on classic\ndatasets and show that it outperforms state-of-the-art methods.", "keywords": "clustering;data selection;coreset", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Kyriakos Axiotis;Vincent Cohen-Addad;Monika Henzinger;Vahab Mirrokni;David Saulpic;David Woodruff", "authorids": "~Kyriakos_Axiotis1;~Vincent_Cohen-Addad1;~Monika_Henzinger1;~Vahab_Mirrokni2;~David_Saulpic1;~David_Woodruff1", "gender": ";;;M;;M", "homepage": ";;;https://people.csail.mit.edu/mirrokni/Welcome.html;http://www.normalesup.org/~saulpic/;http://www.cs.cmu.edu/~dwoodruf/", "dblp": "176/5139;136/5814;;m/VahabSMirrokni;https://dblp.uni-trier.de/pers/hd/s/Saulpic:David;w/DPWoodruff", "google_scholar": "Xhv2tkcAAAAJ;;NXbggxYAAAAJ;opbZfw0AAAAJ;;https://scholar.google.com.tw/citations?user=0G2t-6sAAAAJ", "orcid": ";;;;0000-0003-4208-8541;", "linkedin": ";;;;;", "or_profile": "~Kyriakos_Axiotis1;~Vincent_Cohen-Addad1;~Monika_Henzinger1;~Vahab_Mirrokni2;~David_Saulpic1;~David_Woodruff1", "aff": "Google;Google;Institute of Science and Technology;Google Research;Institute of Science and Technology;Carnegie Mellon University", "aff_domain": "google.com;google.com;ist.ac.at;google.com;ist.ac.at;cmu.edu", "position": "Researcher;Researcher;Full Professor;VP, Google Fellow;Postdoc;Full Professor", "bibtex": "@misc{\naxiotis2024sensitivity,\ntitle={Sensitivity Sampling for Coreset-Based Data Selection},\nauthor={Kyriakos Axiotis and Vincent Cohen-Addad and Monika Henzinger and Vahab Mirrokni and David Saulpic and David Woodruff},\nyear={2024},\nurl={https://openreview.net/forum?id=20oxNYWQl9}\n}", "github": "", "project": "", "reviewers": "nKWs;eXnh;mfTM;MWNf", "site": "https://openreview.net/forum?id=20oxNYWQl9", "pdf_size": 453594, "rating": "5;6;6;6", "confidence": "4;2;3;3", "soundness": "3;3;3;2", "contribution": "2;2;3;2", "presentation": "2;2;2;1", "wc_summary": "117;64;15;159", "wc_strengths": "42;30;109;61", "wc_weaknesses": "250;305;65;5", "wc_questions": "9;69;294;264", "wc_review": "418;468;483;489", "wc_reply_reviewers": "30;23;0;38", "wc_reply_authors": "501;466;430;395", "reply_reviewers": "1;1;0;1", "reply_authors": "7;7;8;5", "rating_avg": [ 5.75, 0.4330127018922193 ], "confidence_avg": [ 3.0, 0.7071067811865476 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 1.75, 0.4330127018922193 ], "wc_summary_avg": [ 88.75, 54.2787942017875 ], 
"wc_strengths_avg": [ 60.5, 30.103986446980738 ], "wc_weaknesses_avg": [ 156.25, 124.61816681367127 ], "wc_questions_avg": [ 159.0, 122.32129822725068 ], "wc_review_avg": [ 464.5, 27.91504970441572 ], "wc_reply_reviewers_avg": [ 22.75, 14.16642156650719 ], "wc_reply_authors_avg": [ 448.0, 39.5790348543266 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 6.75, 1.0897247358851685 ], "replies_avg": [ 36, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.816496580927726, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:wD4GdDwwQpMJ:scholar.google.com/&scioq=Sensitivity+Sampling+for+Coreset-Based+Data+Selection&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;1;0;1;2", "aff_unique_norm": "Google;Institute of Science and Technology;Carnegie Mellon University", "aff_unique_dep": "Google;;", "aff_unique_url": "https://www.google.com;;https://www.cmu.edu", "aff_unique_abbr": "Google;;CMU", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Mountain View;", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States;" }, { "id": "228XQpErvW", "title": "Automatic Fine-Tuned Offline-to-Online Reinforcement Learning via Increased Simple Moving Average Q-value", "track": "main", "status": "Reject", "tldr": "", "abstract": "Offline-to-online reinforcement learning starts with pre-trained offline models and continuously learns via\n interacting with the environment in online mode. The challenge of it is to adapt to distribution drift while \n maintaining the quality of the learned policy simultaneously. \n We propose a novel policy regularization method that aims to automatically fine-tune the model by \n selectively increasing the average estimated Q-value in the sampled batches. As a result, our models maintain the\n performance of the pre-trained model and improve it, unlike methods that require learning from scratch. \n Furthermore, we added efficient $\\mathcal{O}(1)$ complexity replay buffer techniques to adapt to distribution\n drift efficiently. Our experimental results indicate that the proposed method outperforms state-of-the-art methods \n on the D4RL benchmark.", "keywords": "Reinforcement Learning;Machine Learning", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Hsin-Yu Liu;Bharathan Balaji;Rajesh K. Gupta;Dezhi Hong", "authorids": "~Hsin-Yu_Liu1;~Bharathan_Balaji1;~Rajesh_K._Gupta1;~Dezhi_Hong1", "gender": "M;M;;M", "homepage": "https://www.synergylabs.org/bharath/;http://mesl.ucsd.edu/gupta/;https://cseweb.ucsd.edu/~dehong/;https://hydesmondliu.github.io/", "dblp": "82/8968;213/9138-1.html;60/11186.html;10/6919", "google_scholar": "F0JrXQIAAAAJ;I1w51gUAAAAJ;NsPO1GUAAAAJ;Cv17_VEAAAAJ", "orcid": "0000-0002-9490-2018;0000-0002-6489-7633;;0000-0002-9316-2150", "linkedin": "bharathanbalaji/;rajeshgupta4/;;desmondliu", "or_profile": "~Bharathan_Balaji1;~Rajesh_K._Gupta1;~Dezhi_Hong1;~Hsin_Yu_Liu1", "aff": "Amazon;University of California, San Diego;Amazon;University of California, San Diego", "aff_domain": "amazon.com;ucsd.edu;amazon.com;ucsd.edu", "position": "Researcher;Full Professor;Researcher;PhD student", "bibtex": "@misc{\nliu2024automatic,\ntitle={Automatic Fine-Tuned Offline-to-Online Reinforcement Learning via Increased Simple Moving Average Q-value},\nauthor={Hsin-Yu Liu and Bharathan Balaji and Rajesh K. 
Gupta and Dezhi Hong},\nyear={2024},\nurl={https://openreview.net/forum?id=228XQpErvW}\n}", "github": "", "project": "", "reviewers": "AHJ2;74i3;g2Zo;Thik", "site": "https://openreview.net/forum?id=228XQpErvW", "pdf_size": 1996677, "rating": "3;3;6;6", "confidence": "5;4;4;4", "soundness": "1;2;3;3", "contribution": "1;2;3;3", "presentation": "2;1;3;3", "wc_summary": "44;75;38;97", "wc_strengths": "35;46;24;189", "wc_weaknesses": "334;398;15;365", "wc_questions": "62;64;571;116", "wc_review": "475;583;648;767", "wc_reply_reviewers": "0;143;267;0", "wc_reply_authors": "117;400;401;448", "reply_reviewers": "0;1;3;0", "reply_authors": "1;2;4;1", "rating_avg": [ 4.5, 1.5 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 2.25, 0.82915619758885 ], "contribution_avg": [ 2.25, 0.82915619758885 ], "presentation_avg": [ 2.25, 0.82915619758885 ], "wc_summary_avg": [ 63.5, 23.90083680543424 ], "wc_strengths_avg": [ 73.5, 67.13605588653536 ], "wc_weaknesses_avg": [ 278.0, 153.52035695633333 ], "wc_questions_avg": [ 203.25, 213.42138482354574 ], "wc_review_avg": [ 618.25, 105.80022447991308 ], "wc_reply_reviewers_avg": [ 102.5, 111.48206133723936 ], "wc_reply_authors_avg": [ 341.5, 131.0581931815024 ], "reply_reviewers_avg": [ 1.0, 1.224744871391589 ], "reply_authors_avg": [ 2.0, 1.224744871391589 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.5773502691896258, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:r-iom0jm4S0J:scholar.google.com/&scioq=Automatic+Fine-Tuned+Offline-to-Online+Reinforcement+Learning+via+Increased+Simple+Moving+Average+Q-value&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;1;0;1", "aff_unique_norm": "Amazon;University of California, San Diego", "aff_unique_dep": "Amazon.com, Inc.;", "aff_unique_url": "https://www.amazon.com;https://www.ucsd.edu", "aff_unique_abbr": "Amazon;UCSD", "aff_campus_unique_index": "1;1", "aff_campus_unique": ";San Diego", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "title": "RA-DIT: Retrieval-Augmented Dual Instruction Tuning", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19562", "id": "22OTbutug9", "author_site": "Victoria Lin, Xilun Chen, Mingda Chen, Weijia Shi, Maria Lomeli, Richard James, Pedro Rodriguez, Jacob Kahn, Gergely Szilvasy, Mike Lewis, Luke Zettlemoyer, Scott Yih", "tldr": "", "abstract": "Retrieval-augmented language models (RALMs) improve performance by accessing long-tail and up-to-date knowledge from external data stores, but are challenging to build. Existing approaches require either expensive retrieval-specific modifications to LM pre-training or use post-hoc integration of the data store that leads to suboptimal performance. We introduce Retrieval-Augmented Dual Instruction Tuning (RA-DIT), a lightweight fine-tuning methodology that provides a third option by retrofitting any LLM with retrieval capabilities. Our approach operates in two distinct fine-tuning steps: (1) one updates a pre-trained LM to better use retrieved information, while (2) the other updates the retriever to return more relevant results, as preferred by the LM. By fine-tuning over tasks that require both knowledge utilization and contextual awareness, we demonstrate that each stage yields significant performance improvements, and using both leads to additional gains. 
Our best model, RA-DIT 65B, achieves state-of-the-art performance across a range of knowledge-intensive zero- and few-shot learning benchmarks, significantly outperforming existing in-context RALM approaches by up to +8.9% in 0-shot setting and +1.4% in 5-shot setting on average.", "keywords": "retrieval-augmented language model;large language model;knowledge intensive NLP", "primary_area": "generative models", "supplementary_material": "/attachment/b6da7054aeda7183488cdd1e45f8a3c869210ddc.pdf", "author": "Xi Victoria Lin;Xilun Chen;Mingda Chen;Weijia Shi;Maria Lomeli;Richard James;Pedro Rodriguez;Jacob Kahn;Gergely Szilvasy;Mike Lewis;Luke Zettlemoyer;Wen-tau Yih", "authorids": "~Xi_Victoria_Lin1;~Xilun_Chen1;~Mingda_Chen1;~Weijia_Shi1;~Maria_Lomeli2;~Richard_James2;~Pedro_Rodriguez1;~Jacob_Kahn1;gsz@meta.com;~Mike_Lewis1;~Luke_Zettlemoyer1;~Wen-tau_Yih1", "gender": "F;;M;;F;M;M;M;;M;M;M", "homepage": "http://victorialin.net;https://xilunchen.com;https://mingdachen.github.io/;https://weijiashi.notion.site/;https://mlomeli1.github.io;http://www.richjames.ai;https://www.pedro.ai;https://jacobkahn.me/;;;https://www.cs.washington.edu/people/faculty/lsz/;http://scottyih.org", "dblp": "215/5264;96/10207-2.html;220/2003;132/80601;132/9008;;96/4035;232/2341;;19/6214;21/6793;07/7129", "google_scholar": "gYUOJwMAAAAJ;eUk_hy8AAAAJ;aRncxakAAAAJ;https://scholar.google.com/citations?hl=en;8SK2fPAAAAAJ;;JjpA4qwAAAAJ;_-pugt8AAAAJ;;SnQnQicAAAAJ;https://scholar.google.com.tw/citations?user=UjpbO6IAAAAJ;8rDNIMsAAAAJ", "orcid": ";;;0000-3200-0000-0011;;;;0000-0003-2911-2500;;;;0000-0003-4263-395X", "linkedin": "xivictorialin/;;;weijia-shi-773768112;;duttonrichard/;pedrorodriguezscience/;jacobdavidkahn/;;;luke-zettlemoyer-a0109b226/;scottyih/", "or_profile": "~Xi_Victoria_Lin1;~Xilun_Chen1;~Mingda_Chen1;~Weijia_Shi1;~Maria_Lomeli2;~Richard_James2;~Pedro_Rodriguez1;~Jacob_Kahn1;gsz@meta.com;~Mike_Lewis1;~Luke_Zettlemoyer1;~Wen-tau_Yih1", "aff": "Meta;Meta FAIR;Meta FAIR;University of Washington, Seattle;Meta;Research, Facebook;Meta FAIR;Meta AI;;Facebook AI Research;Meta;Meta Platforms, Inc.", "aff_domain": "fb.com;meta.com;fb.com;uw.edu;meta.com;research.facebook.com;fb.com;meta.com;;fb.com;meta.com;meta.com", "position": "Research Scientist;Research Scientist;Researcher;PhD student;Researcher;Researcher;Research Scientist;Research Engineer;;Research Scientist;Researcher;Research Scientist", "bibtex": "@inproceedings{\nlin2024radit,\ntitle={{RA}-{DIT}: Retrieval-Augmented Dual Instruction Tuning},\nauthor={Xi Victoria Lin and Xilun Chen and Mingda Chen and Weijia Shi and Maria Lomeli and Richard James and Pedro Rodriguez and Jacob Kahn and Gergely Szilvasy and Mike Lewis and Luke Zettlemoyer and Wen-tau Yih},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=22OTbutug9}\n}", "github": "", "project": "", "reviewers": "i49b;HttW;5vF7;68qv", "pdf_size": 2186728, "rating": "5;6;6;8", "confidence": "3;3;4;4", "soundness": "2;3;2;4", "contribution": "2;3;3;4", "presentation": "2;4;2;3", "wc_summary": "99;50;13;87", "wc_strengths": "90;26;16;52", "wc_weaknesses": "142;94;38;95", "wc_questions": "34;3;229;72", "wc_review": "365;173;296;306", "wc_reply_reviewers": "21;0;0;63", "wc_reply_authors": "462;358;676;126", "reply_reviewers": "1;0;0;1", "reply_authors": "3;2;2;1", "rating_avg": [ 6.25, 1.0897247358851685 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.75, 0.82915619758885 ], "contribution_avg": [ 3.0, 0.7071067811865476 ], 
"presentation_avg": [ 2.75, 0.82915619758885 ], "wc_summary_avg": [ 62.25, 33.6851228289285 ], "wc_strengths_avg": [ 46.0, 28.600699292150182 ], "wc_weaknesses_avg": [ 92.25, 36.84002578717882 ], "wc_questions_avg": [ 84.5, 86.93244503636143 ], "wc_review_avg": [ 285.0, 69.831941115796 ], "wc_reply_reviewers_avg": [ 21.0, 25.71964229922337 ], "wc_reply_authors_avg": [ 405.5, 197.95138292015037 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 2.0, 0.7071067811865476 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 12, 0 ], "corr_rating_confidence": 0.6882472016116854, "gs_citation": 142, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6775356328711894537&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=22OTbutug9", "pdf": "https://openreview.net/pdf?id=22OTbutug9", "email": "fb.com;meta.com;fb.com;uw.edu;meta.com;research.facebook.com;fb.com;meta.com;;fb.com;meta.com;meta.com", "author_num": 12, "aff_unique_index": "0;0;0;1;0;0;0;0;0;0;0", "aff_unique_norm": "Meta;University of Washington", "aff_unique_dep": "Meta Platforms, Inc.;", "aff_unique_url": "https://meta.com;https://www.washington.edu", "aff_unique_abbr": "Meta;UW", "aff_campus_unique_index": "1", "aff_campus_unique": ";Seattle", "aff_country_unique_index": "0;0;0;0;0;0;0;0;0;0;0", "aff_country_unique": "United States" }, { "title": "PromptAgent: Strategic Planning with Language Models Enables Expert-level Prompt Optimization", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19561", "id": "22pyNMuIoa", "author_site": "Xinyuan Wang, Chenxi Li, Zhen Wang, Fan Bai, Haotian Luo, Jiayou Zhang, Nebojsa Jojic, Eric Xing, Zhiting Hu", "tldr": "", "abstract": "Expert-level prompts, carefully engineered by human experts who have a deep understanding of both large language models (LLMs) and domain knowledge, are the future of prompting and pivotal to harnessing the full power of advanced LLMs. Discovering such prompts with an automated process remains a sought-after and unresolved challenge. Existing prompt optimization techniques, though automated through iterative sampling, often fall short in injecting domain knowledge and exploring the vast prompt space for complex expert-level prompts efficiently. To address this pressing need and achieve expert-level prompting, we introduce PromptAgent, which autonomously discovers prompts equivalent in quality to those handcrafted by experts. At its core, PromptAgent views prompt optimization as a strategic planning problem and employs a principled planning algorithm (rooted in Monte Carlo Tree Search) to strategically explore the vast expert-level prompt space. PromptAgent interacts with the LLM in a human-like trial-and-error manner during the planning, and injects expert-level knowledge by reflecting on model errors and generating insightful error feedback. This novel formulation allows it to iteratively evaluate intermediate prompts, refine them based on errors, simulate future rewards, and search for high-reward paths leading to expert-level prompts. We apply PromptAgent to 12 tasks spanning three practical domains: BIG-Bench Hard (BBH), domain-expert, and general NLU tasks, showing PromptAgent consistently outperforms strong prompting and prompt optimization baselines by great margins. 
Our qualitative analysis further emphasizes PromptAgent's capability to distill insightful errors into expert-level prompts.", "keywords": "Large Language Models;Expert-level Prompt Optimization;Strategic Planning", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Xinyuan Wang;Chenxi Li;Zhen Wang;Fan Bai;Haotian Luo;Jiayou Zhang;Nebojsa Jojic;Eric Xing;Zhiting Hu", "authorids": "xiw136@ucsd.edu;chl078@ucsd.edu;~Zhen_Wang6;~Fan_Bai5;1203616626@sjtu.edu.cn;~Jiayou_Zhang1;~Nebojsa_Jojic1;~Eric_Xing1;~Zhiting_Hu3", "gender": ";;M;M;;M;;M;M", "homepage": ";;https://zhenwang9102.github.io;https://bflashcp3f.github.io/;;https://jiayouzhang.github.io/;www.research.microsoft.com/~jojic;http://www.cs.cmu.edu/~epxing/;http://zhiting.ucsd.edu", "dblp": ";;78/6727;84/4809-6;;157/3933;20/1944;36/3855;134/4031", "google_scholar": ";;asBaytUAAAAJ;CLc9XQIAAAAJ;;;;https://scholar.google.com.tw/citations?user=5pKTRxEAAAAJ;N7_xhHoAAAAJ", "orcid": ";;0000-0001-7407-5118;;;;;;", "linkedin": ";;zhenwang9102/;;;jiayou-zhang-403072245/;;;", "or_profile": "xiw136@ucsd.edu;chl078@ucsd.edu;~Zhen_Wang6;~Fan_Bai5;1203616626@sjtu.edu.cn;~Jiayou_Zhang1;~Nebojsa_Jojic1;~Eric_Xing1;~Zhiting_Hu3", "aff": ";;University of California, San Diego;Johns Hopkins University;;Mohamed bin Zayed University of Artificial Intelligence;Microsoft Research;School of Computer Science, Carnegie Mellon University;Amazon", "aff_domain": ";;ucsd.edu;jh.edu;;mbzuai.ac.ae; ;cs.cmu.edu;amazon.com", "position": ";;Postdoc;Postdoc;;PhD student;Researcher;Full Professor;Researcher", "bibtex": "@inproceedings{\nwang2024promptagent,\ntitle={PromptAgent: Strategic Planning with Language Models Enables Expert-level Prompt Optimization},\nauthor={Xinyuan Wang and Chenxi Li and Zhen Wang and Fan Bai and Haotian Luo and Jiayou Zhang and Nebojsa Jojic and Eric Xing and Zhiting Hu},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=22pyNMuIoa}\n}", "github": "", "project": "", "reviewers": "zmiy;j86n;gPc5;WJJm", "pdf_size": 1719960, "rating": "3;6;6;8", "confidence": "4;4;2;4", "soundness": "2;3;2;4", "contribution": "1;2;3;3", "presentation": "3;3;3;3", "wc_summary": "75;164;75;41", "wc_strengths": "27;75;79;17", "wc_weaknesses": "49;290;195;18", "wc_questions": "75;56;113;131", "wc_review": "226;585;462;207", "wc_reply_reviewers": "0;0;275;12", "wc_reply_authors": "1516;1893;3214;522", "reply_reviewers": "0;0;1;1", "reply_authors": "3;3;6;1", "rating_avg": [ 5.75, 1.7853571071357126 ], "confidence_avg": [ 3.5, 0.8660254037844386 ], "soundness_avg": [ 2.75, 0.82915619758885 ], "contribution_avg": [ 2.25, 0.82915619758885 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 88.75, 45.60907256237513 ], "wc_strengths_avg": [ 49.5, 27.76238462380348 ], "wc_weaknesses_avg": [ 138.0, 110.31092420970826 ], "wc_questions_avg": [ 93.75, 29.72688177390962 ], "wc_review_avg": [ 370.0, 159.6824974754591 ], "wc_reply_reviewers_avg": [ 71.75, 117.44865899617585 ], "wc_reply_authors_avg": [ 1786.25, 964.5243322488034 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 3.25, 1.7853571071357126 ], "replies_avg": [ 23, 0 ], "authors#_avg": [ 9, 0 ], "corr_rating_confidence": -0.08084520834544431, "gs_citation": 115, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11923415573257859854&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 3, "openreview": 
"https://openreview.net/forum?id=22pyNMuIoa", "pdf": "https://openreview.net/pdf?id=22pyNMuIoa", "email": ";;ucsd.edu;jh.edu;;mbzuai.ac.ae; ;cs.cmu.edu;amazon.com", "author_num": 9, "aff_unique_index": "0;1;2;3;4;5", "aff_unique_norm": "University of California, San Diego;Johns Hopkins University;Mohamed bin Zayed University of Artificial Intelligence;Microsoft;Carnegie Mellon University;Amazon", "aff_unique_dep": ";;;Microsoft Research;School of Computer Science;Amazon.com, Inc.", "aff_unique_url": "https://www.ucsd.edu;https://www.jhu.edu;https://mbzuai.ac.ae;https://www.microsoft.com/en-us/research;https://www.cmu.edu;https://www.amazon.com", "aff_unique_abbr": "UCSD;JHU;MBZUAI;MSR;CMU;Amazon", "aff_campus_unique_index": "0;2", "aff_campus_unique": "San Diego;;Pittsburgh", "aff_country_unique_index": "0;0;1;0;0;0", "aff_country_unique": "United States;United Arab Emirates" }, { "id": "22to0JZ4zh", "title": "Symmetrized Schr\u00f6dinger Bridge Matching", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Schr\u00f6dinger bridge (SB) has demonstrated numerous applications in probabilistic generative modeling. Finding the solution of probability paths aligns with entropy-regularized optimal transport that employs the Sinkhorn algorithm, which is characterized by performing iterative proportional fitting between marginal densities. This paper argues that the standard training of the SB is prone to exaggerate the amount of learning due to its inherent geometric nature. We leverage a symmetrized variant of Sinkhorn to study more lenient convergence of Schr\u00f6dinger potentials and prove distinctive theoretical properties of the symmetrization such as linear convergence and monotonic improvements. To this end, we propose a dynamic SB algorithm named Symmetrized Schr\u00f6dinger Bridge Matching (SSBM). Inspired by score and flow matching models, the concurrent projection scheme of SSBM is conceptualized as matching forward and backward drifts concurrently, constructing a time-symmetric learning objective for the SB model. 
We empirically validate our SB method by solving classical optimal transportation and model-based stochastic optimal control problems with physical dynamics.", "keywords": "schr\u00f6dinger bridge;probabilistic generative method;stochastic optimal control", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Dong-Sig Han;Jaein Kim;HEE BIN YOO;Byoung-Tak Zhang", "authorids": "~Dong-Sig_Han2;~Jaein_Kim2;~HEE_BIN_YOO1;~Byoung-Tak_Zhang1", "gender": "M;M;M;M", "homepage": ";https://github.com/heebinYoo;https://bi.snu.ac.kr/~btzhang/;https://dshan4585.github.io", "dblp": "27/9295-4.html;;09/5682;218/7109", "google_scholar": "https://scholar.google.co.kr/citations?user=6xSSU-8AAAAJ;;sYTUOu8AAAAJ;h1hMIKcAAAAJ", "orcid": "0000-0001-7148-4346;;;", "linkedin": ";;;", "or_profile": "~Jaein_Kim2;~HEE_BIN_YOO1;~Byoung-Tak_Zhang1;~Dong-Sig_Han_Han1", "aff": "Seoul National University;Seoul National University;Seoul National University;Seoul National University", "aff_domain": "snu.ac.kr;snu.ac.kr;snu.ac.kr;snu.ac.kr", "position": "PhD student;PhD student;Full Professor;PhD student", "bibtex": "@misc{\nhan2024symmetrized,\ntitle={Symmetrized Schr\\\"odinger Bridge Matching},\nauthor={Dong-Sig Han and Jaein Kim and HEE BIN YOO and Byoung-Tak Zhang},\nyear={2024},\nurl={https://openreview.net/forum?id=22to0JZ4zh}\n}", "github": "", "project": "", "reviewers": "pujg;8RJL;Ksvt;EfaF", "site": "https://openreview.net/forum?id=22to0JZ4zh", "pdf_size": 719917, "rating": "3;3;3;6", "confidence": "4;4;4;4", "soundness": "3;2;1;3", "contribution": "3;2;2;2", "presentation": "4;1;1;3", "wc_summary": "287;200;53;32", "wc_strengths": "53;78;49;59", "wc_weaknesses": "700;594;408;428", "wc_questions": "441;79;22;128", "wc_review": "1481;951;532;647", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 3.75, 1.299038105676658 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.25, 0.82915619758885 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.25, 1.299038105676658 ], "wc_summary_avg": [ 143.0, 105.36365597301567 ], "wc_strengths_avg": [ 59.75, 11.121488209767612 ], "wc_weaknesses_avg": [ 532.5, 120.68450604779389 ], "wc_questions_avg": [ 167.5, 162.29987677136418 ], "wc_review_avg": [ 902.75, 367.2753565106159 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:-R7CsRECyCQJ:scholar.google.com/&scioq=Symmetrized+Schr%C3%B6dinger+Bridge+Matching&hl=en&as_sdt=0,23", "gs_version_total": 0, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "Seoul National University", "aff_unique_dep": "", "aff_unique_url": "https://www.snu.ac.kr", "aff_unique_abbr": "SNU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "South Korea" }, { "id": "23OEmHVkpq", "title": "Disentanglement Learning via Topology", "track": "main", "status": "Reject", "tldr": "", "abstract": "We propose TopDis (Topological Disentanglement), a method for learning disentangled representations via adding a multi-scale topological loss term. 
Disentanglement is a crucial property of data representations substantial for the explainability and robustness of deep learning models and a step towards high-level cognition. The state-of-the-art methods are based on VAE and encourage the joint distribution of latent variables to be factorized. We take a different perspective on disentanglement by analyzing topological properties of data manifolds. In particular, we optimize the topological similarity for data manifolds traversals. To the best of our knowledge, our paper is the first one to propose a differentiable topological loss for disentanglement learning. Our experiments have shown that the proposed TopDis loss improves disentanglement scores such as MIG, FactorVAE score, SAP score and DCI disentanglement score with respect to state-of-the-art results while preserving the reconstruction quality. Our method works in an unsupervised manner, permitting to apply it for problems without labeled factors of variation. The TopDis loss works even when factors of variation are correlated. Additionally, we show how to use the proposed topological loss to find disentangled directions in a trained GAN.", "keywords": "representation learning;variational autoencoders;disentangled representations;topological data analysis", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/3ca1407e87a500b1df6e1af36f18584899bf8f55.zip", "author": "Nikita Balabin;Daria Voronkova;Ilya Trofimov;Evgeny Burnaev;Serguei Barannikov", "authorids": "~Nikita_Balabin1;~Daria_Voronkova1;~Ilya_Trofimov1;~Evgeny_Burnaev1;~Serguei_Barannikov1", "gender": "M;;;M;", "homepage": ";;;http://faculty.skoltech.ru/people/evgenyburnaev;", "dblp": "310/1857;;130/0370;144/7845;255/5203", "google_scholar": "https://scholar.google.com/citations?hl=en;;https://scholar.google.ru/citations?user=V1c6KjgAAAAJ;https://scholar.google.ru/citations?user=pCRdcOwAAAAJ;https://scholar.google.fr/citations?user=-soT8KcAAAAJ", "orcid": ";;0000-0002-2961-7368;0000-0001-8424-0690;0000-0002-9323-0651", "linkedin": "nikita-balabin-10455b17a/;;https://ru.linkedin.com/in/ilya-trofimov-ba122748;;", "or_profile": "~Nikita_Balabin1;~Daria_Voronkova1;~Ilya_Trofimov1;~Evgeny_Burnaev1;~Serguei_Barannikov1", "aff": "Skolkovo Institute of Science and Technology;;Skoltech;Skolkovo Institute of Science and Technology;CNRS, Institut Mathematiques de Jussieu, Paris Diderot University", "aff_domain": "skoltech.ru;;skoltech.ru;skoltech.ru;imj-prg.fr", "position": "PhD student;;Research scientist;Full Professor;Researcher", "bibtex": "@misc{\nbalabin2024disentanglement,\ntitle={Disentanglement Learning via Topology},\nauthor={Nikita Balabin and Daria Voronkova and Ilya Trofimov and Evgeny Burnaev and Serguei Barannikov},\nyear={2024},\nurl={https://openreview.net/forum?id=23OEmHVkpq}\n}", "github": "", "project": "", "reviewers": "T3Gf;2nX5;VGnt;1sM8", "site": "https://openreview.net/forum?id=23OEmHVkpq", "pdf_size": 21582958, "rating": "5;5;5;6", "confidence": "3;3;4;4", "soundness": "3;3;2;3", "contribution": "2;3;2;2", "presentation": "2;2;2;3", "wc_summary": "56;57;41;83", "wc_strengths": "57;58;63;133", "wc_weaknesses": "145;142;90;363", "wc_questions": "2;56;51;2", "wc_review": "260;313;245;581", "wc_reply_reviewers": "125;0;0;0", "wc_reply_authors": "1095;1133;952;800", "reply_reviewers": "1;0;0;0", "reply_authors": "3;2;2;1", "rating_avg": [ 5.25, 0.4330127018922193 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.75, 
0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 59.25, 15.105876340020794 ], "wc_strengths_avg": [ 77.75, 31.979485611873123 ], "wc_weaknesses_avg": [ 185.0, 105.0690249312327 ], "wc_questions_avg": [ 27.75, 25.810608284191986 ], "wc_review_avg": [ 349.75, 135.88115211463287 ], "wc_reply_reviewers_avg": [ 31.25, 54.12658773652741 ], "wc_reply_authors_avg": [ 995.0, 131.26118999917682 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 2.0, 0.7071067811865476 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.5773502691896257, "gs_citation": 7, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=15099455684142021084&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 7, "aff_unique_index": "0;0;0;1", "aff_unique_norm": "Skolkovo Institute of Science and Technology;Paris Diderot University", "aff_unique_dep": ";Institut Mathematiques de Jussieu", "aff_unique_url": "https://www.skoltech.ru;https://www.univ-paris-diderot.fr", "aff_unique_abbr": "Skoltech;Paris Diderot", "aff_campus_unique_index": "1", "aff_campus_unique": ";Paris", "aff_country_unique_index": "0;0;0;1", "aff_country_unique": "Russian Federation;France" }, { "title": "RETSim: Resilient and Efficient Text Similarity", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19560", "id": "23b9KSNQTX", "author_site": "Marina Zhang, Owen Vallis, Aysegul Bumin, Tanay Vakharia, Elie Bursztein", "tldr": "", "abstract": "This paper introduces RETSim (Resilient and Efficient Text Similarity), a lightweight, multilingual deep learning model trained to produce robust metric embeddings for near-duplicate text retrieval, clustering, and dataset deduplication tasks. We demonstrate that RETSim is significantly more robust and accurate than MinHash and neural text embeddings, achieving new state-of-the-art performance on dataset deduplication, adversarial text retrieval benchmarks, and spam clustering tasks. Additionally, we introduce the W4NT3D benchmark (Wiki-40B 4dversarial Near-T3xt Dataset), enabling the evaluation of models on typo-laden near-duplicate text retrieval in a multilingual setting. 
RETSim and the W4NT3D benchmark are released under the MIT License at https://github.com/google/unisim.", "keywords": "text similarity;text embedding;metric learning;near-duplicate detection;dataset deduplication", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/7e56b306b8c8975180840afc4567947bdb7faaf7.zip", "author": "Marina Zhang;Owen Skipper Vallis;Aysegul Bumin;Tanay Vakharia;Elie Bursztein", "authorids": "~Marina_Zhang1;~Owen_Skipper_Vallis1;~Aysegul_Bumin1;~Tanay_Vakharia1;~Elie_Bursztein1", "gender": "F;;F;;", "homepage": "https://marinazhang.github.io/;https://www.owenvallis.com;;;https://elie.net", "dblp": "340/6965;28/4883;308/4098;;20/7004", "google_scholar": "V9ehnpwAAAAJ;https://scholar.google.com/citations?hl=en;;;Ayw4GsAAAAAJ", "orcid": ";;;;", "linkedin": "marina-zhang;;aysegulbumin;tanay-vakharia-450151130;bursztein", "or_profile": "~Marina_Zhang1;~Owen_Skipper_Vallis1;~Aysegul_Bumin1;~Tanay_Vakharia1;~Elie_Bursztein1", "aff": "Google;Google;;;Google", "aff_domain": "google.com;google.com;;;google.com", "position": "Researcher;Researcher;;;Researcher", "bibtex": "@inproceedings{\nzhang2024retsim,\ntitle={{RETS}im: Resilient and Efficient Text Similarity},\nauthor={Marina Zhang and Owen Skipper Vallis and Aysegul Bumin and Tanay Vakharia and Elie Bursztein},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=23b9KSNQTX}\n}", "github": "", "project": "", "reviewers": "XEvv;XRFc;rc5k;pVcX", "pdf_size": 442973, "rating": "6;6;8;8", "confidence": "4;4;4;4", "soundness": "2;3;3;4", "contribution": "1;2;3;3", "presentation": "2;4;3;3", "wc_summary": "72;486;86;65", "wc_strengths": "76;53;21;80", "wc_weaknesses": "72;14;106;214", "wc_questions": "29;53;74;8", "wc_review": "249;606;287;367", "wc_reply_reviewers": "44;10;78;0", "wc_reply_authors": "830;510;1068;1115", "reply_reviewers": "1;1;1;0", "reply_authors": "2;1;3;2", "rating_avg": [ 7.0, 1.0 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 2.25, 0.82915619758885 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 177.25, 178.41717266003292 ], "wc_strengths_avg": [ 57.5, 23.4574082114798 ], "wc_weaknesses_avg": [ 101.5, 72.80624973173663 ], "wc_questions_avg": [ 41.0, 24.829418035870273 ], "wc_review_avg": [ 377.25, 138.7666656657859 ], "wc_reply_reviewers_avg": [ 33.0, 30.675723300355934 ], "wc_reply_authors_avg": [ 880.75, 239.77424277849363 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 2.0, 0.7071067811865476 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14914000300701128593&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=23b9KSNQTX", "pdf": "https://openreview.net/pdf?id=23b9KSNQTX", "email": "google.com;google.com;;;google.com", "author_num": 5, "aff_unique_index": "0;0;0", "aff_unique_norm": "Google", "aff_unique_dep": "Google", "aff_unique_url": "https://www.google.com", "aff_unique_abbr": "Google", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Mountain View", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "24CZaossxH", "title": "PyTorch Geometric High Order: A Unified Library for High Order Graph Neural Network", "track": 
"main", "status": "Reject", "tldr": "", "abstract": "We introduce PyTorch Geometric High Order (PyGHO), a library designed for High Order Graph Neural Networks (HOGNNs) built upon PyTorch Geometric (PyG). In contrast to ordinary Message Passing Neural Networks (MPNNs) which facilitate message exchange between nodes and are readily implemented using PyG, HOGNNs, encompassing subgraph GNNs and k-WL GNNs, encode node tuples. Such node tuple encoding lacks a universal framework and often necessitates intricate code implementation. The primary objective of PyGHO is to furnish an intuitive and user-friendly interface catering to various HOGNNs. It integrates streamlined data structures for node tuples, offers comprehensive data preprocessing and mini-batch data loading utilities, presents a versatile framework for high order message propagation, and encompasses a repertoire of representative high order GNN methodologies. In this work, we present an detailed overview of the PyGHO library, elucidating its features, and undertake a comparative analysis of existing HOGNNs implemented with PyGHO on real-world tasks.", "keywords": "High Order Graph Neural Network;Library", "primary_area": "infrastructure, software libraries, hardware, etc.", "supplementary_material": "/attachment/7738778ed7f2253d9fe13c65d488034e64b21038.zip", "author": "Xiyuan Wang;Muhan Zhang", "authorids": "~Xiyuan_Wang1;~Muhan_Zhang1", "gender": ";M", "homepage": ";https://muhanzhang.github.io/", "dblp": "95/8542;157/5518", "google_scholar": ";https://scholar.google.com.hk/citations?user=OBBqkosAAAAJ", "orcid": ";0000-0002-7680-6401", "linkedin": "%E5%B8%8C%E5%85%83-%E7%8E%8B-969660221/;jerry-muhan-zhang-a33a1777/", "or_profile": "~Xiyuan_Wang1;~Muhan_Zhang1", "aff": "Peking University;Peking University", "aff_domain": "pku.edu.cn;pku.edu.cn", "position": "PhD student;Assistant Professor", "bibtex": "@misc{\nwang2024pytorch,\ntitle={PyTorch Geometric High Order: A Unified Library for High Order Graph Neural Network},\nauthor={Xiyuan Wang and Muhan Zhang},\nyear={2024},\nurl={https://openreview.net/forum?id=24CZaossxH}\n}", "github": "", "project": "", "reviewers": "gNYJ;tzV7;nV5W;skCY", "site": "https://openreview.net/forum?id=24CZaossxH", "pdf_size": 284290, "rating": "3;3;5;5", "confidence": "5;3;3;3", "soundness": "2;2;2;3", "contribution": "2;2;2;2", "presentation": "1;2;2;3", "wc_summary": "35;51;73;17", "wc_strengths": "13;28;139;21", "wc_weaknesses": "80;210;136;75", "wc_questions": "13;5;2;4", "wc_review": "141;294;350;117", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 3.5, 0.8660254037844386 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.0, 0.7071067811865476 ], "wc_summary_avg": [ 44.0, 20.615528128088304 ], "wc_strengths_avg": [ 50.25, 51.51395442013746 ], "wc_weaknesses_avg": [ 125.25, 54.47648575302926 ], "wc_questions_avg": [ 6.0, 4.183300132670378 ], "wc_review_avg": [ 225.5, 98.87492098606198 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 6, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11402743817870288895&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "aff_unique_index": "0;0", "aff_unique_norm": "Peking 
University", "aff_unique_dep": "", "aff_unique_url": "http://www.pku.edu.cn", "aff_unique_abbr": "Peking U", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "China" }, { "id": "258EqEA05w", "title": "A Simple Data Augmentation for Feature Distribution Skewed Federated Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "Federated learning (FL) facilitates collaborative learning among multiple clients in a distributed manner and ensures privacy protection. However, its performance inevitably degrades, while suffering from data heterogeneity, i.e., non-IID data. In this paper, we focus on the feature distribution skewed FL scenario, which is a common setting in real-world applications. The main challenge of this scenario is feature shift, which is caused by the different underlying distributions of local datasets. Although the previous attempts achieved impressive progress, few studies pay attention to the data itself, i.e., the root of this issue. To this end, the primary goal of this paper is to develop a general data augmentation technique at the input level, to mitigate the feature shift problem. To achieve this goal, we propose a simple yet remarkably effective data augmentation method, namely FedRDN, for feature distribution skewed FL, which randomly injects the statistics of the dataset from the entire federation into the client's data. Then, our method can effectively improve the generalization of features, and thereby mitigate the feature shift problem. Moreover, our FedRDN is a plug-and-play component, which can be seamlessly integrated into the data augmentation flow with only a few lines of code. Extensive experiments on several datasets show that the performance of various representative FL works can be further improved by integrating our FedRDN, which demonstrates its strong scalability and generalizability. 
The source code will be released.", "keywords": "federated learning;data heterogeneity;data augmentation.", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Yunlu Yan;Huazhu Fu;Yuexiang Li;Lei Zhu", "authorids": "~Yunlu_Yan1;~Huazhu_Fu4;~Yuexiang_Li1;~Lei_Zhu1", "gender": "M;M;M;M", "homepage": ";https://hzfu.github.io;https://yuexiangli.github.io;https://sites.google.com/site/indexlzhu/home?authuser=0", "dblp": "294/8769;63/7767;165/6204;99/549-3", "google_scholar": "Ja0QBOgAAAAJ;https://scholar.google.com/citations?hl=en;WsKu4EMAAAAJ;https://scholar.google.com.hk/citations?user=AQtqhaYAAAAJ", "orcid": ";0000-0002-9702-5524;;", "linkedin": ";;;", "or_profile": "~Yunlu_Yan1;~Huazhu_Fu4;~Yuexiang_Li1;~Lei_Zhu1", "aff": "The Hong Kong University of Science and Technology (Guangzhou);Institute of High Performance Computing, Singapore, A*STAR;Medical AI ReSearch (MARS) Group @ GXMU;Hong Kong University of Science and Technology (Guangzhou) & HKUST", "aff_domain": "hkust-gz.edu.cn;ihpc.a-star.edu.sg;gxmu.edu.cn;ust.hk", "position": "PhD student;Principal Scientist;Full Professor;Assistant Professor", "bibtex": "@misc{\nyan2024a,\ntitle={A Simple Data Augmentation for Feature Distribution Skewed Federated Learning},\nauthor={Yunlu Yan and Huazhu Fu and Yuexiang Li and Lei Zhu},\nyear={2024},\nurl={https://openreview.net/forum?id=258EqEA05w}\n}", "github": "", "project": "", "reviewers": "9DEf;rKgT;BGPc;aJPJ", "site": "https://openreview.net/forum?id=258EqEA05w", "pdf_size": 1797449, "rating": "5;5;5;6", "confidence": "4;4;3;3", "soundness": "3;3;3;3", "contribution": "2;2;3;3", "presentation": "3;3;3;2", "wc_summary": "37;67;136;46", "wc_strengths": "68;73;43;35", "wc_weaknesses": "98;120;26;131", "wc_questions": "54;109;112;152", "wc_review": "257;369;317;364", "wc_reply_reviewers": "137;0;0;27", "wc_reply_authors": "1122;696;706;590", "reply_reviewers": "1;0;0;1", "reply_authors": "2;1;1;1", "rating_avg": [ 5.25, 0.4330127018922193 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 71.5, 38.797551469132685 ], "wc_strengths_avg": [ 54.75, 16.099301227071937 ], "wc_weaknesses_avg": [ 93.75, 40.88016022473493 ], "wc_questions_avg": [ 106.75, 34.86671048435743 ], "wc_review_avg": [ 326.75, 45.090880452703516 ], "wc_reply_reviewers_avg": [ 41.0, 56.51106086422374 ], "wc_reply_authors_avg": [ 778.5, 203.46191289772148 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 11, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=17299839277902079733&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "aff_unique_index": "0;1;2;0", "aff_unique_norm": "Hong Kong University of Science and Technology;Institute of High Performance Computing;Guangxi Medical University", "aff_unique_dep": ";;Medical AI ReSearch (MARS) Group", "aff_unique_url": "https://www.ust.hk;https://www.ihpc.a-star.edu.sg;http://www.gxmu.edu.cn", "aff_unique_abbr": "HKUST;IHPC;GXMU", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Guangzhou;", "aff_country_unique_index": "0;1;0;0", "aff_country_unique": "China;Singapore" }, { "id": "25VG15SnkH", "title": "United We Train, Divided We Fail! 
Representation Learning for Time Series by Pretraining from 75 Datasets at Once", "track": "main", "status": "Reject", "tldr": "", "abstract": "In natural language processing and vision, pretraining is utilized to learn effective representations. Unfortunately, the success of pretraining does not easily carry over to time series due to potential mismatch between sources and target. Actually, common belief is that multi-dataset pretraining does not work for time series! Au contraire, we introduce a new self-supervised contrastive pretraining approach to learn one encoding from many unlabeled and diverse time series datasets, so that the single learned representation can then be reused in several target domains for, say, classification. Specifically, we propose the XD-MixUp interpolation method and the Soft Interpolation Contextual Contrasting (SICC) loss. Empirically, this outperforms both supervised training and other self-supervised pretraining methods when finetuning on low-data regimes. This disproves the common belief: We can actually learn from multiple time series datasets, even from 75 at once.", "keywords": "time series;classification;pretraining;representation learning;multi-dataset;transfer learning", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Maurice Kraus;Felix Divo;Devendra Singh Dhami;Kristian Kersting", "authorids": "~Maurice_Kraus1;~Felix_Divo1;~Devendra_Singh_Dhami1;~Kristian_Kersting1", "gender": "M;;M;M", "homepage": ";;https://sites.google.com/view/devendradhami;http://www.ml.informatik.tu-darmstadt.de/", "dblp": "335/8577;;201/2130;40/3793", "google_scholar": "HKA7sQkAAAAJ;;aVlaHfkAAAAJ;QY-earAAAAAJ", "orcid": "0000-0002-6411-3325;;;0000-0002-2873-9152", "linkedin": ";;;", "or_profile": "~Maurice_Kraus1;~Felix_Divo1;~Devendra_Singh_Dhami1;~Kristian_Kersting1", "aff": "Technische Universit\u00e4t Darmstadt;;Eindhoven University of Technology;TU Darmstadt", "aff_domain": "cs.tu-darmstadt.de;;tue.nl;tu-darmstadt.de", "position": "PhD student;;Assistant Professor;Full Professor", "bibtex": "@misc{\nkraus2024united,\ntitle={United We Train, Divided We Fail! 
Representation Learning for Time Series by Pretraining from 75 Datasets at Once},\nauthor={Maurice Kraus and Felix Divo and Devendra Singh Dhami and Kristian Kersting},\nyear={2024},\nurl={https://openreview.net/forum?id=25VG15SnkH}\n}", "github": "", "project": "", "reviewers": "Gxh9;kMWa;KhAg;4uSe", "site": "https://openreview.net/forum?id=25VG15SnkH", "pdf_size": 2198730, "rating": "3;3;3;6", "confidence": "4;4;3;4", "soundness": "2;3;2;4", "contribution": "2;1;2;3", "presentation": "3;3;3;4", "wc_summary": "67;94;101;198", "wc_strengths": "43;64;52;28", "wc_weaknesses": "334;136;200;169", "wc_questions": "40;22;42;8", "wc_review": "484;316;395;403", "wc_reply_reviewers": "167;0;0;105", "wc_reply_authors": "929;596;867;851", "reply_reviewers": "1;0;0;1", "reply_authors": "3;2;2;2", "rating_avg": [ 3.75, 1.299038105676658 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.82915619758885 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 115.0, 49.57317823178175 ], "wc_strengths_avg": [ 46.75, 13.141061600951424 ], "wc_weaknesses_avg": [ 209.75, 75.22092461542866 ], "wc_questions_avg": [ 28.0, 13.92838827718412 ], "wc_review_avg": [ 399.5, 59.466377054601196 ], "wc_reply_reviewers_avg": [ 68.0, 71.44578364046404 ], "wc_reply_authors_avg": [ 810.75, 127.36242577777796 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 2.25, 0.4330127018922193 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.3333333333333333, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6022853401423522021&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 3, "aff_unique_index": "0;1;0", "aff_unique_norm": "Technische Universit\u00e4t Darmstadt;Eindhoven University of Technology", "aff_unique_dep": ";", "aff_unique_url": "https://www.tu-darmstadt.de;https://www.tue.nl", "aff_unique_abbr": "TUD;TU/e", "aff_campus_unique_index": "1", "aff_campus_unique": ";Darmstadt", "aff_country_unique_index": "0;1;0", "aff_country_unique": "Germany;Netherlands" }, { "title": "Zero-Shot Continuous Prompt Transfer: Generalizing Task Semantics Across Language Models", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19559", "id": "26XphugOcS", "author_site": "Zijun Wu, Yongkang Wu, Lili Mou", "tldr": "", "abstract": "Prompt tuning in natural language processing (NLP) has become an increasingly popular method for adapting large language models to specific tasks. However, the transferability of these prompts, especially continuous prompts, between different models remains a challenge. In this work, we propose a zero-shot continuous prompt transfer method, where source prompts are encoded into relative space and the corresponding target prompts are searched for transferring to target models. Experimental results confirm the effectiveness of our method, showing that 'task semantics' in continuous prompts can be generalized across various language models. 
Moreover, we find that combining 'task semantics' from multiple source models can further enhance the performance of transfer.", "keywords": "continuous prompt tuning;zero-shot prompt transfer;cross-model prompt transfer", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "/attachment/a5a62ca65940640c67d97235770b7058762be598.pdf", "author": "Zijun Wu;Yongkang Wu;Lili Mou", "authorids": "~Zijun_Wu2;~Yongkang_Wu1;~Lili_Mou1", "gender": "M;;M", "homepage": ";;https://lili-mou.github.io/", "dblp": ";;", "google_scholar": "rmET9UUAAAAJ;YYJIxacAAAAJ;https://scholar.google.com.hk/schhp?hl=en", "orcid": ";;", "linkedin": "zijun-wu-844474195/?originalSubdomain=ca;;", "or_profile": "~Zijun_Wu2;~Yongkang_Wu1;~Lili_Mou1", "aff": "University of Alberta;;University of Alberta", "aff_domain": "ualberta.ca;;ualberta.ca", "position": "PhD student;;Assistant Professor", "bibtex": "@inproceedings{\nwu2024zeroshot,\ntitle={Zero-Shot Continuous Prompt Transfer: Generalizing Task Semantics Across Language Models},\nauthor={Zijun Wu and Yongkang Wu and Lili Mou},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=26XphugOcS}\n}", "github": "", "project": "", "reviewers": "AxcL;NAhq;2xK8;6csB", "pdf_size": 482692, "rating": "6;6;8;8", "confidence": "4;4;3;2", "soundness": "3;3;3;3", "contribution": "3;2;3;4", "presentation": "3;3;3;3", "wc_summary": "74;166;130;91", "wc_strengths": "54;14;51;140", "wc_weaknesses": "52;15;148;43", "wc_questions": "118;1;13;19", "wc_review": "298;196;342;293", "wc_reply_reviewers": "72;25;100;19", "wc_reply_authors": "805;337;224;413", "reply_reviewers": "3;1;1;1", "reply_authors": "4;2;2;2", "rating_avg": [ 7.0, 1.0 ], "confidence_avg": [ 3.25, 0.82915619758885 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 3.0, 0.7071067811865476 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 115.25, 35.64670391494843 ], "wc_strengths_avg": [ 64.75, 46.21349911010851 ], "wc_weaknesses_avg": [ 64.5, 50.102395152327794 ], "wc_questions_avg": [ 37.75, 46.78341052125208 ], "wc_review_avg": [ 282.25, 53.32154817707378 ], "wc_reply_reviewers_avg": [ 54.0, 33.56337289367682 ], "wc_reply_authors_avg": [ 444.75, 218.59137105567547 ], "reply_reviewers_avg": [ 1.5, 0.8660254037844386 ], "reply_authors_avg": [ 2.5, 0.8660254037844386 ], "replies_avg": [ 22, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.9045340337332909, "gs_citation": 6, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5565109728828905576&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=26XphugOcS", "pdf": "https://openreview.net/pdf?id=26XphugOcS", "email": "ualberta.ca;;ualberta.ca", "author_num": 3, "aff_unique_index": "0;0", "aff_unique_norm": "University of Alberta", "aff_unique_dep": "", "aff_unique_url": "https://www.ualberta.ca", "aff_unique_abbr": "UAlberta", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "Canada" }, { "id": "27YiINkhw3", "title": "ToolDec: Syntax Error-Free and Generalizable Tool Use for LLMs via Finite-State Decoding", "track": "main", "status": "Reject", "tldr": "", "abstract": "Large language models (LLMs) have shown promising capabilities in using external tools to solve complex problems.\nHowever, existing approaches either involve fine-tuning on tool demonstrations, which does not generalize to new tools without 
additional training, or providing tool documentation in context, limiting the number of tools. Both approaches often generate syntactically invalid tool calls.\nIn this paper, we propose ToolDec, a finite-state machine-guided decoding algorithm for tool-augmented LLMs.\nToolDec eliminates tool-related errors for any tool-augmented LLMs by ensuring valid tool names and type-conforming arguments.\nFurthermore, ToolDec enables LLM to effectively select tools using only the information contained in their names, with no need for fine-tuning or in-context documentation.\nWe evaluated multiple prior methods and their ToolDec-enhanced versions on a variety of tasks involving tools like math functions, knowledge graph relations, and complex real-world RESTful APIs.\nOur experiments show that ToolDec reduces syntactic errors to zero, consequently achieving significantly better performance and as much as a 2x speedup.\nWe also show that ToolDec achieves superior generalization performance on unseen tools, performing up to 8x better than the baselines", "keywords": "large language models;augmented language models;finite-state machines", "primary_area": "neurosymbolic & hybrid AI systems (physics-informed, logic & formal reasoning, etc.)", "supplementary_material": "", "author": "Kexun Zhang;Hongqiao Chen;Lei Li;William Yang Wang", "authorids": "~Kexun_Zhang1;~Hongqiao_Chen2;~Lei_Li11;~William_Yang_Wang2", "gender": "M;;M;", "homepage": "https://zkx06111.github.io;;https://www.cs.cmu.edu/~leili;", "dblp": "295/8815;;13/7007-5.html;", "google_scholar": ";;BYXqAlwAAAAJ;", "orcid": ";;0000-0003-3095-9776;", "linkedin": ";;;", "or_profile": "~Kexun_Zhang1;~Hongqiao_Chen2;~Lei_Li11;~William_Yang_Wang2", "aff": "Carnegie Mellon University;;School of Computer Science, Carnegie Mellon University;", "aff_domain": "cmu.edu;;cs.cmu.edu;", "position": "PhD student;;Assistant Professor;", "bibtex": "@misc{\nzhang2024tooldec,\ntitle={ToolDec: Syntax Error-Free and Generalizable Tool Use for {LLM}s via Finite-State Decoding},\nauthor={Kexun Zhang and Hongqiao Chen and Lei Li and William Yang Wang},\nyear={2024},\nurl={https://openreview.net/forum?id=27YiINkhw3}\n}", "github": "", "project": "", "reviewers": "uQYf;R8ud;ydwb;7DQS", "site": "https://openreview.net/forum?id=27YiINkhw3", "pdf_size": 701731, "rating": "5;5;6;8", "confidence": "4;5;4;4", "soundness": "2;3;3;4", "contribution": "1;2;3;3", "presentation": "2;3;3;4", "wc_summary": "128;141;65;79", "wc_strengths": "64;68;50;47", "wc_weaknesses": "187;116;175;81", "wc_questions": "80;52;17;1", "wc_review": "459;377;307;208", "wc_reply_reviewers": "24;19;28;82", "wc_reply_authors": "1032;841;1391;653", "reply_reviewers": "1;1;1;1", "reply_authors": "4;3;4;2", "rating_avg": [ 6.0, 1.224744871391589 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 2.25, 0.82915619758885 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 103.25, 31.971667144520318 ], "wc_strengths_avg": [ 57.25, 8.926785535678562 ], "wc_weaknesses_avg": [ 139.75, 43.27455950093542 ], "wc_questions_avg": [ 37.5, 30.696090956341656 ], "wc_review_avg": [ 337.75, 92.22628421442555 ], "wc_reply_reviewers_avg": [ 38.25, 25.459526704163217 ], "wc_reply_authors_avg": [ 979.25, 272.88859906562607 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 3.25, 0.82915619758885 ], "replies_avg": [ 24, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.4714045207910316, "gs_citation": 2, "gs_cited_by_link": 
"https://scholar.google.com/scholar?cites=11606521451468694141&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 3, "aff_unique_index": "0;0", "aff_unique_norm": "Carnegie Mellon University", "aff_unique_dep": "", "aff_unique_url": "https://www.cmu.edu", "aff_unique_abbr": "CMU", "aff_campus_unique_index": "1", "aff_campus_unique": ";Pittsburgh", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "title": "Ground-A-Video: Zero-shot Grounded Video Editing using Text-to-image Diffusion Models", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19558", "id": "28L2FCtMWq", "author_site": "Hyeonho Jeong, Jong Chul YE", "tldr": "", "abstract": "This paper introduces a novel grounding-guided video-to-video translation framework called Ground-A-Video for multi-attribute video editing.\nRecent endeavors in video editing have showcased promising results in single-attribute editing or style transfer tasks, either by training T2V models on text-video data or adopting training-free methods.\nHowever, when confronted with the complexities of multi-attribute editing scenarios, they exhibit shortcomings such as omitting or overlooking intended attribute changes, modifying the wrong elements of the input video, and failing to preserve regions of the input video that should remain intact.\nGround-A-Video attains temporally consistent multi-attribute editing of input videos in a training-free manner without aforementioned shortcomings.\nCentral to our method is the introduction of cross-frame gated attention which incorporates groundings information into the latent representations in a temporally consistent fashion, along with Modulated Cross-Attention and optical flow guided inverted latents smoothing.\nExtensive experiments and applications demonstrate that Ground-A-Video's zero-shot capacity outperforms other baseline methods in terms of edit-accuracy and frame consistency.\nFurther results and code are available at our project page ( http://ground-a-video.github.io )", "keywords": "Computer Vision;Diffusion Models;Video Editing", "primary_area": "generative models", "supplementary_material": "", "author": "Hyeonho Jeong;Jong Chul Ye", "authorids": "~Hyeonho_Jeong1;~Jong_Chul_Ye1", "gender": "M;M", "homepage": "https://hyeonho99.github.io/;https://bispl.weebly.com/", "dblp": "272/8078;15/5613", "google_scholar": "Pa7EfsEAAAAJ;HNMjoNEAAAAJ", "orcid": "0000-0002-6864-4190;", "linkedin": "hyeonho-jeong-jhh/;", "or_profile": "~Hyeonho_Jeong1;~Jong_Chul_Ye1", "aff": "Adobe Systems;Korea Advanced Institute of Science & Technology", "aff_domain": "adobe.com;kaist.ac.kr", "position": "Intern;Full Professor", "bibtex": "@inproceedings{\njeong2024groundavideo,\ntitle={Ground-A-Video: Zero-shot Grounded Video Editing using Text-to-image Diffusion Models},\nauthor={Hyeonho Jeong and Jong Chul Ye},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=28L2FCtMWq}\n}", "github": "", "project": "", "reviewers": "NYGw;TXKT;F2zK;vcyz", "pdf_size": 50110846, "rating": "6;6;6;8", "confidence": "4;3;4;4", "soundness": "2;3;2;4", "contribution": "2;3;3;3", "presentation": "2;3;2;3", "wc_summary": "50;44;114;111", "wc_strengths": "48;111;58;50", "wc_weaknesses": "52;215;157;92", "wc_questions": "68;9;25;3", "wc_review": "218;379;354;256", "wc_reply_reviewers": "47;18;73;0", "wc_reply_authors": "1151;1020;1175;427", "reply_reviewers": "1;1;2;0", "reply_authors": "4;3;5;2", "rating_avg": [ 
6.5, 0.8660254037844386 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.82915619758885 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 79.75, 32.83576556135093 ], "wc_strengths_avg": [ 66.75, 25.82029240732955 ], "wc_weaknesses_avg": [ 129.0, 62.20530523998737 ], "wc_questions_avg": [ 26.25, 25.410381736605217 ], "wc_review_avg": [ 301.75, 66.71722041572175 ], "wc_reply_reviewers_avg": [ 34.5, 27.84331158465171 ], "wc_reply_authors_avg": [ 943.25, 303.8390815876062 ], "reply_reviewers_avg": [ 1.0, 0.7071067811865476 ], "reply_authors_avg": [ 3.5, 1.118033988749895 ], "replies_avg": [ 26, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.3333333333333333, "gs_citation": 39, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=7963234025556491814&as_sdt=400005&sciodt=0,14&hl=en", "gs_version_total": 7, "openreview": "https://openreview.net/forum?id=28L2FCtMWq", "pdf": "https://openreview.net/pdf?id=28L2FCtMWq", "email": "adobe.com;kaist.ac.kr", "author_num": 2, "aff_unique_index": "0;1", "aff_unique_norm": "Adobe;Korea Advanced Institute of Science and Technology", "aff_unique_dep": "Adobe Systems Incorporated;", "aff_unique_url": "https://www.adobe.com;https://www.kaist.ac.kr", "aff_unique_abbr": "Adobe;KAIST", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1", "aff_country_unique": "United States;South Korea" }, { "id": "28gMnEAgl9", "title": "Large Language Models Are Not Strong Abstract Reasoners", "track": "main", "status": "Reject", "tldr": "", "abstract": "Large Language Models have shown tremendous performance on a large variety of natural language processing tasks, ranging from text comprehension to common sense reasoning. \nHowever, the mechanisms responsible for this success remain opaque, and it is unclear whether LLMs can achieve human-like cognitive capabilities or whether these models are still fundamentally circumscribed.\nAbstract reasoning is a fundamental task for cognition, consisting of finding and applying a general pattern from few data. Evaluating deep neural architectures on this task could give insight into their potential limitations regarding reasoning and their broad generalisation abilities, yet this is currently an under-explored area.\nIn this paper, we introduce a new benchmark for evaluating language models beyond memorization on abstract reasoning tasks. We perform extensive evaluations of state-of-the-art LLMs, showing that they achieve very limited performance in contrast with other natural language tasks, and we examine the reasons for this difference. 
We apply techniques that have been shown to improve performance on other NLP tasks and show that their impact for abstract reasoning is limited.", "keywords": "Abstract Reasoning;Large Language Models;Natural Language Processing", "primary_area": "causal reasoning", "supplementary_material": "/attachment/36340cd345a805ed81fdde638144cdad20dc5245.zip", "author": "Gael Gendron;Qiming Bao;Michael Witbrock;Gillian Dobbie", "authorids": "~Gael_Gendron1;~Qiming_Bao1;~Michael_Witbrock1;~Gillian_Dobbie1", "gender": ";M;F;M", "homepage": ";https://14h034160212.github.io/;https://profiles.auckland.ac.nz/g-dobbie;", "dblp": "310/1562;126/9037-1;d/GDobbie;w/MichaelJWitbrock", "google_scholar": "https://scholar.google.com/citations?hl=en;t-PqsgcAAAAJ;https://scholar.google.com.au/citations?user=v19BUHIAAAAJ;https://scholar.google.com/citations?hl=en", "orcid": "0000-0002-2457-934X;0000-0002-1000-7383;0000-0001-7245-0367;0000-0002-7554-0971", "linkedin": ";qiming-bill-bao-773757166/;gill-dobbie-3734822/;witbrock", "or_profile": "~Gael_Gendron1;~Qiming_Bao1;~Gillian_Dobbie1;~Michael_J._Witbrock1", "aff": "University of Auckland;University of Auckland;University of Auckland;University of Auckland", "aff_domain": "auckland.ac.nz;aucklanduni.ac.nz;auckland.ac.nz;auckland.ac.nz", "position": "PhD student;PhD student;Full Professor;Professor", "bibtex": "@misc{\ngendron2024large,\ntitle={Large Language Models Are Not Strong Abstract Reasoners},\nauthor={Gael Gendron and Qiming Bao and Michael Witbrock and Gillian Dobbie},\nyear={2024},\nurl={https://openreview.net/forum?id=28gMnEAgl9}\n}", "github": "", "project": "", "reviewers": "As6m;2kzP;LbQe", "site": "https://openreview.net/forum?id=28gMnEAgl9", "pdf_size": 403704, "rating": "5;5;6", "confidence": "4;4;3", "soundness": "2;2;3", "contribution": "2;2;3", "presentation": "3;3;3", "wc_summary": "68;35;58", "wc_strengths": "36;39;75", "wc_weaknesses": "64;65;65", "wc_questions": "49;1;92", "wc_review": "217;140;290", "wc_reply_reviewers": "75;0;0", "wc_reply_authors": "815;894;761", "reply_reviewers": "1;0;0", "reply_authors": "2;2;2", "rating_avg": [ 5.333333333333333, 0.4714045207910317 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 53.666666666666664, 13.816254517375139 ], "wc_strengths_avg": [ 50.0, 17.72004514666935 ], "wc_weaknesses_avg": [ 64.66666666666667, 0.4714045207910317 ], "wc_questions_avg": [ 47.333333333333336, 37.16928241916375 ], "wc_review_avg": [ 215.66666666666666, 61.24450088692771 ], "wc_reply_reviewers_avg": [ 25.0, 35.35533905932738 ], "wc_reply_authors_avg": [ 823.3333333333334, 54.61583002105607 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 2.0, 0.0 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.9999999999999997, "gs_citation": 69, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6764763760076446864&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 6, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "University of Auckland", "aff_unique_dep": "", "aff_unique_url": "https://www.auckland.ac.nz", "aff_unique_abbr": "UoA", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "New Zealand" }, { "id": "28kAFnQZ5V", "title": "TENSORIZED ATTENTION MODEL", "track": "main", "status": 
"Reject", "tldr": "", "abstract": "In recent years, attention mechanisms have played a crucial role in the\nsuccess of Transformer models, as seen in platforms like OpenAI's\nChatGPT. However, these models often struggle to compute attention\nweights across various object types, such as 'comments,' 'replies,' and\nspecific 'subjects,' which naturally express relationships in many\nreal-world scenarios. This limitation can potentially impact prediction\naccuracy.\nTo overcome this limitation, we introduce the Tensorized Attention Model\n(TAM). By leveraging Tucker decomposition, TAM calculates attention\nweights across a diverse array of objects and seamlessly integrates them\ninto Transformer outputs. \nWe have implemented TAM within the Transformer encoder and have\nshowcased its effectiveness in response selection tasks. Our model takes\ninto account relationships based on 'the current context in the\ndialogue', 'the entire dialogue history', and 'the subject matter of the\ndialogue'. Evaluation using the Reddit dataset across a wide variety of\ntopics indicates that TAM significantly outperforms existing\nTransformer-based methods in terms of accuracy.", "keywords": "Attention model;Tensorized Transformer;Encoder model", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Makoto Nakatsuji;Yasuhiro Fujiwara;Narichika Nomoto;Atsushi Fukayama", "authorids": "~Makoto_Nakatsuji1;~Yasuhiro_Fujiwara1;~Narichika_Nomoto1;~Atsushi_Fukayama1", "gender": "M;M;M;M", "homepage": "https://tw.rpi.edu/web/person/MakotoNakatsuji;http://www.linkedin.com/in/yasuhiro-fujiwara-8960b0180;https://dl.acm.org/profile/99660959690;", "dblp": "86/2250;02/2520;;", "google_scholar": "https://scholar.google.co.jp/citations?user=NILKxCIAAAAJ;https://scholar.google.co.jp/citations?user=kCaZaaMAAAAJ;;", "orcid": "0000-0003-2181-0056;0000-0001-9578-1118;;", "linkedin": "https://linkedin.com/in/makoto-nakatsuji-a7693916;;;atsushi-fukayama-5551563a/", "or_profile": "~Makoto_Nakatsuji1;~Yasuhiro_Fujiwara1;~Narichika_Nomoto1;~Atsushi_Fukayama1", "aff": "NTT, ;NTT;NTT, The University of Tokyo;Nippon Telegraph and Telephone Corporation", "aff_domain": "ntt.co.jp;ntt.co.jp;ntt.co.jp;group.ntt", "position": "Researcher;Researcher;Researcher;Researcher", "bibtex": "@misc{\nnakatsuji2024tensorized,\ntitle={{TENSORIZED} {ATTENTION} {MODEL}},\nauthor={Makoto Nakatsuji and Yasuhiro Fujiwara and Narichika Nomoto and Atsushi Fukayama},\nyear={2024},\nurl={https://openreview.net/forum?id=28kAFnQZ5V}\n}", "github": "", "project": "", "reviewers": "4BZc;iEpi;qc5V", "site": "https://openreview.net/forum?id=28kAFnQZ5V", "pdf_size": 813413, "rating": "5;5;6", "confidence": "3;5;4", "soundness": "3;2;3", "contribution": "2;2;3", "presentation": "3;2;3", "wc_summary": "53;46;115", "wc_strengths": "96;26;61", "wc_weaknesses": "78;117;29", "wc_questions": "65;11;262", "wc_review": "292;200;467", "wc_reply_reviewers": "0;0;54", "wc_reply_authors": "958;887;1150", "reply_reviewers": "0;0;1", "reply_authors": "3;3;3", "rating_avg": [ 5.333333333333333, 0.4714045207910317 ], "confidence_avg": [ 4.0, 0.816496580927726 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 71.33333333333333, 31.008959278820623 ], "wc_strengths_avg": [ 61.0, 28.577380332470412 ], "wc_weaknesses_avg": [ 74.66666666666667, 
36.003086287459055 ], "wc_questions_avg": [ 112.66666666666667, 107.87132252003875 ], "wc_review_avg": [ 319.6666666666667, 110.74394891921735 ], "wc_reply_reviewers_avg": [ 18.0, 25.45584412271571 ], "wc_reply_authors_avg": [ 998.3333333333334, 111.09255400590787 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 3.0, 0.0 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:v8polrHrx_wJ:scholar.google.com/&scioq=TENSORIZED+ATTENTION+MODEL&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;0;1;2", "aff_unique_norm": "NTT Corporation;University of Tokyo;Nippon Telegraph and Telephone Corporation", "aff_unique_dep": ";;", "aff_unique_url": "https://www.ntt.co.jp;https://www.u-tokyo.ac.jp;https://www.ntt.co.jp", "aff_unique_abbr": "NTT;UTokyo;NTT", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "Japan" }, { "id": "29pGC6IYaL", "title": "Maximizing LLMs Potential: Enhancing Mongolian Chinese Machine Translation with RL Agents and Adversarial Multi Knowledge Distillation", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Despite the impressive performance of Large Language Models (LLMs) in Natural Language Processing (NLP), they still face challenges in low-resource translation tasks, particularly in Mongolian to Chinese machine translation, often yielding suboptimal results. To address this issue, we propose an innovative approach that combines multi-source knowledge distillation and incorporates Reinforcement Learning (RL) to help models acquire and transfer knowledge from LLMs more effectively. RL plays a crucial role in this, making dynamic decisions to determine useful information for low-resource translation models and how to extract it efficiently. 
We introduce a new reward function to comprehensively guide knowledge distillation, and experiments show that this approach harnesses the potential of LLMs, significantly improving translation quality in low-resource settings.", "keywords": "Large Language Models;Reinforcement Learning;Adversarial Knowledge Distillation;Mongolian Chinese Machine Translation", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/7bc668c29cd2f97957fc2cab260dc869647cf12c.zip", "author": "Xu Liuxu;YiLa Su;Nier Wu;Yatu Ji;Huinuan Zhang", "authorids": "~Xu_Liuxu1;~YiLa_Su1;~Nier_Wu1;~Yatu_Ji1;~Huinuan_Zhang1", "gender": "M;M;M;M;", "homepage": "https://github.com/;https://github.com/;https://id.qq.com/index.html#info;;", "dblp": ";;;245/8301;", "google_scholar": ";;;;", "orcid": ";;;;", "linkedin": ";;;;", "or_profile": "~Xu_Liuxu1;~YiLa_Su1;~Nier_Wu1;~Yatu_Ji1;~Huinuan_Zhang1", "aff": "Inner Mongolia University of Technology;;inner mongolia university;Inner Mongolia University;", "aff_domain": "imut.edu;;imu.edu.cn;imu.edu.cn;", "position": "MS student;;PhD student;PhD student;", "bibtex": "@misc{\nanonymous2025maximizing,\ntitle={Maximizing {LLM}s Potential: Enhancing Mongolian Chinese Machine Translation with {RL} Agents and Adversarial Multi Knowledge Distillation},\nauthor={Anonymous},\nyear={2025},\nurl={https://openreview.net/forum?id=29pGC6IYaL}\n}", "github": "", "project": "", "reviewers": "Mjnh;NGkR;hubM", "site": "https://openreview.net/forum?id=29pGC6IYaL", "pdf_size": 510324, "rating": "1;5;5", "confidence": "5;3;5", "soundness": "1;2;3", "contribution": "2;2;2", "presentation": "1;3;3", "wc_summary": "80;96;54", "wc_strengths": "24;24;43", "wc_weaknesses": "165;105;70", "wc_questions": "42;54;2", "wc_review": "311;279;169", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 3.6666666666666665, 1.8856180831641267 ], "confidence_avg": [ 4.333333333333333, 0.9428090415820634 ], "soundness_avg": [ 2.0, 0.816496580927726 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.3333333333333335, 0.9428090415820634 ], "wc_summary_avg": [ 76.66666666666667, 17.30767331432956 ], "wc_strengths_avg": [ 30.333333333333332, 8.956685895029603 ], "wc_weaknesses_avg": [ 113.33333333333333, 39.228674319799396 ], "wc_questions_avg": [ 32.666666666666664, 22.23110933404409 ], "wc_review_avg": [ 253.0, 60.81666438293592 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.4999999999999999, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:McokaE6rt08J:scholar.google.com/&scioq=Maximizing+LLMs+Potential:+Enhancing+Mongolian+Chinese+Machine+Translation+with+RL+Agents+and+Adversarial+Multi+Knowledge+Distillation&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;1;1", "aff_unique_norm": "Inner Mongolia University of Technology;Inner Mongolia University", "aff_unique_dep": ";", "aff_unique_url": "http://www.imut.edu.cn;http://www.imu.edu.cn", "aff_unique_abbr": "IMUT;", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "China" }, { "id": "2A199SAhW3", "title": "Learning Pseudo 3D Guidance for View-consistent 3D Texturing with 2D Diffusion", "track": "main", "status": "Withdraw", 
"tldr": "", "abstract": "Text-driven 3D texturing requires the generation of high-fidelity texture that conforms to given geometry and description. Recently, the high-quality text-to-image generation ability of 2D diffusion model has significantly promoted this task, by converting it into a texture optimization process guided by multi-view synthesized images. Thus the generation of high-quality and multi-view consistency images becomes the key issue. State-of-the-art methods introduce global consistency by treating novel view image generation as image inpainting conditioned on the texture generated by previously seen views. However, due to the error accumulation of inpainting itself and the occlusion between object parts, these inpainting-based methods often fail to deal with long-range texture consistency and the learned texture is of low quality. To address these, we present P3G, a text to 3D texturing approach based on learned Pseudo 3D Guidance. The key idea of P3D is to first learn a coarse but view-consistent texture, to serve as a semantics and layout guidance for high-quality view-consistent multi-view image generation. To this end, we propose a novel method to enable the learning of the pseudo 3D guidance, and design an efficient framework for high-quality and multi-view consistent image generation that incorporates both the depth map, the learned high-level semantics and layout guidance, and the previously generated texture. Quantitative and qualitative evaluation on variant 3D shapes demonstrates the superiority of our P3G on both consistency and quality.", "keywords": "3D Texturing;Diffusion Model", "primary_area": "generative models", "supplementary_material": "/attachment/1ebf2a5d9f44a50b3c8fcffbe805dd40812325fc.zip", "author": "Kehan Li;Yanbo Fan;Yang Wu;Zhongqian Sun;Yang Wei;Li Yuan;Jie Chen", "authorids": "~Kehan_Li1;~Yanbo_Fan1;~Yang_Wu1;~Zhongqian_Sun1;~Yang_Wei2;~Li_Yuan2;~Jie_Chen15", "gender": "M;M;M;M;M;M;M", "homepage": ";https://sites.google.com/site/yanbofan0124/;;;;https://aimia-pku.github.io/;https://yuanli2333.github.io/", "dblp": "206/5336-2;181/4574;56/1428-1;70/8500;03/1094-32.html;92/6289-1;98/4583-7", "google_scholar": ";OlOqHyUAAAAJ;https://scholar.google.com.hk/citations?user=vwOQ-UIAAAAJ;;;https://scholar.google.fi/citations?user=ZAZFfwwAAAAJ;-5juAR0AAAAJ", "orcid": ";0000-0002-8530-485X;;;;;0000-0002-2120-5588", "linkedin": ";;;;;;", "or_profile": "~Kehan_Li1;~Yanbo_Fan1;~Yang_Wu1;~Zhongqian_Sun1;~Yang_Wei2;~Jie_Chen15;~Yuan_LI2", "aff": "Peking University;Ant Research;Tencent AI Lab;Tencent AI Lab;Tencent AI Lab;Peking University;Peking University", "aff_domain": "pku.edu.cn;antgroup.com;tencent.com;tencent.com;tencent.com;pku.edu.cn;pku.edu.cn", "position": "MS student;Associate Professor;Principal Researcher;Researcher;Researcher;Associate Professor;Assistant Professor", "bibtex": "@misc{\nli2024learning,\ntitle={Learning Pseudo 3D Guidance for View-consistent 3D Texturing with 2D Diffusion},\nauthor={Kehan Li and Yanbo Fan and Yang Wu and Zhongqian Sun and Yang Wei and Li Yuan and Jie Chen},\nyear={2024},\nurl={https://openreview.net/forum?id=2A199SAhW3}\n}", "github": "", "project": "", "reviewers": "ruEM;ij6J;Nu8g;vaRt", "site": "https://openreview.net/forum?id=2A199SAhW3", "pdf_size": 3347506, "rating": "3;3;5;5", "confidence": "4;4;4;3", "soundness": "2;2;2;2", "contribution": "2;2;2;2", "presentation": "2;2;3;2", "wc_summary": "85;68;30;61", "wc_strengths": "68;54;40;27", "wc_weaknesses": "202;95;85;211", "wc_questions": "48;27;4;41", 
"wc_review": "403;244;159;340", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 61.0, 19.912307751739878 ], "wc_strengths_avg": [ 47.25, 15.31951369985353 ], "wc_weaknesses_avg": [ 148.25, 58.443883341201754 ], "wc_questions_avg": [ 30.0, 16.80773631397161 ], "wc_review_avg": [ 286.5, 92.86684015298464 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=2815068178139544979&as_sdt=5,48&sciodt=0,48&hl=en", "gs_version_total": 5, "aff_unique_index": "0;1;2;2;2;0;0", "aff_unique_norm": "Peking University;Ant Research;Tencent", "aff_unique_dep": ";;Tencent AI Lab", "aff_unique_url": "http://www.pku.edu.cn;https://www.antgroup.com;https://ai.tencent.com", "aff_unique_abbr": "Peking U;Ant Research;Tencent AI Lab", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0;0", "aff_country_unique": "China" }, { "id": "2BfZMh9td4", "title": "Beyond One-Preference-for-All: Multi-Objective Direct Preference Optimization", "track": "main", "status": "Reject", "tldr": "", "abstract": "Language models (LMs), despite aligning well with an average labeler through reinforcement learning from human feedback (RLHF), may not universally suit diverse human preferences. Recent approaches therefore opt for customization by collecting multi-dimensional feedback and creating distinct rewards for each dimension (e.g., helpfulness, harmlessness, honesty). LMs can then be tailored to different preferences using multi-objective RL (MORL) with different reward weightings. Yet, RL fine-tuning is unstable and resource-heavy, especially for MORLHF with diverse and usually conflicting objectives. In this paper, we present Multi-Objective Direct Preference Optimization (MODPO), an RL-free algorithm that extends Direct Preference Optimization (DPO) for multiple alignment objectives. Essentially, MODPO trains different LMs to represent different collective reward models that combine all objectives with specific weightings. With a simple cross-entropy loss, the LMs optimized against the MODPO objective are analytically the exact solutions of the original MORLHF objective. 
Empirical results in safety alignment and long-form question answering confirm that MODPO matches or outperforms existing methods, efficiently producing a Pareto-optimal set of LMs that cater to diverse preferences with 3 times less computational resources compared with MORLHF.", "keywords": "large language model;human feedback;multi objective", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Zhanhui Zhou;Jie Liu;Chao Yang;Jing Shao;Yu Liu;Xiangyu Yue;Wanli Ouyang;Yu Qiao", "authorids": "~Zhanhui_Zhou1;~Jie_Liu13;~Chao_Yang3;~Jing_Shao3;~Yu_Liu2;~Xiangyu_Yue1;~Wanli_Ouyang1;~Yu_Qiao1", "gender": "M;;;F;M;M;;", "homepage": "https://zhziszz.github.io/;;;https://amandajshao.github.io/;http://liuyu.us;http://xyue.io/;;", "dblp": ";;;;97/2274-15;207/7518;;", "google_scholar": "SbACfYQAAAAJ;;;VU5ObUwAAAAJ;;-xQ-C1sAAAAJ;;", "orcid": ";;;;;;;", "linkedin": ";;;;;;;", "or_profile": "~Zhanhui_Zhou1;~Jie_Liu13;~Chao_Yang3;~Jing_Shao3;~Yu_Liu2;~Xiangyu_Yue1;~Wanli_Ouyang1;~Yu_Qiao1", "aff": "Shanghai Artificial Intelligence Laboratory;;;Shanghai AI Laboratory;SenseTime;The Chinese University of Hong Kong;;", "aff_domain": "pjlab.org.cn;;;pjlab.org.cn;sensetime.com;ie.cuhk.edu;;", "position": "Researcher;;;Researcher;Principal Researcher;Assistant Professor;;", "bibtex": "@misc{\nzhou2024beyond,\ntitle={Beyond One-Preference-for-All: Multi-Objective Direct Preference Optimization},\nauthor={Zhanhui Zhou and Jie Liu and Chao Yang and Jing Shao and Yu Liu and Xiangyu Yue and Wanli Ouyang and Yu Qiao},\nyear={2024},\nurl={https://openreview.net/forum?id=2BfZMh9td4}\n}", "github": "", "project": "", "reviewers": "nwoD;TGqd;GBhK;c1KT", "site": "https://openreview.net/forum?id=2BfZMh9td4", "pdf_size": 1991679, "rating": "5;5;6;10", "confidence": "3;3;3;4", "soundness": "3;3;3;3", "contribution": "2;2;3;3", "presentation": "3;3;3;3", "wc_summary": "116;53;77;80", "wc_strengths": "49;14;92;70", "wc_weaknesses": "111;57;60;23", "wc_questions": "30;30;108;54", "wc_review": "306;154;337;227", "wc_reply_reviewers": "34;0;0;0", "wc_reply_authors": "1063;755;1146;349", "reply_reviewers": "1;0;0;0", "reply_authors": "4;3;3;2", "rating_avg": [ 6.5, 2.0615528128088303 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 81.5, 22.5 ], "wc_strengths_avg": [ 56.25, 28.74347752099596 ], "wc_weaknesses_avg": [ 62.75, 31.419540098480116 ], "wc_questions_avg": [ 55.5, 31.85514087239295 ], "wc_review_avg": [ 256.0, 71.24956140215882 ], "wc_reply_reviewers_avg": [ 8.5, 14.722431864335457 ], "wc_reply_authors_avg": [ 828.25, 312.697437629412 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 3.0, 0.7071067811865476 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": 0.9801960588196067, "gs_citation": 50, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=7079115486357626350&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 0, "aff_unique_index": "0;1;2;3", "aff_unique_norm": "Shanghai Artificial Intelligence Laboratory;Shanghai AI Laboratory;SenseTime;Chinese University of Hong Kong", "aff_unique_dep": ";;;", "aff_unique_url": "http://www.shailab.org/;https://www.shanghai-ai-lab.com;https://www.sensetime.com;https://www.cuhk.edu.hk", "aff_unique_abbr": "Shanghai AI Lab;SAIL;SenseTime;CUHK", "aff_campus_unique_index": "1", "aff_campus_unique": ";Hong 
Kong SAR", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "China" }, { "id": "2C3CWCPxNS", "title": "Preconditioning for Physics-Informed Neural Networks", "track": "main", "status": "Reject", "tldr": "", "abstract": "Physics-informed neural networks (PINNs) have shown promise in solving complex partial differential equations (PDEs). However, certain training pathologies have emerged, compromising both convergence and prediction accuracy in practical applications. In this paper, we propose to use condition number as an innovative metric to diagnose and rectify the pathologies in PINNs. Inspired by classical numerical analysis, where the condition number measures sensitivity and stability, we highlight its pivotal role in the training dynamics of PINNs. We delineate a theory that elucidates the relationship between reduced condition numbers and improved error control, as well as better convergence. Subsequently, we present an algorithm that leverages preconditioning to enhance the condition number. Evaluations on 16 PDE problems showcase the superior performance of our method. Significantly, in 7 of these problems, our method reduces errors by an order of magnitude. Furthermore, in 2 distinct cases, our approach pioneers a solution, slashing relative errors from roughly $100\\\\%$ to below $6\\\\%$ and $21\\\\%$, respectively.", "keywords": "physics-informed neural network;partial differential equation;condition number;application", "primary_area": "applications to physical sciences (physics, chemistry, biology, etc.)", "supplementary_material": "/attachment/73b0e5d9a8305629c7f2c1026c67620cfaac045c.zip", "author": "Songming Liu;Chang Su;Jiachen Yao;Zhongkai Hao;Hang Su;Youjia Wu;Jun Zhu", "authorids": "~Songming_Liu1;~Chang_Su7;~Jiachen_Yao3;~Zhongkai_Hao1;~Hang_Su3;~Youjia_Wu1;~Jun_Zhu2", "gender": "M;M;M;M;M;M;M", "homepage": ";https://github.com/EdwardIX;https://jiachenyao.com/;;http://ml.cs.tsinghua.edu.cn/~jun;;https://haozhongkai.github.io/", "dblp": "285/4585;;213/4920;;50/2644-1;26/5371-6;270/0220.html", "google_scholar": "6urFg8kAAAAJ;;Z_bCoGcAAAAJ;;axsP38wAAAAJ;dxN1_X0AAAAJ;dfSzq27ZiVoC", "orcid": ";;0000-0001-7655-7831;0000-0002-7399-1306;;;", "linkedin": "%E6%9D%BE%E9%93%AD-%E5%88%98-7b8339254/;;jiachen-y-05a05932a/;;;;", "or_profile": "~Songming_Liu1;~Chang_Su7;~Jiachen_Yao3;~Youjia_Wu1;~Jun_Zhu2;~Hang_Su2;~Hao_Zhongkai1", "aff": "Tsinghua University;Tsinghua University;Tsinghua University;Bosch;Tsinghua University;Tsinghua University;Tsinghua University", "aff_domain": "mails.tsinghua.edu.cn;tsinghua.edu.cn;tsinghua.edu.cn;bosch.com;mail.tsinghua.edu.cn;tsinghua.edu.cn;mails.tsinghua.edu.cn", "position": "PhD student;Undergrad student;Undergrad student;Researcher;Professor;Associate Professor;PhD student", "bibtex": "@misc{\nliu2024preconditioning,\ntitle={Preconditioning for Physics-Informed Neural Networks},\nauthor={Songming Liu and Chang Su and Jiachen Yao and Zhongkai Hao and Hang Su and Youjia Wu and Jun Zhu},\nyear={2024},\nurl={https://openreview.net/forum?id=2C3CWCPxNS}\n}", "github": "", "project": "", "reviewers": "8B8P;zaqP;tNfv;MgQM", "site": "https://openreview.net/forum?id=2C3CWCPxNS", "pdf_size": 0, "rating": "3;5;6;6", "confidence": "3;3;2;3", "soundness": "1;2;3;4", "contribution": "2;2;3;3", "presentation": "2;3;3;3", "wc_summary": "47;81;253;52", "wc_strengths": "7;29;127;103", "wc_weaknesses": "233;111;61;182", "wc_questions": "7;113;49;105", "wc_review": "294;334;490;442", "wc_reply_reviewers": "572;136;0;0", "wc_reply_authors": 
"2272;1435;1805;1504", "reply_reviewers": "2;1;0;0", "reply_authors": "5;4;4;3", "rating_avg": [ 5.0, 1.224744871391589 ], "confidence_avg": [ 2.75, 0.4330127018922193 ], "soundness_avg": [ 2.5, 1.118033988749895 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 108.25, 84.57356265405875 ], "wc_strengths_avg": [ 66.5, 49.84726672546851 ], "wc_weaknesses_avg": [ 146.75, 65.78896184011418 ], "wc_questions_avg": [ 68.5, 43.229041164476456 ], "wc_review_avg": [ 390.0, 79.14543574963751 ], "wc_reply_reviewers_avg": [ 177.0, 234.71472045868788 ], "wc_reply_authors_avg": [ 1754.0, 329.8431445399464 ], "reply_reviewers_avg": [ 0.75, 0.82915619758885 ], "reply_authors_avg": [ 4.0, 0.7071067811865476 ], "replies_avg": [ 25, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.4714045207910316, "gs_citation": 10, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11405597999913649388&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 3, "aff_unique_index": "0;0;0;1;0;0;0", "aff_unique_norm": "Tsinghua University;Robert Bosch GmbH", "aff_unique_dep": ";", "aff_unique_url": "https://www.tsinghua.edu.cn;https://www.bosch.com", "aff_unique_abbr": "THU;Bosch", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;1;0;0;0", "aff_country_unique": "China;Germany" }, { "id": "2CFagKoXXx", "title": "High Dimensional Causal Inference with Variational Backdoor Adjustment", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Backdoor adjustment is a technique in causal inference for estimating interventional quantities from purely observational data. In medical settings, backdoor adjustment can be used to control for confounding and isolate the effectiveness of a treatment. However, high dimensional treatments and confounders pose a series of potential pitfalls: tractability, identifiability, optimization. In this work, we take a generative modeling approach to backdoor adjustment for high dimensional treatments and confounders. We cast backdoor adjustment as an optimization problem in variational inference without reliance on proxy variables and hidden confounders. Empirically, our method is able to estimate interventional likelihood in a variety of high dimensional settings, including semi-synthetic X-ray medical data. 
To the best of our knowledge, this is the first application of backdoor adjustment in which all the relevant variables are high dimensional.", "keywords": "causality;causal inference;backdoor adjustment;variational inference;generative model;high dimensional;intervention;treatment;confounding;identifiable;optimization", "primary_area": "causal reasoning", "supplementary_material": "/attachment/a7680ebe8eb534b7fa9cbdec56728c58588a7278.pdf", "author": "Daniel Mingyi Israel;Aditya Grover;Guy Van den Broeck", "authorids": "~Daniel_Mingyi_Israel1;~Aditya_Grover1;~Guy_Van_den_Broeck1", "gender": "M;M;M", "homepage": "https://danielmisrael.github.io/;https://aditya-grover.github.io;http://web.cs.ucla.edu/~guyvdb/", "dblp": ";162/5052;96/7521.html", "google_scholar": ";oOhnPUgAAAAJ;d0KQ9z0AAAAJ", "orcid": ";;0000-0003-3434-2503", "linkedin": "daniel-israel-248757160;;guyvdb", "or_profile": "~Daniel_Mingyi_Israel1;~Aditya_Grover1;~Guy_Van_den_Broek1", "aff": ";University of California, Los Angeles;University of California, Los Angeles", "aff_domain": ";ucla.edu;ucla.edu", "position": ";Assistant Professor;Associate Professor", "bibtex": "@misc{\nisrael2024high,\ntitle={High Dimensional Causal Inference with Variational Backdoor Adjustment},\nauthor={Daniel Mingyi Israel and Aditya Grover and Guy Van den Broeck},\nyear={2024},\nurl={https://openreview.net/forum?id=2CFagKoXXx}\n}", "github": "", "project": "", "reviewers": "m1yM;wak4;3NGK", "site": "https://openreview.net/forum?id=2CFagKoXXx", "pdf_size": 1381415, "rating": "3;3;5", "confidence": "3;3;3", "soundness": "3;2;3", "contribution": "1;2;2", "presentation": "2;2;3", "wc_summary": "76;65;96", "wc_strengths": "87;81;73", "wc_weaknesses": "440;665;84", "wc_questions": "172;9;4", "wc_review": "775;820;257", "wc_reply_reviewers": "125;294;0", "wc_reply_authors": "604;379;99", "reply_reviewers": "1;1;0", "reply_authors": "2;1;1", "rating_avg": [ 3.6666666666666665, 0.9428090415820634 ], "confidence_avg": [ 3.0, 0.0 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 1.6666666666666667, 0.4714045207910317 ], "presentation_avg": [ 2.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 79.0, 12.832251036613439 ], "wc_strengths_avg": [ 80.33333333333333, 5.734883511361751 ], "wc_weaknesses_avg": [ 396.3333333333333, 239.19355249578857 ], "wc_questions_avg": [ 61.666666666666664, 78.04414705081278 ], "wc_review_avg": [ 617.3333333333334, 255.45558431076734 ], "wc_reply_reviewers_avg": [ 139.66666666666666, 120.47221901980372 ], "wc_reply_authors_avg": [ 360.6666666666667, 206.57255921884257 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 1.3333333333333333, 0.4714045207910317 ], "replies_avg": [ 9, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10661663977020613431&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "aff_unique_index": "0;0", "aff_unique_norm": "University of California, Los Angeles", "aff_unique_dep": "", "aff_unique_url": "https://www.ucla.edu", "aff_unique_abbr": "UCLA", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Los Angeles", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "id": "2CxkRDMIG4", "title": "Precision and Recall Reject Curves for Classification", "track": "main", "status": "Reject", "tldr": "", "abstract": "For some classification scenarios, it is desirable to use only those classification 
instances that a trained model associates with a high certainty. To obtain such high-certainty instances, previous work has proposed accuracy-reject curves. Reject curves allow to evaluate and compare the performance of different certainty measures over a range of thresholds for accepting or rejecting classifications. However, the accuracy may not be the most suited evaluation metric for all applications, and instead precision or recall may be preferable. This is the case, for example, for data with imbalanced class distributions. We therefore propose reject curves that evaluate precision and recall, the recall-reject curve and the precision-reject curve. Using prototype-based classifiers from learning vector quantization, we first validate the proposed curves on artificial benchmark data against the accuracy reject curve as a baseline. We then show on imbalanced benchmarks and medical, real-world data that for these scenarios, the proposed precision- and recall-curves yield more accurate insights into classifier performance than accuracy reject curves.", "keywords": "reject option;precision;recall;evaluating classifiers;transparent machine learning;imbalanced data", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Lydia Fischer;Patricia Wollstadt", "authorids": "~Lydia_Fischer1;~Patricia_Wollstadt1", "gender": ";F", "homepage": ";", "dblp": "https://dblp.uni-trier.de/pid/146/0233.html;", "google_scholar": ";", "orcid": ";0000-0002-7105-5207", "linkedin": ";", "or_profile": "~Lydia_Fischer1;~Patricia_Wollstadt1", "aff": "Honda Research Institute;", "aff_domain": "honda-ri.de;", "position": "Researcher;", "bibtex": "@misc{\nfischer2024precision,\ntitle={Precision and Recall Reject Curves for Classification},\nauthor={Lydia Fischer and Patricia Wollstadt},\nyear={2024},\nurl={https://openreview.net/forum?id=2CxkRDMIG4}\n}", "github": "", "project": "", "reviewers": "EkHi;uffc;zM2w;YWY1", "site": "https://openreview.net/forum?id=2CxkRDMIG4", "pdf_size": 563752, "rating": "1;1;1;3", "confidence": "4;4;4;4", "soundness": "3;1;2;1", "contribution": "1;1;1;1", "presentation": "2;3;3;3", "wc_summary": "36;42;107;29", "wc_strengths": "43;29;36;15", "wc_weaknesses": "99;318;94;77", "wc_questions": "15;1;81;24", "wc_review": "193;390;318;145", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 1.5, 0.8660254037844386 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 1.75, 0.82915619758885 ], "contribution_avg": [ 1.0, 0.0 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 53.5, 31.228992939254383 ], "wc_strengths_avg": [ 30.75, 10.353139620424328 ], "wc_weaknesses_avg": [ 147.0, 99.06311119685269 ], "wc_questions_avg": [ 30.25, 30.425112982534674 ], "wc_review_avg": [ 261.5, 97.42817867537092 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 6, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11613881960874242025&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "aff_unique_index": "0", "aff_unique_norm": "Honda Research Institute", "aff_unique_dep": "", "aff_unique_url": "https://www.honda-ri.com", "aff_unique_abbr": "HRI", "aff_country_unique_index": "0", "aff_country_unique": "Japan" }, { "id": "2DDwxbjP9g", "title": "In Defence 
Of Wasserstein", "track": "main", "status": "Reject", "tldr": "", "abstract": "Since the introduction of Wasserstein GANs, there has been considerable debate whether they should be viewed as minimizing the Wasserstein distance between the training images and the generated images. In particular, several recent works have shown that minimizing this Wasserstein distance leads to blurry images that are of much lower quality than those generated by state-of-the-art WGANs.\nIn this paper we present theoretical and experimental results that suggest that with the appropriate parameter settings, WGANs $\\textbf{do}$ minimize the Wasserstein distance but the form of the distance that is minimized depends highly on the discriminator architecture. We focus on discrete generators for which the Wasserstein distance between the generator distribution and the training distribution can be computed exactly and show that when the discriminator is fully connected, standard WGANs indeed minimize the Wasserstein distance between the generated images and the training images, while when the discriminator is convolutional they minimize the Wasserstein distance between $\\textbf{patches}$ in the generated images and the training images. Our experiments indicate that minimizing the patch Wasserstein metric yields sharp and realistic samples for the same datasets in which minimizing the image Wasserstein distance yields blurry and low quality samples. Our results also suggest alternative methods that directly optimize the patch Wasserstein distance without a discriminator and/or a generator.", "keywords": "GAN;Wasserstein;Optimal transport;Image patches;Generative models", "primary_area": "generative models", "supplementary_material": "/attachment/8c918c3ba9901ec4b0b39a01a73b32fee69dd907.zip", "author": "Ariel Elnekave;Yair Weiss", "authorids": "~Ariel_Elnekave1;~Yair_Weiss1", "gender": "M;M", "homepage": "https://github.com/ariel415el;http://www.cs.huji.ac.il/~yweiss/", "dblp": ";44/1092", "google_scholar": "https://scholar.google.co.il/citations?user=pSVU5zsAAAAJ;https://scholar.google.com.tw/citations?user=9DXQi8gAAAAJ", "orcid": ";", "linkedin": ";", "or_profile": "~Ariel_Elnekave1;~Yair_Weiss1", "aff": "Hebrew University of Jerusalem;Hebrew University of Jerusalem", "aff_domain": "huji.ac.il;huji.ac.il", "position": "PhD student;Full Professor", "bibtex": "@misc{\nelnekave2024in,\ntitle={In Defence Of Wasserstein},\nauthor={Ariel Elnekave and Yair Weiss},\nyear={2024},\nurl={https://openreview.net/forum?id=2DDwxbjP9g}\n}", "github": "", "project": "", "reviewers": "hGFX;L98k;scef;ZrfD", "site": "https://openreview.net/forum?id=2DDwxbjP9g", "pdf_size": 8181526, "rating": "3;3;3;8", "confidence": "4;3;4;3", "soundness": "2;2;2;3", "contribution": "2;2;2;3", "presentation": "2;3;2;4", "wc_summary": "93;110;88;209", "wc_strengths": "62;57;42;91", "wc_weaknesses": "494;485;385;95", "wc_questions": "383;2;56;24", "wc_review": "1032;654;571;419", "wc_reply_reviewers": "345;146;162;0", "wc_reply_authors": "962;777;760;64", "reply_reviewers": "2;1;1;0", "reply_authors": "3;2;1;1", "rating_avg": [ 4.25, 2.165063509461097 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.82915619758885 ], "wc_summary_avg": [ 125.0, 49.178247223747206 ], "wc_strengths_avg": [ 63.0, 17.76231966833161 ], "wc_weaknesses_avg": [ 364.75, 161.50909417119522 ], "wc_questions_avg": [ 116.25, 155.2004751925715 ], "wc_review_avg": [ 669.0, 
225.8860332114405 ], "wc_reply_reviewers_avg": [ 163.25, 122.45688016604049 ], "wc_reply_authors_avg": [ 640.75, 342.2815909452333 ], "reply_reviewers_avg": [ 1.0, 0.7071067811865476 ], "reply_authors_avg": [ 1.75, 0.82915619758885 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:eHs5x8D3dAsJ:scholar.google.com/&scioq=In+Defence+Of+Wasserstein&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "Hebrew University of Jerusalem", "aff_unique_dep": "", "aff_unique_url": "https://www.huji.ac.il", "aff_unique_abbr": "HUJI", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Jerusalem", "aff_country_unique_index": "0;0", "aff_country_unique": "Israel" }, { "id": "2DJMtdfgfH", "title": "Deep ResNIDS: A Multistage AI Framework for Novelty Detection in Network Traffic", "track": "main", "status": "Desk Reject", "tldr": "", "abstract": "Ensuring computer and network system security is crucial in today's digital landscape. Network intrusion detection systems (NIDS) monitor network traffic to identify potential threats. However, traditional NIDS struggle to adapt to evolving cyberattack tactics. To address this, we propose an AI-enabled novelty detection framework to handle zero-day, out-of-distribution, and adversarial evasion attacks. Our framework comprises three sequential deep neural network architectures: one for the classifier and two for specific autoencoders, designed to effectively detect both known attack patterns and novel, previously unseen samples. We use innovative transfer learning, unfreezing specific neurons, and layer combinations to enhance resilience. Leveraging the one-shot learning approach in the transfer learning component of the framework, we demonstrate continuous improvement in detection accuracy for both known and novel network traffic patterns. Our experiments on benchmark intrusion detection data sets achieved, on average, 98.5% accuracy in detecting various attacks.", "keywords": "Multistage network intrusion detection system;novelty detector;anomaly detector;malicious packet classifier;sequential deep neural network architectures", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Soumyadeep Hore;Ankit Shah;Nathaniel D. Bastian;Jalal Ghadermazi", "authorids": "~Soumyadeep_Hore1;~Ankit_Shah4;~Nathaniel_D._Bastian1;~Jalal_Ghadermazi1", "gender": "M;;M;M", "homepage": ";https://ankitshah.co;https://cyber.army.mil/About-Us/ACI-Research-Team/Bastian/;", "dblp": ";;132/5837.html;", "google_scholar": "ZaPw_kUAAAAJ;;M2aMMxQAAAAJ;https://scholar.google.com/citations?view_op=list_works", "orcid": ";;0000-0001-9957-2778;", "linkedin": ";;nathanielbastian/;", "or_profile": "~Soumyadeep_Hore1;~Ankit_Shah4;~Nathaniel_D._Bastian1;~Jalal_Ghadermazi1", "aff": "University of South Florida;;United States Military Academy;", "aff_domain": "usf.edu;;westpoint.edu;", "position": "PhD student;;Principal Researcher;", "bibtex": "@misc{\nhore2024deep,\ntitle={Deep Res{NIDS}: A Multistage {AI} Framework for Novelty Detection in Network Traffic},\nauthor={Soumyadeep Hore and Ankit Shah and Nathaniel D. 
Bastian and Jalal Ghadermazi},\nyear={2024},\nurl={https://openreview.net/forum?id=2DJMtdfgfH}\n}", "github": "", "project": "", "reviewers": "", "site": "https://openreview.net/forum?id=2DJMtdfgfH", "pdf_size": 613704, "rating": "", "confidence": "", "soundness": "", "contribution": "", "presentation": "", "wc_summary": "", "wc_strengths": "", "wc_weaknesses": "", "wc_questions": "", "wc_review": "", "wc_reply_reviewers": "", "wc_reply_authors": "", "reply_reviewers": "", "reply_authors": "", "rating_avg": [ 0, 0 ], "confidence_avg": [ 0, 0 ], "soundness_avg": [ 0, 0 ], "contribution_avg": [ 0, 0 ], "presentation_avg": [ 0, 0 ], "wc_summary_avg": [ 0, 0 ], "wc_strengths_avg": [ 0, 0 ], "wc_weaknesses_avg": [ 0, 0 ], "wc_questions_avg": [ 0, 0 ], "wc_review_avg": [ 0, 0 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 0, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:1H1M_o7xzsUJ:scholar.google.com/&scioq=Deep+ResNIDS:+A+Multistage+AI+Framework+for+Novelty+Detection+in+Network+Traffic&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;1", "aff_unique_norm": "University of South Florida;United States Military Academy", "aff_unique_dep": ";", "aff_unique_url": "https://www.usf.edu;https://www.usma.edu/", "aff_unique_abbr": "USF;USMA", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "id": "2DJUXmHZ2O", "title": "Generalizing Poincar\u00e9 Policy Representations in Multi-agent Reinforcement Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "Learning policy representations is essential for comprehending the intricacies of agent interactions and their decision-making processes.\nRecent studies have found that the evolution of any state under Markov decision processes (MDPs) can be divided into multiple hierarchies based on time sequences. This conceptualization resembles a tree-growing process, where the policy and environment dynamics determine the possible branches. 
In this paper, the multiple agent's trajectory growing paths can be projected into a Poincar\u00e9 ball, which requires the tree to grow from the origin to the boundary of the ball, deriving a new geometric idea of learning Poincar\u00e9 Policy Representations (P2R) for MARL.\nSpecifically, P2R captures the policy representation of the Poincar\u00e9 ball by a hyperbolic neural network and introduces a contrast objective function that encourages embeddings of the same policy to move closer together while embeddings of different policies to move apart, which enables embed policies with low distortion.\nExperimental results provide empirical evidence for the effectiveness of the P2R framework in cooperative and competitive games, demonstrating the potential of Poincar\u00e9 policy representations for optimizing policies in complex multi-agent environments.", "keywords": "policy representation;reinforcement learning;multi-agent", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Bohao Qu;Xiaofeng Cao;Zhen Fang;Qing Guo;Yi Chang", "authorids": "~Bohao_Qu1;~Xiaofeng_Cao2;~Zhen_Fang2;~Qing_Guo3;~Yi_Chang4", "gender": "M;M;M;M;M", "homepage": "https://ieeexplore.ieee.org/author/37088517338;https://fang-zhen.github.io/index.html;https://tsingqguo.github.io;http://www.yichang-cs.com;https://xiaofengcaoml.github.io/", "dblp": "275/7652.html;;25/3038-5;02/5438.html;117/3982-2.html", "google_scholar": "Xr4GORcAAAAJ;OzD6WJcAAAAJ;Rj2x4QUAAAAJ;https://scholar.google.com.hk/citations?user=drEkR50AAAAJ;", "orcid": "0000-0003-3192-8736;0000-0003-0602-6255;0000-0003-0974-9299;0000-0003-2697-8093;", "linkedin": ";;;;", "or_profile": "~Bohao_Qu1;~Zhen_Fang2;~Qing_Guo3;~Yi_Chang4;~Xiaofeng_Cao1", "aff": "Jilin University;University of Technology Sydney; Agency for Science, Technology and Research (A*STAR));Jilin University, China;Jilin University", "aff_domain": "jlu.edu.cn;uts.edu.au;cfar.a-star.edu.sg;jlu.edu.cn;jlu.edu.cn", "position": "PhD student;Assistant Professor;Researcher;Full Professor;Associate Professor", "bibtex": "@misc{\nqu2024generalizing,\ntitle={Generalizing Poincar\\'e Policy Representations in Multi-agent Reinforcement Learning},\nauthor={Bohao Qu and Xiaofeng Cao and Zhen Fang and Qing Guo and Yi Chang},\nyear={2024},\nurl={https://openreview.net/forum?id=2DJUXmHZ2O}\n}", "github": "", "project": "", "reviewers": "VeDg;iHns;MnTe;SaBP", "site": "https://openreview.net/forum?id=2DJUXmHZ2O", "pdf_size": 4202293, "rating": "3;5;5;6", "confidence": "2;2;4;3", "soundness": "2;3;2;3", "contribution": "2;2;2;3", "presentation": "2;3;3;3", "wc_summary": "81;50;94;67", "wc_strengths": "30;40;43;21", "wc_weaknesses": "55;78;195;38", "wc_questions": "502;34;58;19", "wc_review": "668;202;390;145", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.75, 1.0897247358851685 ], "confidence_avg": [ 2.75, 0.82915619758885 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 73.0, 16.355427233796124 ], "wc_strengths_avg": [ 33.5, 8.674675786448736 ], "wc_weaknesses_avg": [ 91.5, 61.41864537744218 ], "wc_questions_avg": [ 153.25, 201.8308388230104 ], "wc_review_avg": [ 351.25, 204.11194844986414 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 6, 0 ], "authors#_avg": [ 5, 0 ], 
"corr_rating_confidence": 0.48420012470625223, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:UIGmecXqHeMJ:scholar.google.com/&scioq=Generalizing+Poincar%C3%A9+Policy+Representations+in+Multi-agent+Reinforcement+Learning&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;1;2;0;0", "aff_unique_norm": "Jilin University;University of Technology Sydney;Agency for Science, Technology and Research", "aff_unique_dep": ";;", "aff_unique_url": "http://www.jlu.edu.cn;https://www.uts.edu.au;https://www.a-star.edu.sg", "aff_unique_abbr": "JLU;UTS;A*STAR", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;2;0;0", "aff_country_unique": "China;Australia;Singapore" }, { "title": "Neural Spectral Methods: Self-supervised learning in the spectral domain", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19557", "id": "2DbVeuoa6a", "author_site": "Yiheng Du, Nithin Chalapathi, Aditi Krishnapriyan", "tldr": "", "abstract": "We present Neural Spectral Methods, a technique to solve parametric Partial Differential Equations (PDEs), grounded in classical spectral methods. Our method uses orthogonal bases to learn PDE solutions as mappings between spectral coefficients, instantiating a spectral-based neural operator. In contrast to current machine learning approaches which enforce PDE constraints by minimizing the numerical quadrature of the residuals in the spatiotemporal domain, we leverage Parseval's identity and introduce a new training strategy through a spectral loss. Our spectral loss enables more efficient differentiation through the neural network, and substantially reduces training complexity. At inference time, the computational cost of our method remains constant, regardless of the spatiotemporal resolution of the domain. Our experimental results demonstrate that our method significantly outperforms previous machine learning approaches in terms of speed and accuracy by one to two orders of magnitude on multiple different problems, including reaction-diffusion, and forced and unforced Navier-Stokes equations. When compared to numerical solvers of the same accuracy, our method demonstrates a $10\\times$ increase in performance speed. Our source code is publicly available at https://github.com/ASK-Berkeley/Neural-Spectral-Methods.", "keywords": "Machine learning for PDEs;spectral methods;neural network differentiation;spectral loss;PDEs;neural operators", "primary_area": "applications to physical sciences (physics, chemistry, biology, etc.)", "supplementary_material": "", "author": "Yiheng Du;Nithin Chalapathi;Aditi S. Krishnapriyan", "authorids": "~Yiheng_Du1;~Nithin_Chalapathi1;~Aditi_S._Krishnapriyan1", "gender": "M;M;", "homepage": "https://github.com/mrlazy1708;https://github.com/nithinvc/;https://a1k12.github.io", "dblp": ";255/5081;256/5472", "google_scholar": ";;7HoFN1wAAAAJ", "orcid": ";;", "linkedin": ";;", "or_profile": "~Yiheng_Du1;~Nithin_Chalapathi1;~Aditi_Krishnapriyan1", "aff": "Peking University;University of California, Berkeley;University of California, Berkeley", "aff_domain": "pku.edu.cn;berkeley.edu;berkeley.edu", "position": "Undergrad student;PhD student;Assistant Professor", "bibtex": "@inproceedings{\ndu2024neural,\ntitle={Neural Spectral Methods: Self-supervised learning in the spectral domain},\nauthor={Yiheng Du and Nithin Chalapathi and Aditi S. 
Krishnapriyan},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=2DbVeuoa6a}\n}", "github": "", "project": "", "reviewers": "KbDK;4uLV;dP1d;9377", "pdf_size": 2056367, "rating": "3;8;8;8", "confidence": "4;4;4;4", "soundness": "3;2;3;3", "contribution": "2;3;3;3", "presentation": "3;3;3;3", "wc_summary": "97;69;66;109", "wc_strengths": "82;48;148;67", "wc_weaknesses": "330;104;43;42", "wc_questions": "189;215;228;71", "wc_review": "698;436;485;289", "wc_reply_reviewers": "359;20;13;197", "wc_reply_authors": "1788;559;739;703", "reply_reviewers": "1;1;1;2", "reply_authors": "3;2;2;3", "rating_avg": [ 6.75, 2.165063509461097 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 85.25, 18.280795934531955 ], "wc_strengths_avg": [ 86.25, 37.632266740126084 ], "wc_weaknesses_avg": [ 129.75, 118.30971008332325 ], "wc_questions_avg": [ 175.75, 62.086129690938215 ], "wc_review_avg": [ 477.0, 146.56909633343585 ], "wc_reply_reviewers_avg": [ 147.25, 142.76619873065192 ], "wc_reply_authors_avg": [ 947.25, 490.0573308297714 ], "reply_reviewers_avg": [ 1.25, 0.4330127018922193 ], "reply_authors_avg": [ 2.5, 0.5 ], "replies_avg": [ 22, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 11, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12743670651235522506&as_sdt=5,30&sciodt=0,30&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=2DbVeuoa6a", "pdf": "https://openreview.net/pdf?id=2DbVeuoa6a", "email": "pku.edu.cn;berkeley.edu;berkeley.edu", "author_num": 3, "aff_unique_index": "0;1;1", "aff_unique_norm": "Peking University;University of California, Berkeley", "aff_unique_dep": ";", "aff_unique_url": "http://www.pku.edu.cn;https://www.berkeley.edu", "aff_unique_abbr": "Peking U;UC Berkeley", "aff_campus_unique_index": "1;1", "aff_campus_unique": ";Berkeley", "aff_country_unique_index": "0;1;1", "aff_country_unique": "China;United States" }, { "id": "2DldCIjAdX", "title": "LayerNAS: Neural Architecture Search in Polynomial Complexity", "track": "main", "status": "Reject", "tldr": "", "abstract": "Neural Architecture Search (NAS) has become a popular method for discovering effective model architectures, especially for target hardware. As such, NAS methods that find optimal architectures under constraints are essential. In our paper, we propose LayerNAS to address the challenge of multi-objective NAS by transforming it into a combinatorial optimization problem, which effectively constrains the search complexity to be polynomial. LayerNAS rigorously derives its method from the fundamental assumption that modifications to previous layers have no impact on the subsequent layers. When dealing with search spaces containing $L$ layers that meet this requirement, the method performs layerwise-search for each layer, selecting from a set of search options $\\mathbb{S}$. LayerNAS groups model candidates based on one objective, such as model size or latency, and searches for the optimal model based on another objective, thereby splitting the cost and reward elements of the search. This approach limits the search complexity to $ O(H \\cdot |\\mathbb{S}| \\cdot L) $, where $H$ is a constant set in LayerNAS. 
Our experiments show that LayerNAS is able to consistently discover superior models across a variety of search spaces in comparison to strong baselines, including search spaces derived from NATS-Bench, MobileNetV2 and MobileNetV3.", "keywords": "AutoML;Neural Architecture Search;Model Optimization", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/33d4417722fdee95d0620788259a596dca14567e.zip", "author": "Yicheng Fan;Dana Alon;JINGYUE SHEN;Daiyi Peng;Keshav Kumar;Xinyu Feng;Yun Long;Xin Wang;Fotis Iliopoulos;Da-Cheng Juan;Erik Vee", "authorids": "~Yicheng_Fan1;~Dana_Alon1;~JINGYUE_SHEN1;~Daiyi_Peng1;~Keshav_Kumar1;~Xinyu_Feng3;~Yun_Long1;~Xin_Wang30;~Fotis_Iliopoulos1;~Da-Cheng_Juan1;~Erik_Vee1", "gender": ";;;M;M;;M;M;M;;", "homepage": ";;https://www.linkedin.com/in/jingyue-brian-shen/;http://www.daiyip.org;https://keshv.in;;https://scholar.google.com/citations?user=DNHsO0gAAAAJ&hl=en&oi=sra;;http://www.filiop.org/;;", "dblp": "289/0992;136/8637;229/7228;;;;;;147/4790;47/1564;", "google_scholar": "LTZjlnwAAAAJ;0WEF4fkAAAAJ;wWAFw8UAAAAJ;_8Egwg8AAAAJ;;;DNHsO0gAAAAJ;7BjA8ccAAAAJ;v3e5F-AAAAAJ;https://scholar.google.com/citations?hl=en;", "orcid": ";;;;;;;;;;", "linkedin": "https://linkedin.com/in/yicheng-fan-b4b79124;dana-alon;;;keshav-kr;;;;;;", "or_profile": "~Yicheng_Fan1;~Dana_Alon1;~JINGYUE_SHEN1;~Daiyi_Peng1;~Keshav_Kumar1;~Xinyu_Feng3;~Yun_Long1;~Xin_Wang30;~Fotis_Iliopoulos1;~Da-Cheng_Juan1;~Erik_Vee1", "aff": "Google;Research, Google;Google;;;;;Google;Google;Google Research;", "aff_domain": "google.com;research.google.com;google.com;;;;;google.com;google.com;google.com;", "position": "Software Engineer;Researcher;Software Engineer;;;;;Software Engineer;Researcher;Senior Software Engineer;", "bibtex": "@misc{\nfan2024layernas,\ntitle={Layer{NAS}: Neural Architecture Search in Polynomial Complexity},\nauthor={Yicheng Fan and Dana Alon and JINGYUE SHEN and Daiyi Peng and Keshav Kumar and Xinyu Feng and Yun Long and Xin Wang and Fotis Iliopoulos and Da-Cheng Juan and Erik Vee},\nyear={2024},\nurl={https://openreview.net/forum?id=2DldCIjAdX}\n}", "github": "", "project": "", "reviewers": "4co7;sD5g;nAfG;xmki", "site": "https://openreview.net/forum?id=2DldCIjAdX", "pdf_size": 3857560, "rating": "5;5;5;8", "confidence": "5;3;4;4", "soundness": "2;2;2;4", "contribution": "2;2;2;3", "presentation": "2;2;2;3", "wc_summary": "99;17;24;50", "wc_strengths": "78;28;22;77", "wc_weaknesses": "233;350;144;16", "wc_questions": "47;35;25;1", "wc_review": "457;430;215;144", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "1213;1234;1310;10", "reply_reviewers": "0;0;0;0", "reply_authors": "2;2;2;1", "rating_avg": [ 5.75, 1.299038105676658 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.5, 0.8660254037844386 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 47.5, 32.17530108639234 ], "wc_strengths_avg": [ 51.25, 26.337947907914163 ], "wc_weaknesses_avg": [ 185.75, 122.23824074323059 ], "wc_questions_avg": [ 27.0, 16.911534525287763 ], "wc_review_avg": [ 311.5, 134.70430579606577 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 941.75, 539.1550681390281 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.75, 0.4330127018922193 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 11, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 6, "gs_cited_by_link": 
"https://scholar.google.com/scholar?cites=14910580986110710568&as_sdt=5,47&sciodt=0,47&hl=en", "gs_version_total": 4, "aff_unique_index": "0;0;0;0;0;0", "aff_unique_norm": "Google", "aff_unique_dep": "Google", "aff_unique_url": "https://www.google.com", "aff_unique_abbr": "Google", "aff_campus_unique_index": "0;0;0;0;0;0", "aff_campus_unique": "Mountain View", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "2EamGPuWSc", "title": "A Shot-Efficient Differential Equation Integrator using Quantum Neural Networks", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Physics-informed regularisation on quantum neural networks provides a promising means for solving differential equations on near-term quantum computers.\nHowever, most demonstrations of this technique assume idealised simulated quantum circuits where the respective expectations are available.\nIn real quantum hardware, such ideal expectations are not accessible and must be averaged over many shots, introducing additional computations, the cost of which has not been considered in the majority of the preceding studies.\nThe requirements of higher-order derivatives for physics-informed regularisers are especially high in terms of circuit repetitions (shots) compared to lower-order derivatives required for supervised learning.\nWe demonstrate how to construct a global formulation of physics-informed losses especially amenable to solve ordinary differential equations on near-term quantum computers in a shot-efficient manner.\nThe resulting approach can reduce the order of derivatives required to calculate a loss compared to Physics-informed Neural Networks (PINNs). \nIn the case of initial value problems in ordinary differential equations (ODEs) and some partial differential equations (PDEs), our method removes completely the need for higher-order automatic differentiation,\nthus providing an $\\mathcal{O}(N)$ improvement in shot-efficiency, where $N$ is the number of data-encodings of the quantum neural network.\nOur formulation naturally incorporates boundary conditions and physics-informed losses into a single optimisation term.\nNumerical experiments demonstrate favourable empirical performance, in terms of both shot-efficiency and error, on (simulated) quantum circuits compared to existing quantum methodologies.\nWe demonstrate that the relative performance of quantum neural network algorithms in the infinite shot limit does not necessarily correspond to relative performance in the finite shot limit.\nWe hope this works provides insights on how to efficiently design schemes that will reduce the shot requirements and will become the basis for further developing efficient quantum algorithms for the solution of differential equations.", "keywords": "Variational Quantum Algorithms;Physics-Informed Machine Learning;Quantum Computing", "primary_area": "neurosymbolic & hybrid AI systems (physics-informed, logic & formal reasoning, etc.)", "supplementary_material": "", "author": "Atiyo Ghosh;Gergana V. 
Velikova;Panagiotis Barkoutsos;Vincent Emanuel Elfving", "authorids": "~Atiyo_Ghosh1;~Gergana_V._Velikova1;~Panagiotis_Barkoutsos1;~Vincent_Emanuel_Elfving1", "gender": ";F;M;", "homepage": ";;https://pasqal.com;", "dblp": ";;183/4846;", "google_scholar": "https://scholar.google.co.uk/citations?user=MTGN-gwAAAAJ;txNXEWEAAAAJ;SVcvKVYAAAAJ;", "orcid": "0000-0003-1606-8520;0000-0001-5910-8604;0000-0001-9428-913X;", "linkedin": "atiyo-ghosh-211255b5/;;pbarkoutsos/;", "or_profile": "~Atiyo_Ghosh1;~Gergana_V._Velikova1;~Panagiotis_Barkoutsos1;~Vincent_Emanuel_Elfving1", "aff": "Pasqal;PASQAL;PASQAL SAS;", "aff_domain": "pasqal.com;pasqal.com;pasqal.com;", "position": "Researcher;Researcher;VP Quantum Algorithms;", "bibtex": "@misc{\nghosh2024a,\ntitle={A Shot-Efficient Differential Equation Integrator using Quantum Neural Networks},\nauthor={Atiyo Ghosh and Gergana V. Velikova and Panagiotis Barkoutsos and Vincent Emanuel Elfving},\nyear={2024},\nurl={https://openreview.net/forum?id=2EamGPuWSc}\n}", "github": "", "project": "", "reviewers": "Nx77;bf4n;k8bX;1rNZ", "site": "https://openreview.net/forum?id=2EamGPuWSc", "pdf_size": 4362113, "rating": "3;3;3;5", "confidence": "3;4;4;3", "soundness": "2;2;3;3", "contribution": "2;2;2;2", "presentation": "2;2;2;2", "wc_summary": "53;52;208;86", "wc_strengths": "78;30;109;60", "wc_weaknesses": "167;197;242;194", "wc_questions": "4;35;145;3", "wc_review": "302;314;704;343", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 3.5, 0.8660254037844386 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.0, 0.0 ], "wc_summary_avg": [ 99.75, 63.978023570598054 ], "wc_strengths_avg": [ 69.25, 28.647643882176418 ], "wc_weaknesses_avg": [ 200.0, 26.91653766738954 ], "wc_questions_avg": [ 46.75, 58.16517428840044 ], "wc_review_avg": [ 415.75, 167.08736487239244 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:xM1WQPST50IJ:scholar.google.com/&scioq=A+Shot-Efficient+Differential+Equation+Integrator+using+Quantum+Neural+Networks&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;1", "aff_unique_norm": "Pasqal;PASQAL SAS", "aff_unique_dep": ";", "aff_unique_url": "https://www.pasqal.com;", "aff_unique_abbr": ";", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "France" }, { "id": "2Ed7b52z53", "title": "On the Matrix Form of the Quaternion Fourier Transform and Quaternion Convolution", "track": "main", "status": "Reject", "tldr": "", "abstract": "We study matrix forms of quaternionic versions of the Fourier Transform and Convolution operations. Quaternions offer a powerful representation unit, however they are related to difficulties in their use that stem foremost from non-commutativity of quaternion multiplication, \nand due to that $\\mu^2 = -1$ posseses infinite solutions in the quaternion domain. Handling of quaternionic matrices is consequently complicated in several aspects (definition of eigenstructure, determinant, etc.). 
Our research findings clarify the relation of the Quaternion Fourier Transform matrix to the standard (complex) Discrete Fourier Transform matrix, and the extent to which well-known complex-domain theorems extend to quaternions. We focus especially on the relation of Quaternion Fourier Transform matrices to Quaternion Circulant matrices (representing quaternionic convolution), and the eigenstructure of the latter. A proof-of-concept application that makes direct use of our theoretical results is presented, where we present a method to bound the Lipschitz constant of a Quaternionic Convolutional Neural Network.", "keywords": "Quaternions;Fourier Transform;Convolution;Circulant Matrix", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Giorgos Sfikas;George Retsinas", "authorids": "~Giorgos_Sfikas1;~George_Retsinas2", "gender": "M;M", "homepage": "http://www.cs.uoi.gr/~sfikas;http://users.iit.demokritos.gr/~georgeretsi/", "dblp": "01/747;171/5669", "google_scholar": "X73G9lYAAAAJ;https://scholar.google.gr/", "orcid": "0000-0002-7305-2886;", "linkedin": "giorgos-sfikas-15a30484/;george-retsinas-9b073b88/", "or_profile": "~Giorgos_Sfikas1;~George_Retsinas2", "aff": "University of West Attica;National Technical University of Athens", "aff_domain": "uniwa.gr;ntua.gr", "position": "Assistant Professor;Postdoc", "bibtex": "@misc{\nsfikas2024on,\ntitle={On the Matrix Form of the Quaternion Fourier Transform and Quaternion Convolution},\nauthor={Giorgos Sfikas and George Retsinas},\nyear={2024},\nurl={https://openreview.net/forum?id=2Ed7b52z53}\n}", "github": "", "project": "", "reviewers": "ZfTZ;JYL4;YJPK", "site": "https://openreview.net/forum?id=2Ed7b52z53", "pdf_size": 1346330, "rating": "1;5;5", "confidence": "4;3;3", "soundness": "1;4;3", "contribution": "1;1;2", "presentation": "1;3;3", "wc_summary": "44;67;60", "wc_strengths": "15;69;64", "wc_weaknesses": "318;163;215", "wc_questions": "1;143;6", "wc_review": "378;442;345", "wc_reply_reviewers": "41;0;0", "wc_reply_authors": "350;2785;1858", "reply_reviewers": "1;0;0", "reply_authors": "3;7;5", "rating_avg": [ 3.6666666666666665, 1.8856180831641267 ], "confidence_avg": [ 3.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 1.247219128924647 ], "contribution_avg": [ 1.3333333333333333, 0.4714045207910317 ], "presentation_avg": [ 2.3333333333333335, 0.9428090415820634 ], "wc_summary_avg": [ 57.0, 9.626352718795768 ], "wc_strengths_avg": [ 49.333333333333336, 24.36299561949547 ], "wc_weaknesses_avg": [ 232.0, 64.41014412859722 ], "wc_questions_avg": [ 50.0, 65.79260343432738 ], "wc_review_avg": [ 388.3333333333333, 40.2685430026411 ], "wc_reply_reviewers_avg": [ 13.666666666666666, 19.3275853524323 ], "wc_reply_authors_avg": [ 1664.3333333333333, 1003.4727477891742 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 5.0, 1.632993161855452 ], "replies_avg": [ 25, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.9999999999999997, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:OH0SXWewsXYJ:scholar.google.com/&scioq=On+the+Matrix+Form+of+the+Quaternion+Fourier+Transform+and+Quaternion+Convolution&hl=en&as_sdt=0,5", "gs_version_total": 4, "aff_unique_index": "0;1", "aff_unique_norm": "University of West Attica;National Technical University of Athens", "aff_unique_dep": ";", "aff_unique_url": "https://www.uoa.gr;https://www.ntua.gr", 
"aff_unique_abbr": ";NTUA", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "Greece" }, { "id": "2FAPahXyVh", "title": "OptiMUS: Optimization Modeling Using mip Solvers and large language models", "track": "main", "status": "Reject", "tldr": "", "abstract": "Optimization problems are pervasive across various sectors, from manufacturing and distribution to healthcare. However, most such problems are still solved heuristically by hand rather than optimally by state-of-the-art solvers, as the expertise required to formulate and solve these problems limits the widespread adoption of optimization tools and techniques. We introduce OptiMUS, a Large Language Model (LLM)-based agent designed to formulate and solve MLIP problems from their natural language descriptions. OptiMUS is capable of developing mathematical models, writing and debugging solver code, developing tests, and checking the validity of generated solutions. To benchmark our agent, we present NLP4LP, a novel dataset of linear programming (LP) and mixed integer linear programming (MILP) problems. Our experiments demonstrate that OptiMUS is able to solve 67\\% more problems compared to a basic LLM prompting strategy. The code OptiMUS and the data for NLP4LP are available at \\href{https://anonymous.4open.science/r/nlp4lp-8F62/README.md}{https://anonymous.4open.science/r/nlp4lp-8F62/README.md}", "keywords": "LLM;AI;Optimization modeling;optimization solvers;mathematical formulation;autonomous agents", "primary_area": "applications to robotics, autonomy, planning", "supplementary_material": "/attachment/30597840440b73aabdda6a4c833ef8b7673c6530.pdf", "author": "Ali AhmadiTeshnizi;Wenzhi Gao;Madeleine Udell", "authorids": "~Ali_AhmadiTeshnizi1;~Wenzhi_Gao1;~Madeleine_Udell1", "gender": ";M;F", "homepage": "https://teshnizi.github.io/;https://github.com/Gwzwpxz;https://people.orie.cornell.edu/mru8", "dblp": ";;153/2166", "google_scholar": "475ARYgAAAAJ;4lDkX_YAAAAJ;tZ9pEDMAAAAJ", "orcid": ";;0000-0002-3985-915X", "linkedin": "teshnizi/;;", "or_profile": "~Ali_AhmadiTeshnizi1;~Wenzhi_Gao1;~Madeleine_Udell1", "aff": "Stanford University;Stanford University;Stanford University", "aff_domain": "stanford.edu;stanford.edu;stanford.edu", "position": "PhD student;PhD student;Assistant Professor", "bibtex": "@misc{\nahmaditeshnizi2024optimus,\ntitle={Opti{MUS}: Optimization Modeling Using mip Solvers and large language models},\nauthor={Ali AhmadiTeshnizi and Wenzhi Gao and Madeleine Udell},\nyear={2024},\nurl={https://openreview.net/forum?id=2FAPahXyVh}\n}", "github": "", "project": "", "reviewers": "8JDZ;GUNL;QHcC;Bafe", "site": "https://openreview.net/forum?id=2FAPahXyVh", "pdf_size": 1434421, "rating": "3;5;5;6", "confidence": "4;3;3;3", "soundness": "1;2;2;3", "contribution": "2;3;3;3", "presentation": "1;2;3;3", "wc_summary": "255;58;36;30", "wc_strengths": "47;61;35;14", "wc_weaknesses": "177;131;26;83", "wc_questions": "58;343;181;12", "wc_review": "537;593;278;139", "wc_reply_reviewers": "367;0;80;119", "wc_reply_authors": "992;624;337;887", "reply_reviewers": "3;0;1;3", "reply_authors": "4;1;2;4", "rating_avg": [ 4.75, 1.0897247358851685 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 2.0, 0.7071067811865476 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 2.25, 0.82915619758885 ], "wc_summary_avg": [ 94.75, 93.10578660856693 ], "wc_strengths_avg": [ 39.25, 17.239127008059313 ], "wc_weaknesses_avg": [ 104.25, 56.08642883978262 
], "wc_questions_avg": [ 148.5, 128.16883396520387 ], "wc_review_avg": [ 386.75, 185.95748842141313 ], "wc_reply_reviewers_avg": [ 141.5, 137.07753280534342 ], "wc_reply_authors_avg": [ 710.0, 253.66217692040726 ], "reply_reviewers_avg": [ 1.75, 1.299038105676658 ], "reply_authors_avg": [ 2.75, 1.299038105676658 ], "replies_avg": [ 25, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.9271726499455306, "gs_citation": 37, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=15204204105868547127&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "aff_unique_index": "0;0;0", "aff_unique_norm": "Stanford University", "aff_unique_dep": "", "aff_unique_url": "https://www.stanford.edu", "aff_unique_abbr": "Stanford", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Stanford", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "2GJm8yT2jN", "title": "URLOST: Unsupervised Representation Learning without Stationarity or Topology", "track": "main", "status": "Reject", "tldr": "", "abstract": "Unsupervised representation learning has seen tremendous progress but is constrained by its reliance on data modality specific stationarity and topology, a limitation not found in biological intelligence systems. For instance, human vision processes visual signals derived from irregular and non-stationary sampling lattices yet accurately perceives the geometry of the world. We introduce a novel framework that learns from high-dimensional data lacking stationarity and topology. Our model combines spectral clustering, and masked autoencoders and a learnable self-organizing layer. We evaluate its effectiveness on simulated biological vision data, neural recordings from the primary visual cortex, and gene expression datasets. Compared to state-of-the-art unsupervised learning methods like SimCLR and MAE, our model excels at learning meaningful representations across diverse modalities without depending on stationarity or topology. It also outperforms other methods not dependent on these factors, setting a new benchmark in the field. 
This work represents a step toward unsupervised learning methods that can generalize across diverse high dimensional data modalities.", "keywords": "Unsupervised learning;Self-supervised learning;Deep learning", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Zeyu Yun;Juexiao Zhang;Bruno Olshausen;Yann LeCun;Yubei Chen", "authorids": "~Zeyu_Yun1;~Juexiao_Zhang1;~Bruno_Olshausen1;~Yann_LeCun1;~Yubei_Chen1", "gender": "M;M;M;M;M", "homepage": "https://zeyuyun1.github.io/;https://juexzz.github.io/;http://redwood.berkeley.edu/bruno/;http://yann.lecun.com;https://redwood.berkeley.edu/people/yubei-chen/", "dblp": "289/2186;250/9589;30/3869;l/YannLeCun;30/10064", "google_scholar": ";TYxPbcEAAAAJ;4aqK_74AAAAJ;WLN3QrAAAAAJ;WeyLqFUAAAAJ", "orcid": ";;;;", "linkedin": ";juexiao-zhang-788453146/Juexiao-Zhang;;;yubei-chen-05998a39/", "or_profile": "~Zeyu_Yun1;~Juexiao_Zhang1;~Bruno_Olshausen1;~Yann_LeCun1;~Yubei_Chen1", "aff": "University of California, Berkeley;New York University;UC Berkeley;New York University;University of California, Davis", "aff_domain": "berkeley.edu;nyu.edu;;nyu.edu;ucdavis.edu", "position": "MS student;PhD student;Full Professor;Full Professor;Assistant Professor", "bibtex": "@misc{\nyun2024urlost,\ntitle={{URLOST}: Unsupervised Representation Learning without Stationarity or Topology},\nauthor={Zeyu Yun and Juexiao Zhang and Bruno Olshausen and Yann LeCun and Yubei Chen},\nyear={2024},\nurl={https://openreview.net/forum?id=2GJm8yT2jN}\n}", "github": "", "project": "", "reviewers": "JGWe;qyGv;EzDe", "site": "https://openreview.net/forum?id=2GJm8yT2jN", "pdf_size": 7983547, "rating": "5;6;6", "confidence": "1;3;4", "soundness": "2;2;3", "contribution": "2;2;3", "presentation": "2;4;3", "wc_summary": "28;95;43", "wc_strengths": "30;111;66", "wc_weaknesses": "96;126;163", "wc_questions": "2;5;42", "wc_review": "156;337;314", "wc_reply_reviewers": "0;31;0", "wc_reply_authors": "1255;1208;1614", "reply_reviewers": "0;1;0", "reply_authors": "3;2;4", "rating_avg": [ 5.666666666666667, 0.4714045207910317 ], "confidence_avg": [ 2.6666666666666665, 1.247219128924647 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 3.0, 0.816496580927726 ], "wc_summary_avg": [ 55.333333333333336, 28.709270666845967 ], "wc_strengths_avg": [ 69.0, 33.13608305156178 ], "wc_weaknesses_avg": [ 128.33333333333334, 27.402351886086148 ], "wc_questions_avg": [ 16.333333333333332, 18.190351532856337 ], "wc_review_avg": [ 269.0, 80.45288476286396 ], "wc_reply_reviewers_avg": [ 10.333333333333334, 14.613540144521982 ], "wc_reply_authors_avg": [ 1359.0, 181.33026958196103 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 3.0, 0.816496580927726 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.9449111825230683, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5809278398021347415&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 5, "aff_unique_index": "0;1;0;1;2", "aff_unique_norm": "University of California, Berkeley;New York University;University of California, Davis", "aff_unique_dep": ";;", "aff_unique_url": "https://www.berkeley.edu;https://www.nyu.edu;https://www.ucdavis.edu", "aff_unique_abbr": "UC Berkeley;NYU;UC Davis", "aff_campus_unique_index": "0;0;2", "aff_campus_unique": "Berkeley;;Davis", 
"aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "2GMTfqr7eb", "title": "Retro: Reusing teacher projection head for efficient embedding distillation on Lightweight Models via Self-supervised Learning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Self-supervised learning (SSL) is gaining attention for its ability to learn effective representations with large amounts of unlabeled data. Lightweight models can be distilled from larger self-supervised pre-trained models using contrastive and consistency constraints, but the different sizes of the projection heads make it challenging for students to accurately mimic the teacher's embedding. We propose \\textsc{Retro}, which reuses the teacher's projection head for students, and our experimental results demonstrate significant improvements over the state-of-the-art on all lightweight models. For instance, when training EfficientNet-B0 using ResNet-50/101/152 as teachers, our approach improves the linear result on ImageNet to $66.9%$, $69.3%$, and $69.8%$, respectively, with significantly fewer parameters.", "keywords": "Self-supervised learning;knowledge distillation;lightweight models;contrastive learning;consistency learning", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/df05b343cde141bc250174f0cd4bd513db9ad5b9.pdf", "author": "Khanh-Binh Nguyen", "authorids": "~Khanh-Binh_Nguyen1", "gender": "M", "homepage": "", "dblp": "325/4115", "google_scholar": "LoOglv4AAAAJ", "orcid": "0000-0002-9948-1400", "linkedin": "", "or_profile": "~Khanh-Binh_Nguyen1", "aff": "National Cancer Center", "aff_domain": "ncc.re.kr", "position": "Researcher", "bibtex": "@misc{\nnguyen2024retro,\ntitle={Retro: Reusing teacher projection head for efficient embedding distillation on Lightweight Models via Self-supervised Learning},\nauthor={Khanh-Binh Nguyen},\nyear={2024},\nurl={https://openreview.net/forum?id=2GMTfqr7eb}\n}", "github": "", "project": "", "reviewers": "dnj5;96a3;qqvw", "site": "https://openreview.net/forum?id=2GMTfqr7eb", "pdf_size": 472968, "rating": "3;5;5", "confidence": "5;4;4", "soundness": "3;2;3", "contribution": "2;2;2", "presentation": "2;3;3", "wc_summary": "55;53;51", "wc_strengths": "27;80;35", "wc_weaknesses": "124;208;131", "wc_questions": "1;31;43", "wc_review": "207;372;260", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 4.333333333333333, 0.9428090415820634 ], "confidence_avg": [ 4.333333333333333, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 53.0, 1.632993161855452 ], "wc_strengths_avg": [ 47.333333333333336, 23.328570942563587 ], "wc_weaknesses_avg": [ 154.33333333333334, 38.055515004033545 ], "wc_questions_avg": [ 25.0, 17.663521732655695 ], "wc_review_avg": [ 279.6666666666667, 68.78145744958367 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 3, 0 ], "authors#_avg": [ 1, 0 ], "corr_rating_confidence": -0.9999999999999997, "gs_citation": 0, "gs_cited_by_link": 
"https://scholar.google.com/scholar?q=related:tz9qD1zgPBkJ:scholar.google.com/&scioq=Retro:+Reusing+teacher+projection+head+for+efficient+embedding+distillation+on+Lightweight+Models+via+Self-supervised+Learning&hl=en&as_sdt=0,23", "gs_version_total": 4, "aff_unique_index": "0", "aff_unique_norm": "National Cancer Center", "aff_unique_dep": "", "aff_unique_url": "https://www.ncc.re.kr", "aff_unique_abbr": "NCC", "aff_country_unique_index": "0", "aff_country_unique": "South Korea" }, { "title": "What does the Knowledge Neuron Thesis Have to do with Knowledge?", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19556", "id": "2HJRwwbV3G", "author_site": "Jingcheng Niu, Andrew Liu, Zining Zhu, Gerald Penn", "tldr": "", "abstract": "We reassess the Knowledge Neuron (KN) Thesis: an interpretation of the mechanism underlying the ability of large language models to recall facts from a training corpus. This nascent thesis proposes that facts are recalled from the training corpus through the MLP weights in a manner resembling key-value memory, implying in effect that \"knowledge\" is stored in the network. Furthermore, by modifying the MLP modules, one can control the language model's generation of factual information. The plausibility of the KN thesis has been demonstrated by the success of KN-inspired model editing methods (Dai et al., 2022; Meng et al., 2022).\n\nWe find that this thesis is, at best, an oversimplification. Not only have we found that we can edit the expression of certain linguistic phenomena using the same model editing methods but, through a more comprehensive evaluation, we have found that the KN thesis does not adequately explain the process of factual expression. While it is possible to argue that the MLP weights store complex patterns that are interpretable both syntactically and semantically, these patterns do not constitute \"knowledge.\" To gain a more comprehensive understanding of the knowledge representation process, we must look beyond the MLP weights and explore recent models' complex layer structures and attention mechanisms.", "keywords": "language model;knowledge neuron;model editing;formal and function competence;syntax;fact", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Jingcheng Niu;Andrew Liu;Zining Zhu;Gerald Penn", "authorids": "~Jingcheng_Niu1;~Andrew_Liu6;~Zining_Zhu1;~Gerald_Penn1", "gender": "M;M;;M", "homepage": "http://www.cs.toronto.edu/~niu/;https://www.cs.toronto.edu/~aliu/;http://ziningzhu.github.io;http://www.cs.toronto.edu/~gpenn/", "dblp": "245/8596.html;;188/5709;37/1531", "google_scholar": "XQuH0EEAAAAJ;;https://scholar.google.ca/citations?user=Xr_hCJMAAAAJ;ZnKtf4YAAAAJ", "orcid": ";;;0000-0003-3553-8305", "linkedin": ";andrew-liu438/;zining-zhu/;gerald-penn-1391bb3/", "or_profile": "~Jingcheng_Niu1;~Andrew_Liu6;~Zining_Zhu1;~Gerald_Penn1", "aff": "University of Toronto;University of Waterloo;University of Toronto;Department of Computer Science, University of Toronto", "aff_domain": "cs.toronto.edu;uwaterloo.ca;toronto.edu;cs.toronto.edu", "position": "PhD student;Undergrad student;PhD student;Full Professor", "bibtex": "@inproceedings{\nniu2024what,\ntitle={What does the Knowledge Neuron Thesis Have to do with Knowledge?},\nauthor={Jingcheng Niu and Andrew Liu and Zining Zhu and Gerald Penn},\nbooktitle={The Twelfth International Conference on Learning 
Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=2HJRwwbV3G}\n}", "github": "", "project": "", "reviewers": "ZPK4;7T91;c8FP", "pdf_size": 1172918, "rating": "6;8;8", "confidence": "3;3;4", "soundness": "3;4;3", "contribution": "2;4;4", "presentation": "3;2;3", "wc_summary": "114;138;46", "wc_strengths": "81;81;42", "wc_weaknesses": "179;100;23", "wc_questions": "321;141;1", "wc_review": "695;460;112", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "792;248;33", "reply_reviewers": "0;0;0", "reply_authors": "1;1;1", "rating_avg": [ 7.333333333333333, 0.9428090415820634 ], "confidence_avg": [ 3.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 3.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 3.3333333333333335, 0.9428090415820634 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 99.33333333333333, 38.96437118987322 ], "wc_strengths_avg": [ 68.0, 18.384776310850235 ], "wc_weaknesses_avg": [ 100.66666666666667, 63.68847793928053 ], "wc_questions_avg": [ 154.33333333333334, 130.97921802925666 ], "wc_review_avg": [ 422.3333333333333, 239.49437478896152 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 357.6666666666667, 319.4164818679351 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 8, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.49999999999999983, "gs_citation": 23, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5330732570030088119&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=2HJRwwbV3G", "pdf": "https://openreview.net/pdf?id=2HJRwwbV3G", "email": "cs.toronto.edu;uwaterloo.ca;toronto.edu;cs.toronto.edu", "author_num": 4, "aff_unique_index": "0;1;0;0", "aff_unique_norm": "University of Toronto;University of Waterloo", "aff_unique_dep": ";", "aff_unique_url": "https://www.utoronto.ca;https://uwaterloo.ca", "aff_unique_abbr": "U of T;UW", "aff_campus_unique_index": "1", "aff_campus_unique": ";Toronto", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "Canada" }, { "id": "2J25Vi9W8I", "title": "RegCLIP: A Label-Efficient Coarse-to-Fine Learner for Ordinal Regression", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Ordinal regression is a fundamental problem within the field of computer vision. While pre-trained vision-language models have exhibited impressive performance on various vision tasks, their potential for ordinal regression has received less exploration.\nIn this paper, we introduce a novel method called RegCLIP, a label-efficient coarse-to-fine method for ordinal regression. This approach incorporates language prior information to gradually refine predictions and achieve fine-grained results.\nOur RegCLIP framework encompasses two levels of coarse-to-fine concepts. The first level is a stagewise approach, performing intermediate classification initially and then refining the predictions. The second level is to generate coarse semantic labels as intermediate classes and subsequently refine them into fine-grained labels. To achieve it, we propose a novel coarse semantic label generation via large language models, which generates coarse labels. To further enhance the precision of predictions, we propose a novel fine-grained cross-modal ranking-based loss specifically designed to update fine-grained semantic labels with both semantic and ordinal alignment. 
Experimental results on three general ordinal regression tasks demonstrate the effectiveness of RegCLIP, exceeding state-of-the-art methods with a large margin, with 10% overall accuracy improvement on historical image dating, 1.74% overall accuracy improvement on image aesthetics assessment, and 1.33 MAE reduction on age estimation under 1-shot setting.", "keywords": "ordinal regression;contrastive learning;representation learning;vision-language", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Yao DU;Qiang Zhai;Weihang Dai;Xiaomeng Li", "authorids": "~Yao_DU4;~Qiang_Zhai1;~Weihang_Dai1;~Xiaomeng_Li1", "gender": ";M;M;F", "homepage": ";;;https://xmengli.github.io/", "dblp": ";;152/9822;02/9850-1", "google_scholar": ";3I5VuhUAAAAJ;;uVTzPpoAAAAJ", "orcid": ";;;", "linkedin": ";;weihang-dai-89122120;", "or_profile": "~Yao_DU4;~Qiang_Zhai1;~Weihang_Dai1;~Xiaomeng_Li1", "aff": ";Hong Kong University of Science and Technology;Hong Kong University of Science and Technology;Hong Kong University of Science and Technology", "aff_domain": ";ust.hk;ust.hk;ust.hk", "position": ";Postdoc;PhD student;Assistant Professor", "bibtex": "@misc{\ndu2024regclip,\ntitle={Reg{CLIP}: A Label-Efficient Coarse-to-Fine Learner for Ordinal Regression},\nauthor={Yao DU and Qiang Zhai and Weihang Dai and Xiaomeng Li},\nyear={2024},\nurl={https://openreview.net/forum?id=2J25Vi9W8I}\n}", "github": "", "project": "", "reviewers": "BLNi;YX7j;oR5C;i2rY;DJCj", "site": "https://openreview.net/forum?id=2J25Vi9W8I", "pdf_size": 2314841, "rating": "3;3;5;5;8", "confidence": "4;5;5;4;5", "soundness": "3;2;2;3;3", "contribution": "2;2;2;2;3", "presentation": "2;3;3;2;3", "wc_summary": "65;72;83;54;76", "wc_strengths": "69;47;89;89;36", "wc_weaknesses": "85;119;169;77;180", "wc_questions": "124;151;5;13;79", "wc_review": "343;389;346;233;371", "wc_reply_reviewers": "0;0;0;0;0", "wc_reply_authors": "0;0;0;0;0", "reply_reviewers": "0;0;0;0;0", "reply_authors": "0;0;0;0;0", "rating_avg": [ 4.8, 1.8330302779823362 ], "confidence_avg": [ 4.6, 0.48989794855663565 ], "soundness_avg": [ 2.6, 0.4898979485566356 ], "contribution_avg": [ 2.2, 0.39999999999999997 ], "presentation_avg": [ 2.6, 0.4898979485566356 ], "wc_summary_avg": [ 70.0, 9.899494936611665 ], "wc_strengths_avg": [ 66.0, 21.577766334817884 ], "wc_weaknesses_avg": [ 126.0, 42.180564244685016 ], "wc_questions_avg": [ 74.4, 58.1982817615778 ], "wc_review_avg": [ 336.4, 54.38970490819012 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.35634832254989907, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:D9tgn8I8_lYJ:scholar.google.com/&scioq=RegCLIP:+A+Label-Efficient+Coarse-to-Fine+Learner+for+Ordinal+Regression&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;0", "aff_unique_norm": "Hong Kong University of Science and Technology", "aff_unique_dep": "", "aff_unique_url": "https://www.ust.hk", "aff_unique_abbr": "HKUST", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Hong Kong SAR", "aff_country_unique_index": "0;0;0", "aff_country_unique": "China" }, { "title": "Lipsum-FT: Robust Fine-Tuning of Zero-Shot Models Using Random Text Guidance", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19555", "id": "2JF8mJRJ7M", 
"author_site": "Giung Nam, Byeongho Heo, Juho Lee", "tldr": "", "abstract": "Large-scale contrastive vision-language pre-trained models provide the zero-shot model achieving competitive performance across a range of image classification tasks without requiring training on downstream data. Recent works have confirmed that while additional fine-tuning of the zero-shot model on the reference data results in enhanced downstream performance, it compromises the model's robustness against distribution shifts. Our investigation begins by examining the conditions required to achieve the goals of robust fine-tuning, employing descriptions based on feature distortion theory and joint energy-based models. Subsequently, we propose a novel robust fine-tuning algorithm, Lipsum-FT, that effectively utilizes the language modeling aspect of the vision-language pre-trained models. Extensive experiments conducted on distribution shift scenarios in DomainNet and ImageNet confirm the superiority of our proposed Lipsum-FT approach over existing robust fine-tuning methods.", "keywords": "computer vision;vision-langauge model;transfer learning;fine-tuning;distribution shifts", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "/attachment/f06d7c8550270c7566e73feb061af263396284a3.zip", "author": "Giung Nam;Byeongho Heo;Juho Lee", "authorids": "~Giung_Nam1;~Byeongho_Heo1;~Juho_Lee2", "gender": ";M;M", "homepage": "https://cs-giung.github.io/;https://sites.google.com/view/byeongho-heo/home;https://juho.lee.github.io", "dblp": "304/9008;142/2705;55/3410-1", "google_scholar": "https://scholar.google.co.kr/citations?user=HO-fMd8AAAAJ;https://scholar.google.co.kr/citations?user=4_7rLDIAAAAJ;Py4URJUAAAAJ", "orcid": ";;", "linkedin": ";byeongho-heo-1a7756122/;", "or_profile": "~Giung_Nam1;~Byeongho_Heo1;~Juho_Lee2", "aff": "Korea Advanced Institute of Science & Technology;NAVER AI Lab;Korea Advanced Institute of Science & Technology", "aff_domain": "kaist.ac.kr;navercorp.com;kaist.ac.kr", "position": "PhD student;Researcher;Associate Professor", "bibtex": "@inproceedings{\nnam2024lipsumft,\ntitle={Lipsum-{FT}: Robust Fine-Tuning of Zero-Shot Models Using Random Text Guidance},\nauthor={Giung Nam and Byeongho Heo and Juho Lee},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=2JF8mJRJ7M}\n}", "github": "", "project": "", "reviewers": "2e7P;Q7od;26HN;MuzV", "pdf_size": 6394826, "rating": "5;6;6;6", "confidence": "4;5;3;4", "soundness": "2;3;3;3", "contribution": "2;2;2;3", "presentation": "2;3;2;3", "wc_summary": "21;63;67;103", "wc_strengths": "38;46;86;97", "wc_weaknesses": "18;170;71;86", "wc_questions": "122;17;119;204", "wc_review": "199;296;343;490", "wc_reply_reviewers": "157;38;227;35", "wc_reply_authors": "1326;740;1665;845", "reply_reviewers": "2;1;2;1", "reply_authors": "3;2;4;3", "rating_avg": [ 5.75, 0.4330127018922193 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 63.5, 29.06458325866724 ], "wc_strengths_avg": [ 66.75, 25.21284394906691 ], "wc_weaknesses_avg": [ 86.25, 54.554445281754994 ], "wc_questions_avg": [ 115.5, 66.31176366226433 ], "wc_review_avg": [ 332.0, 104.96427963836078 ], "wc_reply_reviewers_avg": [ 114.25, 81.60078124626014 ], "wc_reply_authors_avg": [ 1144.0, 373.22312361374395 ], "reply_reviewers_avg": [ 1.5, 
0.5 ], "reply_authors_avg": [ 3.0, 0.7071067811865476 ], "replies_avg": [ 27, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 10, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5894155217848335541&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=2JF8mJRJ7M", "pdf": "https://openreview.net/pdf?id=2JF8mJRJ7M", "email": "kaist.ac.kr;navercorp.com;kaist.ac.kr", "author_num": 3, "aff_unique_index": "0;1;0", "aff_unique_norm": "Korea Advanced Institute of Science and Technology;NAVER Corporation", "aff_unique_dep": ";NAVER AI Lab", "aff_unique_url": "https://www.kaist.ac.kr;https://www.naver.com", "aff_unique_abbr": "KAIST;NAVER", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "South Korea" }, { "id": "2Kf1AIdeyt", "title": "Balancing Information Preservation and Computational Efficiency: L2 Normalization and Geodesic Distance in Manifold Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "Distinguishable metric of similarity plays a fundamental role in unsupervised learning, particularly in manifold learning and high-dimensional data visualization tasks, by which differentiate between observations without labels. However, conventional metrics like Euclidean distance after L1-normalization may fail by losing distinguishable information when handling high-dimensional data, where the distance between different observations gradually converges to a shrinking interval. In this article, we discuss the influence of normalization by different p-norms and the defect of Euclidean distance. We discover that observation differences are better preserved when normalizing data by a higher p-norm and using geodesic distance rather than Euclidean distance as the similarity measurement. We further identify that L2-normalization onto the hypersphere is often sufficient in preserving delicate differences even in relatively high dimensional data while maintaining computational efficiency. Subsequently, we present HS-SNE (HyperSphere-SNE), a hypersphere-representation-system-based augmentation to t-SNE, which effectively addresses the intricacy of high-dimensional data visualization and similarity measurement. 
Our results show that this hypersphere representation system has improved resolution to identify more subtle differences in high-dimensional data, while balancing information preservation and computational efficiency.", "keywords": "Normalization;Geodesic Distance;Manifold Learning;Bioinformatics", "primary_area": "visualization or interpretation of learned representations", "supplementary_material": "", "author": "Ziqi Rong;Jinpu Cai;Jiahao Qiu;Pengcheng Xu;Lana Garmire;Qiuyu Lian;Hongyi Xin", "authorids": "~Ziqi_Rong1;~Jinpu_Cai1;~Jiahao_Qiu1;~Pengcheng_Xu2;~Lana_Garmire1;~Qiuyu_Lian1;~Hongyi_Xin1", "gender": "M;M;M;Not Specified;;F;M", "homepage": "https://zqrong.com;https://carroll105.github.io/;;https://explcre.github.io;https://garmiregroup.org/;https://scholar.google.com/citations?user=sfD9B58AAAAJ&hl=en&oi=ao;http://gift.sjtu.edu.cn/novellab/", "dblp": ";279/6161;;;;;", "google_scholar": "oTH0DJcAAAAJ;Bmsg17YAAAAJ;86dbUg4AAAAJ;;6_k2UGsAAAAJ;sfD9B58AAAAJ;U7vpUGkAAAAJ", "orcid": "0000-0003-3760-8450;0009-0004-8636-3925;0009-0000-7752-4169;0009-0000-9858-9316;0000-0002-4654-2126;0000-0002-5279-1989;0000-0003-2864-7386", "linkedin": ";;jiahao-qiu-6a6161224/;pengcheng-xu-ryan/;;;", "or_profile": "~Ziqi_Rong1;~Jinpu_Cai1;~Jiahao_Qiu1;~Pengcheng_Xu2;~Lana_Garmire1;~Qiuyu_Lian1;~Hongyi_Xin1", "aff": "University of Michigan - Ann Arbor;Shanghai Jiaotong University;Princeton University;University of California, Irvine;University of Michigan - Ann Arbor;University of Cambridge;Shanghai Jiaotong University", "aff_domain": "umich.edu;sjtu.edu.cn;princeton.edu;uci.edu;umich.edu;cam.ac.uk;sjtu.edu.cn", "position": "MS student;PhD student;PhD student;PhD student;Associate Professor;Postdoc;Associate Professor", "bibtex": "@misc{\nrong2024balancing,\ntitle={Balancing Information Preservation and Computational Efficiency: L2 Normalization and Geodesic Distance in Manifold Learning},\nauthor={Ziqi Rong and Jinpu Cai and Jiahao Qiu and Pengcheng Xu and Lana Garmire and Qiuyu Lian and Hongyi Xin},\nyear={2024},\nurl={https://openreview.net/forum?id=2Kf1AIdeyt}\n}", "github": "", "project": "", "reviewers": "mtLk;2wH8;FzWv", "site": "https://openreview.net/forum?id=2Kf1AIdeyt", "pdf_size": 14210904, "rating": "3;3;5", "confidence": "5;5;4", "soundness": "2;2;2", "contribution": "1;2;2", "presentation": "3;2;3", "wc_summary": "85;94;73", "wc_strengths": "40;94;33", "wc_weaknesses": "69;158;42", "wc_questions": "374;158;55", "wc_review": "568;504;203", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 3.6666666666666665, 0.9428090415820634 ], "confidence_avg": [ 4.666666666666667, 0.4714045207910317 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 1.6666666666666667, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 84.0, 8.602325267042627 ], "wc_strengths_avg": [ 55.666666666666664, 27.255988129012838 ], "wc_weaknesses_avg": [ 89.66666666666667, 49.56028876249837 ], "wc_questions_avg": [ 195.66666666666666, 132.92688048530874 ], "wc_review_avg": [ 425.0, 159.1372573179099 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -1.0, "gs_citation": 0, "gs_cited_by_link": 
"https://scholar.google.com/scholar?q=related:TapYTLI9GGIJ:scholar.google.com/&scioq=Balancing+Information+Preservation+and+Computational+Efficiency:+L2+Normalization+and+Geodesic+Distance+in+Manifold+Learning&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;1;2;3;0;4;1", "aff_unique_norm": "University of Michigan;Shanghai Jiao Tong University;Princeton University;University of California, Irvine;University of Cambridge", "aff_unique_dep": ";;;;", "aff_unique_url": "https://www.umich.edu;https://www.sjtu.edu.cn;https://www.princeton.edu;https://www.uci.edu;https://www.cam.ac.uk", "aff_unique_abbr": "UM;SJTU;Princeton;UCI;Cambridge", "aff_campus_unique_index": "0;2;0;3", "aff_campus_unique": "Ann Arbor;;Irvine;Cambridge", "aff_country_unique_index": "0;1;0;0;0;2;1", "aff_country_unique": "United States;China;United Kingdom" }, { "id": "2LhCPowI6i", "title": "Self-Supervised Pseudodata Filtering for Improved Replay with Sub-Optimal Generators", "track": "main", "status": "Reject", "tldr": "", "abstract": "Continual learning on a sequence of tasks without forgetting previously acquired knowledge is one of the main challenges faced by modern deep neural networks. In the class-incremental scenario, one of the most difficult continual learning problems, new classes are presented to a classifier over time. The model needs to be able to learn and recognize these new classes while also retaining its knowledge of previously witnessed ones. To achieve this, the model has to revisit previous classes in some form, either by analysing stored exemplars or by using artificially generated samples. The latter approach, Generative Replay, usually relies on a separate generator trained alongside the main classifier. Since the generator also needs to learn continually, it is retrained on every task, using its own generated samples as training data representing older classes. This can lead to error propagation and accumulating features unimportant or confusing for the classifier, reducing the overall performance for larger numbers of tasks. We propose a simple filtering mechanism for mitigating this issue \u2013 whenever pseudodata is generated for a new task, the classifier can reject samples it is not able to classify with sufficient confidence, thus preventing itself from retraining on poor-quality data. We tested this mechanism using combinations of Bayesian neural classifiers and two different generators: a Variational Autoencoder and Real-value Non-Volume Preserving Normalizing Flow. 
We show that the improvement in the classification accuracy grows with the number of tasks, suggesting this approach is particularly useful for the most challenging continual learning scenarios, where very many tasks are learned in a sequence.", "keywords": "continual learning;catastrophic forgetting;generative replay;bayesian neural networks;deep learning", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "", "author": "Mateusz Wasiluk;Mikkel Elle Lepper\u00f8d;Kai Olav Ellefsen", "authorids": "~Mateusz_Wasiluk1;~Mikkel_Elle_Lepper\u00f8d1;kaiolae@ifi.uio.no", "gender": "M;M;", "homepage": "https://www.mn.uio.no/ibv/english/people/aca/mateuwa/index.html;;", "dblp": ";218/9214;", "google_scholar": ";https://scholar.google.no/citations?user=QSYCR88AAAAJ;", "orcid": ";;", "linkedin": "mwasiluk314/;;", "or_profile": "~Mateusz_Wasiluk1;~Mikkel_Elle_Lepper\u00f8d1;kaiolae@ifi.uio.no", "aff": "University of Oslo;Simula Research Laboratory;", "aff_domain": "uio.no;simula.no;", "position": "PhD student;Principal Researcher;", "bibtex": "@misc{\nwasiluk2024selfsupervised,\ntitle={Self-Supervised Pseudodata Filtering for Improved Replay with Sub-Optimal Generators},\nauthor={Mateusz Wasiluk and Mikkel Elle Lepper{\\o}d and Kai Olav Ellefsen},\nyear={2024},\nurl={https://openreview.net/forum?id=2LhCPowI6i}\n}", "github": "", "project": "", "reviewers": "6px8;yxwt;fB4Z", "site": "https://openreview.net/forum?id=2LhCPowI6i", "pdf_size": 892010, "rating": "1;3;3", "confidence": "5;5;4", "soundness": "2;2;2", "contribution": "1;2;1", "presentation": "3;2;2", "wc_summary": "126;55;62", "wc_strengths": "133;10;41", "wc_weaknesses": "550;147;576", "wc_questions": "36;4;282", "wc_review": "845;216;961", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 2.3333333333333335, 0.9428090415820634 ], "confidence_avg": [ 4.666666666666667, 0.4714045207910317 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 1.3333333333333333, 0.4714045207910317 ], "presentation_avg": [ 2.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 81.0, 31.94787421201396 ], "wc_strengths_avg": [ 61.333333333333336, 52.23238671765078 ], "wc_weaknesses_avg": [ 424.3333333333333, 196.3913326894941 ], "wc_questions_avg": [ 107.33333333333333, 124.19697616644655 ], "wc_review_avg": [ 674.0, 327.29904776315294 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 6, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.4999999999999999, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:hlB2n22EuZIJ:scholar.google.com/&scioq=Self-Supervised+Pseudodata+Filtering+for+Improved+Replay+with+Sub-Optimal+Generators&hl=en&as_sdt=0,33", "gs_version_total": 2, "aff_unique_index": "0;1", "aff_unique_norm": "University of Oslo;Simula Research Laboratory", "aff_unique_dep": ";", "aff_unique_url": "https://www.uio.no;https://www.simula.no", "aff_unique_abbr": "UiO;Simula", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "Norway" }, { "id": "2M4GAkUkjA", "title": "Efficient Link Prediction via GNN Layers Induced by Negative Sampling", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Graph neural networks (GNNs) for link prediction can loosely be divided into two broad categories. 
First, \\emph{node-wise} architectures pre-compute individual embeddings for each node that are later combined by a simple decoder to make predictions. While extremely efficient at inference time (since node embeddings are only computed once and repeatedly reused), model expressiveness is limited such that isomorphic nodes contributing to candidate edges may not be distinguishable, compromising accuracy. In contrast, \\emph{edge-wise} methods rely on the formation of edge-specific subgraph embeddings to enrich the representation of pair-wise relationships, disambiguating isomorphic nodes to improve accuracy, but with the cost of increased model complexity. To better navigate this trade-off, we propose a novel GNN architecture whereby the \\emph{forward pass} explicitly depends on \\emph{both} positive (as is typical) and negative (unique to our approach) edges to inform more flexible, yet still cheap node-wise embeddings. This is achieved by recasting the embeddings themselves as minimizers of a forward-pass-specific energy function (distinct from the actual training loss) that favors separation of positive and negative samples. As demonstrated by extensive empirical evaluations, the resulting architecture retains the inference speed of node-wise models, while producing competitive accuracy with edge-wise alternatives.", "keywords": "Link prediction;Inference speed", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/de12fedf085aa55ceeacfe7e259d100e08382093.zip", "author": "Yuxin Wang;Xiannian Hu;Quan Gan;Xuanjing Huang;Xipeng Qiu;David Wipf", "authorids": "~Yuxin_Wang3;~Xiannian_Hu1;~Quan_Gan1;~Xuanjing_Huang1;~Xipeng_Qiu1;~David_Wipf1", "gender": "M;M;M;F;M;M", "homepage": ";;;https://xuanjing-huang.github.io/;https://xpqiu.github.io/;http://www.davidwipf.com/", "dblp": "68/1041;;72/3872;05/6735-1;69/1395;81/6421", "google_scholar": "bTo8CT0AAAAJ;;;RGsMgZA4H78C;Pq4Yp_kAAAAJ;YJx1WSgAAAAJ", "orcid": ";;0009-0002-0986-457X;0000-0001-9197-9426;0000-0001-7163-5247;", "linkedin": ";\u5148\u5ff5-\u80e1-6b17781a9/;quan-gan-231992136/;;;", "or_profile": "~Yuxin_Wang3;~Xiannian_Hu1;~Quan_Gan1;~Xuanjing_Huang1;~Xipeng_Qiu1;~David_Wipf1", "aff": "Fudan University;Fudan University;Amazon;Fudan University;Fudan University;Amazon AI Research Lab", "aff_domain": "fudan.edu.cn;fudan.edu.cn;amazon.com;fudan.edu.cn;fudan.edu.cn;amazon.com", "position": "PhD student;MS student;Researcher;Full Professor;Full Professor;Principal Research Scientist", "bibtex": "@misc{\nwang2024efficient,\ntitle={Efficient Link Prediction via {GNN} Layers Induced by Negative Sampling},\nauthor={Yuxin Wang and Xiannian Hu and Quan Gan and Xuanjing Huang and Xipeng Qiu and David Wipf},\nyear={2024},\nurl={https://openreview.net/forum?id=2M4GAkUkjA}\n}", "github": "", "project": "", "reviewers": "TNzh;32eE;EieC;pZx7", "site": "https://openreview.net/forum?id=2M4GAkUkjA", "pdf_size": 920133, "rating": "3;5;5;5", "confidence": "4;4;3;2", "soundness": "2;3;3;2", "contribution": "1;2;3;2", "presentation": "3;2;2;2", "wc_summary": "82;25;51;116", "wc_strengths": "28;35;61;30", "wc_weaknesses": "269;174;108;198", "wc_questions": "3;135;3;24", "wc_review": "382;369;223;368", "wc_reply_reviewers": "0;23;0;0", "wc_reply_authors": "756;921;539;1002", "reply_reviewers": "0;1;0;0", "reply_authors": "1;3;1;2", "rating_avg": [ 4.5, 0.8660254037844386 ], "confidence_avg": [ 3.25, 0.82915619758885 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 
2.0, 0.7071067811865476 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 68.5, 34.04776057246644 ], "wc_strengths_avg": [ 38.5, 13.238202294873727 ], "wc_weaknesses_avg": [ 187.25, 57.56463758246029 ], "wc_questions_avg": [ 41.25, 54.8013457863947 ], "wc_review_avg": [ 335.5, 65.18627156081256 ], "wc_reply_reviewers_avg": [ 5.75, 9.959292143521045 ], "wc_reply_authors_avg": [ 804.5, 177.07413701610972 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.75, 0.82915619758885 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.5222329678670935, "gs_citation": 6, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=2917867882034440672&as_sdt=80005&sciodt=0,11&hl=en", "gs_version_total": 8, "aff_unique_index": "0;0;1;0;0;1", "aff_unique_norm": "Fudan University;Amazon", "aff_unique_dep": ";Amazon.com, Inc.", "aff_unique_url": "https://www.fudan.edu.cn;https://www.amazon.com", "aff_unique_abbr": "Fudan;Amazon", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;1;0;0;1", "aff_country_unique": "China;United States" }, { "title": "Pooling Image Datasets with Multiple Covariate Shift and Imbalance", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19554", "id": "2Mo7v69otj", "author_site": "Sotirios Panagiotis Chytas, Vishnu Lokhande, Vikas Singh", "tldr": "", "abstract": "Small sample sizes are common in many disciplines, \nwhich necessitates pooling roughly similar datasets across \nmultiple sites/institutions to study weak but relevant \nassociations between images and disease incidence. Such \ndata often manifest shifts and imbalances in covariates \n(secondary non-imaging data). \nThese issues are well-studied for classical models, but \nthe ideas simply do not apply to overparameterized DNN models. \nConsequently, recent work has shown how strategies from \nfairness and invariant representation learning provides \na meaningful starting point, but the current repertoire \nof methods remains limited to accounting for shifts/imbalances in just a couple of covariates at a time. In this paper, we show how \nviewing this problem from the perspective of Category theory \nprovides a simple and effective solution that completely avoids \nelaborate multi-stage training pipelines that would otherwise be \nneeded. We show the effectiveness of this approach via \nextensive experiments on real datasets. 
Further, we \ndiscuss how our style of formulation offers a unified \nperspective on at least 5+ distinct \nproblem settings in vision, from self-supervised learning\nto matching problems in 3D reconstruction.", "keywords": "image harmonization;medical imaging", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Sotirios Panagiotis Chytas;Vishnu Suresh Lokhande;Vikas Singh", "authorids": "~Sotirios_Panagiotis_Chytas1;~Vishnu_Suresh_Lokhande1;~Vikas_Singh1", "gender": ";;M", "homepage": ";;http://vsingh-www.cs.wisc.edu/", "dblp": ";;", "google_scholar": ";;d32BmwcAAAAJ", "orcid": ";;", "linkedin": ";;", "or_profile": "~Sotirios_Panagiotis_Chytas1;~Vishnu_Suresh_Lokhande1;~Vikas_Singh1", "aff": ";;University of Wisconsin, Madison", "aff_domain": ";;wisc.edu", "position": ";;Professor", "bibtex": "@inproceedings{\nchytas2024pooling,\ntitle={Pooling Image Datasets with Multiple Covariate Shift and Imbalance},\nauthor={Sotirios Panagiotis Chytas and Vishnu Suresh Lokhande and Vikas Singh},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=2Mo7v69otj}\n}", "github": "", "project": "", "reviewers": "zBw9;Fvtj;SjKQ;KLWx", "pdf_size": 2868021, "rating": "5;6;6;8", "confidence": "1;3;3;4", "soundness": "3;3;4;3", "contribution": "2;2;4;3", "presentation": "3;3;3;3", "wc_summary": "21;73;159;122", "wc_strengths": "11;48;42;119", "wc_weaknesses": "6;92;37;235", "wc_questions": "1;5;46;21", "wc_review": "39;218;284;497", "wc_reply_reviewers": "0;0;0;29", "wc_reply_authors": "16;300;304;476", "reply_reviewers": "0;0;0;1", "reply_authors": "1;1;1;2", "rating_avg": [ 6.25, 1.0897247358851685 ], "confidence_avg": [ 2.75, 1.0897247358851685 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.82915619758885 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 93.75, 51.91037950159871 ], "wc_strengths_avg": [ 55.0, 39.528470752104745 ], "wc_weaknesses_avg": [ 92.5, 87.8478798833529 ], "wc_questions_avg": [ 18.25, 17.68297203526602 ], "wc_review_avg": [ 259.5, 163.82078622690102 ], "wc_reply_reviewers_avg": [ 7.25, 12.55736835487436 ], "wc_reply_authors_avg": [ 274.0, 165.03332996701 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.894736842105263, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10639822793901611033&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=2Mo7v69otj", "pdf": "https://openreview.net/pdf?id=2Mo7v69otj", "email": ";;wisc.edu", "author_num": 3, "aff_unique_index": "0", "aff_unique_norm": "University of Wisconsin", "aff_unique_dep": "", "aff_unique_url": "https://www.wisc.edu", "aff_unique_abbr": "UW", "aff_campus_unique_index": "0", "aff_campus_unique": "Madison", "aff_country_unique_index": "0", "aff_country_unique": "United States" }, { "id": "2MpOjashKU", "title": "Divided Attention: Unsupervised Multiple-object Discovery and Segmentation with Interpretable Contextually Separated Slots", "track": "main", "status": "Reject", "tldr": "", "abstract": "We introduce a method to segment the visual field into independently moving regions in real-time, trained without ground truth or supervision, needing neither pre-trained image features nor additional data outside the 
domain of interest. The model consists of an adversarial conditional encoder-decoder architecture based on Slot Attention, modified to use the image as context to decode optical flow without attempting to reconstruct the image itself. One modality (flow) feeds the encoder to produce separate latent codes (slots), whereas the other modality (image) conditions the decoder to generate the first (flow) from the slots. This design frees the representation from having to encode complex nuisance variability in the image due to, for instance, illumination and reflectance properties of the scene. Since customary autoencoding based on minimizing the reconstruction error does not preclude the entire flow from being encoded into a single slot, we design the loss with an adversarial criterion based on Contextual Information Separation. The resulting min-max optimization fosters the separation of objects and their assignment to different attention slots, leading to Divided Attention (DivA). DivA outperforms recent unsupervised multi-object motion segmentation methods while tripling run-time speed up to 104FPS and reducing the performance gap from supervised methods to 12% or less. DivA can handle different numbers of objects and different image resolutions at training and test time, is invariant to the permutation of object labels, and does not require explicit regularization.", "keywords": "Moving object segmentation;Slot attention;Unsupervised object discovery", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Dong Lao;Zhengyang Hu;Francesco Locatello;Yanchao Yang;Stefano Soatto", "authorids": "~Dong_Lao1;~Zhengyang_Hu1;~Francesco_Locatello1;~Yanchao_Yang1;~Stefano_Soatto1", "gender": "M;M;M;M;", "homepage": ";;https://twitter.com/FrancescoLocat8;https://yanchaoyang.github.io/;https://www.cs.ucla.edu/~soatto", "dblp": "180/5522;219/6927-2;195/6074;84/8637-1;08/1262", "google_scholar": "dvQXYW0AAAAJ;qe-fgwYAAAAJ;;r2tKnV4AAAAJ;lH1PdF8AAAAJ", "orcid": ";;;;0000-0003-2902-6362", "linkedin": ";;;;stefano-soatto-5765aa6/", "or_profile": "~Dong_Lao1;~Zhengyang_Hu1;~Francesco_Locatello1;~Yanchao_Yang1;~Stefano_Soatto2", "aff": "University of California, Los Angeles;Hong Kong University;Institute of Science and Technology;University of Hong Kong;UCLA Computer Science Department, University of California, Los Angeles", "aff_domain": "cs.ucla.edu;connect.hku.hk;ist.ac.at;hku.hk;cs.ucla.edu", "position": "Postdoc;PhD student;Assistant Professor;Assistant Professor;Professor", "bibtex": "@misc{\nlao2024divided,\ntitle={Divided Attention: Unsupervised Multiple-object Discovery and Segmentation with Interpretable Contextually Separated Slots},\nauthor={Dong Lao and Zhengyang Hu and Francesco Locatello and Yanchao Yang and Stefano Soatto},\nyear={2024},\nurl={https://openreview.net/forum?id=2MpOjashKU}\n}", "github": "", "project": "", "reviewers": "5Uwa;8fzT;i9DX;RqAo", "site": "https://openreview.net/forum?id=2MpOjashKU", "pdf_size": 8632644, "rating": "5;5;5;6", "confidence": "3;4;5;2", "soundness": "3;3;2;3", "contribution": "3;2;1;3", "presentation": "3;3;3;3", "wc_summary": "66;142;112;58", "wc_strengths": "25;83;48;20", "wc_weaknesses": "187;196;338;6", "wc_questions": "3;15;3;6", "wc_review": "281;436;501;90", "wc_reply_reviewers": "0;135;427;0", "wc_reply_authors": "740;710;1255;59", "reply_reviewers": "0;1;1;0", "reply_authors": "1;1;2;1", "rating_avg": [ 5.25, 0.4330127018922193 ], "confidence_avg": [ 3.5, 
1.118033988749895 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.82915619758885 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 94.5, 34.30378987808781 ], "wc_strengths_avg": [ 44.0, 24.869660230891775 ], "wc_weaknesses_avg": [ 181.75, 117.82693877038476 ], "wc_questions_avg": [ 6.75, 4.9180788932265 ], "wc_review_avg": [ 327.0, 158.46292941883917 ], "wc_reply_reviewers_avg": [ 140.5, 174.35093920022342 ], "wc_reply_authors_avg": [ 691.0, 424.3471456248999 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.7745966692414834, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:oIJpUrYxKIEJ:scholar.google.com/&scioq=Divided+Attention:+Unsupervised+Multiple-object+Discovery+and+Segmentation+with+Interpretable+Contextually+Separated+Slots&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1;2;3;0", "aff_unique_norm": "University of California, Los Angeles;Hong Kong University;Institute of Science and Technology;University of Hong Kong", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.ucla.edu;https://www.hku.hk;;https://www.hku.hk", "aff_unique_abbr": "UCLA;HKU;;HKU", "aff_campus_unique_index": "0;1;1;0", "aff_campus_unique": "Los Angeles;Hong Kong SAR;", "aff_country_unique_index": "0;1;1;0", "aff_country_unique": "United States;China;" }, { "title": "Neural Neighborhood Search for Multi-agent Path Finding", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19553", "id": "2NpAw2QJBY", "author_site": "Zhongxia Yan, Cathy Wu", "tldr": "", "abstract": "Multi-agent path finding (MAPF) is the combinatorial problem of planning optimal collision-avoiding paths for multiple agents, with application to robotics, logistics, and transportation. Though many recent learning-based works have focused on large-scale combinatorial problems by guiding their decomposition into sequences of smaller subproblems, the combined spatiotemporal and time-restricted nature of MAPF poses a particular challenge for learning-based guidance of iterative approaches like large neighborhood search (LNS), which is already a state-of-the-art approach for MAPF even without learning. We address this challenge of neural-guided LNS for MAPF by designing an architecture which interleaves convolution and attention to efficiently represent MAPF subproblems, enabling practical guidance of LNS in benchmark settings. We demonstrate the speedup of our method over existing state-of-the-art LNS-based methods for MAPF as well as the robustness of our method to unseen settings. 
Our proposed method expands the horizon of effective deep learning-guided LNS methods into multi-path planning problems, and our proposed representation may be more broadly applicable for representing path-wise interactions.", "keywords": "Combinatorial Optimization;Neural Architecture;Multi-agent;Path Planning", "primary_area": "applications to robotics, autonomy, planning", "supplementary_material": "/attachment/316fe71d286baf490ed3dadb3478af1d1fc51bd1.pdf", "author": "Zhongxia Yan;Cathy Wu", "authorids": "~Zhongxia_Yan1;~Cathy_Wu1", "gender": "M;F", "homepage": "https://github.com/ZhongxiaYan/;http://wucathy.com", "dblp": "250/0690-1;155/3740", "google_scholar": "jI_wcL8AAAAJ;https://scholar.google.com/citations?hl=en", "orcid": "0000-0003-1897-7381;0000-0001-8594-303X", "linkedin": "zhongxiayan/;cathywu/", "or_profile": "~Zhongxia_Yan1;~Cathy_Wu1", "aff": "Massachusetts Institute of Technology;Massachusetts Institute of Technology", "aff_domain": "mit.edu;mit.edu", "position": "PhD student;Assistant Professor", "bibtex": "@inproceedings{\nyan2024neural,\ntitle={Neural Neighborhood Search for Multi-agent Path Finding},\nauthor={Zhongxia Yan and Cathy Wu},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=2NpAw2QJBY}\n}", "github": "", "project": "", "reviewers": "TyGL;pDBe;TxMF;CV86", "pdf_size": 2380253, "rating": "3;6;6;6", "confidence": "4;3;4;5", "soundness": "2;3;3;3", "contribution": "2;3;3;3", "presentation": "3;4;3;3", "wc_summary": "142;164;122;56", "wc_strengths": "22;126;63;30", "wc_weaknesses": "629;148;140;128", "wc_questions": "103;112;155;96", "wc_review": "896;550;480;310", "wc_reply_reviewers": "222;97;188;28", "wc_reply_authors": "2343;303;659;569", "reply_reviewers": "3;2;1;1", "reply_authors": "5;2;2;2", "rating_avg": [ 5.25, 1.299038105676658 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 121.0, 40.36087214122113 ], "wc_strengths_avg": [ 60.25, 40.95347970563674 ], "wc_weaknesses_avg": [ 261.25, 212.43984442660468 ], "wc_questions_avg": [ 116.5, 22.940139493908923 ], "wc_review_avg": [ 559.0, 213.243991709028 ], "wc_reply_reviewers_avg": [ 133.75, 76.26393315322781 ], "wc_reply_authors_avg": [ 968.5, 804.2902150343494 ], "reply_reviewers_avg": [ 1.75, 0.82915619758885 ], "reply_authors_avg": [ 2.75, 1.299038105676658 ], "replies_avg": [ 28, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 12, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6814423661655057347&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 0, "openreview": "https://openreview.net/forum?id=2NpAw2QJBY", "pdf": "https://openreview.net/pdf?id=2NpAw2QJBY", "email": "mit.edu;mit.edu", "author_num": 2, "aff_unique_index": "0;0", "aff_unique_norm": "Massachusetts Institute of Technology", "aff_unique_dep": "", "aff_unique_url": "https://web.mit.edu", "aff_unique_abbr": "MIT", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "id": "2NwHLAffZZ", "title": "Weak Correlations as the Underlying Principle for Linearization of Gradient-Based Learning Systems", "track": "main", "status": "Reject", "tldr": "", "abstract": "Numerous deep learning models including wide neural networks, can be conceptualized as nonlinear dynamical physical 
systems with a large number of interacting degrees of freedom, which, in the infinite limit, exhibit simplified dynamics. In this work we analyze gradient descent based learning systems that demonstrate a linear learning structure in their parameters, analogous to the neural tangent kernel. We establish that this linearity is equivalent to weak correlations between the first and higher derivatives of the hypothesis function with respect to the parameters around their initial values, suggesting that these weak correlations are the underlying reason for the observed linearization of these systems. We demonstrate the weak correlations structure in the example of neural networks in the large width limit. By leveraging the equivalence between linearity and weak correlations, we derive a bound on the deviation from linearity along the training path for stochastic gradient descent. To facilitate our proof, we introduce a method to bound the asymptotic behavior of random tensors, and demonstrate that any such tensor possesses a unique tight bound.", "keywords": "Neural Tangent Kernel;Deep Learning and representational learning;Kernels;Statistical Mechanics", "primary_area": "metric learning, kernel learning, and sparse coding", "supplementary_material": "/attachment/31b48e0d67630d450c93436c3d0ce3d89860f93e.pdf", "author": "Ori Shem Ur;Yaron Oz", "authorids": "~Ori_Shem_Ur1;~Yaron_Oz1", "gender": "M;", "homepage": "https://scholar.google.com/citations?hl=iw&user=O4NfrZYAAAAJ;", "dblp": ";", "google_scholar": ";", "orcid": ";", "linkedin": ";", "or_profile": "~Ori_Shem_Ur1;~Yaron_Oz1", "aff": "Tel Aviv University;Tel Aviv University, Technion", "aff_domain": "tau.ac.il;tau.ac.il", "position": "MS student;Full Professor", "bibtex": "@misc{\nur2024weak,\ntitle={Weak Correlations as the Underlying Principle for Linearization of Gradient-Based Learning Systems},\nauthor={Ori Shem Ur and Yaron Oz},\nyear={2024},\nurl={https://openreview.net/forum?id=2NwHLAffZZ}\n}", "github": "", "project": "", "reviewers": "VTRJ;YXgU;ZGhT", "site": "https://openreview.net/forum?id=2NwHLAffZZ", "pdf_size": 278044, "rating": "1;3;3", "confidence": "4;3;4", "soundness": "1;2;2", "contribution": "4;2;1", "presentation": "1;2;1", "wc_summary": "130;302;65", "wc_strengths": "85;50;14", "wc_weaknesses": "209;120;614", "wc_questions": "180;34;1", "wc_review": "604;506;694", "wc_reply_reviewers": "64;0;0", "wc_reply_authors": "70;70;70", "reply_reviewers": "1;0;0", "reply_authors": "1;1;1", "rating_avg": [ 2.3333333333333335, 0.9428090415820634 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 1.6666666666666667, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 1.247219128924647 ], "presentation_avg": [ 1.3333333333333333, 0.4714045207910317 ], "wc_summary_avg": [ 165.66666666666666, 99.98777703077289 ], "wc_strengths_avg": [ 49.666666666666664, 28.986586936412884 ], "wc_weaknesses_avg": [ 314.3333333333333, 214.98888860176524 ], "wc_questions_avg": [ 71.66666666666667, 77.7788888809525 ], "wc_review_avg": [ 601.3333333333334, 76.77383813658285 ], "wc_reply_reviewers_avg": [ 21.333333333333332, 30.169889330626027 ], "wc_reply_authors_avg": [ 70.0, 0.0 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 9, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.5, "gs_citation": 0, "gs_cited_by_link": 
"https://scholar.google.com/scholar?q=related:v-FlDGJtsIwJ:scholar.google.com/&scioq=Weak+Correlations+as+the+Underlying+Principle+for+Linearization+of+Gradient-Based+Learning+Systems&hl=en&as_sdt=0,23", "gs_version_total": 4, "aff_unique_index": "0;0", "aff_unique_norm": "Tel Aviv University", "aff_unique_dep": "", "aff_unique_url": "https://www.tau.ac.il", "aff_unique_abbr": "TAU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "Israel" }, { "id": "2O2FOO8pl4", "title": "Label Privacy Source Coding in Vertical Federated Learning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "We study label privacy protection in vertical federated learning (VFL). VFL enables an active party who possesses labeled data to improve model performance (utility) by collaborating with passive parties who have auxiliary features. Recently, there has been a growing concern for protecting label privacy against semi-honest passive parties who may surreptitiously deduce private labels from the output of their bottom models. However, existing studies do not remove the prior label information in the active party's features from labels in an offline phase, thus leaking unnecessary label privacy to passive parties.\nIn contrast to existing methods that focus on training-phase perturbation, we propose a novel offline-phase data cleansing approach to protect label privacy without compromising utility. Specifically, we first formulate a Label Privacy Source Coding (LPSC) problem to remove the redundant label information in the active party's features from labels, by assigning each sample a new weight and label (i.e., residual) for federated training. We give a privacy guarantee and theoretically prove that gradient boosting efficiently optimizes the LPSC problem. Therefore, we propose the Vertical Federated Gradient Boosting (VFGBoost) framework to address the LPSC problem. Moreover, given that LPSC only provides upper-bounded privacy enhancement, VFGBoost further enables a flexible privacy-utility trade-off by incorporating adversarial training during federated training. 
Experimental results on four real-world datasets substantiate the efficacy of LPSC and the superiority of our VFGBoost framework.", "keywords": "Label privacy;Vertical Federated learning;Gradient boosting;Adversarial training", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "Dashan Gao;Sheng Wan;Hanlin Gu;Lixin Fan;Xin Yao;Qiang Yang", "authorids": "~Dashan_Gao4;~Sheng_Wan2;~Hanlin_Gu1;~Lixin_Fan1;~Xin_Yao1;~Qiang_Yang1", "gender": "M;M;M;M;;", "homepage": "https://dashangao.github.io/;https://scholar.google.com/citations?user=CKfbX4AAAAAJ&hl=en&oi=ao;;;http://www.cs.bham.ac.uk/~xin;", "dblp": "https://dblp.uni-trier.de/pid/37/2326-2.html;;236/6661;36/3111;;", "google_scholar": "7WVd9ZwAAAAJ;;https://scholar.google.com/citations?hl=zh-CN;https://scholar.google.com/citations?hl=en;;", "orcid": ";;0000-0001-8266-4561;;;", "linkedin": ";;;;;", "or_profile": "~Dashan_Gao4;~Sheng_Wan2;~Hanlin_Gu1;~Lixin_Fan1;~Xin_Yao1;~Qiang_Yang1", "aff": "Department of Computer Science and Engineering, Hong Kong University of Science and Technology;Hong Kong University of Science and Technology;webank;WeBank;;", "aff_domain": "cse.ust.hk;hkust.edu;webank.com;webank.com;;", "position": "PhD student;PhD student;Researcher;Principal Researcher;;", "bibtex": "@misc{\ngao2024label,\ntitle={Label Privacy Source Coding in Vertical Federated Learning},\nauthor={Dashan Gao and Sheng Wan and Hanlin Gu and Lixin Fan and Xin Yao and Qiang Yang},\nyear={2024},\nurl={https://openreview.net/forum?id=2O2FOO8pl4}\n}", "github": "", "project": "", "reviewers": "wj8U;pUxt;WYNH;3hcA", "site": "https://openreview.net/forum?id=2O2FOO8pl4", "pdf_size": 1590599, "rating": "5;5;5;6", "confidence": "4;5;4;3", "soundness": "3;3;2;3", "contribution": "3;3;2;3", "presentation": "1;2;3;3", "wc_summary": "135;64;71;115", "wc_strengths": "35;51;12;36", "wc_weaknesses": "140;222;127;21", "wc_questions": "89;55;3;125", "wc_review": "399;392;213;297", "wc_reply_reviewers": "95;151;0;11", "wc_reply_authors": "1997;1721;987;1193", "reply_reviewers": "1;1;0;1", "reply_authors": "5;5;4;3", "rating_avg": [ 5.25, 0.4330127018922193 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 2.25, 0.82915619758885 ], "wc_summary_avg": [ 96.25, 29.710057219736214 ], "wc_strengths_avg": [ 33.5, 13.937359864766353 ], "wc_weaknesses_avg": [ 127.5, 71.46502641152524 ], "wc_questions_avg": [ 68.0, 44.955533585978046 ], "wc_review_avg": [ 325.25, 76.3098126062435 ], "wc_reply_reviewers_avg": [ 64.25, 62.118334652500145 ], "wc_reply_authors_avg": [ 1474.5, 403.3196623027447 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 4.25, 0.82915619758885 ], "replies_avg": [ 29, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.816496580927726, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:LVFcbT-J5L4J:scholar.google.com/&scioq=Label+Privacy+Source+Coding+in+Vertical+Federated+Learning&hl=en&as_sdt=0,5", "gs_version_total": 4, "aff_unique_index": "0;0;1;1", "aff_unique_norm": "Hong Kong University of Science and Technology;WeBank", "aff_unique_dep": "Department of Computer Science and Engineering;", "aff_unique_url": "https://www.ust.hk;https://www.webank.com", "aff_unique_abbr": "HKUST;WeBank", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Hong Kong SAR;", "aff_country_unique_index": "0;0;0;0", 
"aff_country_unique": "China" }, { "title": "PerceptionCLIP: Visual Classification by Inferring and Conditioning on Contexts", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19552", "id": "2Oiee202rd", "author_site": "Bang An, Sicheng Zhu, Michael-Andrei Panaitescu-Liess, Chaithanya Kumar Mummadi, Furong Huang", "tldr": "", "abstract": "Vision-language models like CLIP are widely used in zero-shot image classification due to their ability to understand various visual concepts and natural language descriptions. However, how to fully leverage CLIP's unprecedented human-like understanding capabilities to achieve better performance is still an open question. This paper draws inspiration from the human visual perception process: when classifying an object, humans first infer contextual attributes (e.g., background and orientation) which help separate the foreground object from the background, and then classify the object based on this information. Inspired by it, we observe that providing CLIP with contextual attributes improves zero-shot image classification and mitigates reliance on spurious features. We also observe that CLIP itself can reasonably infer the attributes from an image. With these observations, we propose a training-free, two-step zero-shot classification method PerceptionCLIP. Given an image, it first infers contextual attributes (e.g., background) and then performs object classification conditioning on them. Our experiments show that PerceptionCLIP achieves better generalization, group robustness, and interpretability.", "keywords": "vision-language model;CLIP;zero-shot;image classification;human perception;contexts;contextual attributes;spurious feature", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Bang An;Sicheng Zhu;Michael-Andrei Panaitescu-Liess;Chaithanya Kumar Mummadi;Furong Huang", "authorids": "~Bang_An1;~Sicheng_Zhu1;~Michael-Andrei_Panaitescu-Liess1;~Chaithanya_Kumar_Mummadi1;~Furong_Huang1", "gender": ";M;M;M;F", "homepage": "https://bangann.github.io/;https://schzhu.github.io/;;;https://furong-huang.com", "dblp": "188/0741;;263/6954.html;208/6386;72/8513", "google_scholar": "3ce6z_sAAAAJ;;MOP6lhkAAAAJ;XJLtaG4AAAAJ;13yyuCcAAAAJ", "orcid": ";;;0000-0002-1173-2720;", "linkedin": ";;michael-panaitescu-0849a3182/;;", "or_profile": "~Bang_An1;~Sicheng_Zhu1;~Michael-Andrei_Panaitescu-Liess1;~Chaithanya_Kumar_Mummadi1;~Furong_Huang1", "aff": "University of Maryland, College Park;University of Maryland, College Park;University of Maryland, College Park;Bosch Center for Artificial Intelligence;University of Maryland", "aff_domain": "umd.edu;umd.edu;umd.edu;bosch.com;cs.umd.edu", "position": "PhD student;PhD student;PhD student;Researcher;Assistant Professor", "bibtex": "@inproceedings{\nan2024perceptionclip,\ntitle={Perception{CLIP}: Visual Classification by Inferring and Conditioning on Contexts},\nauthor={Bang An and Sicheng Zhu and Michael-Andrei Panaitescu-Liess and Chaithanya Kumar Mummadi and Furong Huang},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=2Oiee202rd}\n}", "github": "", "project": "", "reviewers": "vx4m;U13E;k2xX;VSta", "pdf_size": 10417446, "rating": "5;5;6;8", "confidence": "4;4;4;3", "soundness": "2;2;3;3", "contribution": "3;3;3;3", "presentation": "4;3;3;4", "wc_summary": "31;69;100;37", "wc_strengths": "72;33;44;64", "wc_weaknesses": 
"312;246;263;17", "wc_questions": "5;13;77;44", "wc_review": "420;361;484;162", "wc_reply_reviewers": "214;15;0;0", "wc_reply_authors": "1015;1569;974;195", "reply_reviewers": "1;1;0;0", "reply_authors": "2;5;2;1", "rating_avg": [ 6.0, 1.224744871391589 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 3.5, 0.5 ], "wc_summary_avg": [ 59.25, 27.60774347895894 ], "wc_strengths_avg": [ 53.25, 15.514106484100203 ], "wc_weaknesses_avg": [ 209.5, 113.75082417283842 ], "wc_questions_avg": [ 34.75, 28.411045387313717 ], "wc_review_avg": [ 356.75, 120.55989175509407 ], "wc_reply_reviewers_avg": [ 57.25, 90.70660119307745 ], "wc_reply_authors_avg": [ 938.25, 489.2429738892527 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 2.5, 1.5 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.9428090415820632, "gs_citation": 9, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=3534252523528312436&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=2Oiee202rd", "pdf": "https://openreview.net/pdf?id=2Oiee202rd", "email": "umd.edu;umd.edu;umd.edu;bosch.com;cs.umd.edu", "author_num": 5, "aff_unique_index": "0;0;0;1;0", "aff_unique_norm": "University of Maryland;Bosch Center for Artificial Intelligence", "aff_unique_dep": ";Center for Artificial Intelligence", "aff_unique_url": "https://www/umd.edu;https://www.bosch-ai.com", "aff_unique_abbr": "UMD;BCAI", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "College Park;", "aff_country_unique_index": "0;0;0;1;0", "aff_country_unique": "United States;Germany" }, { "id": "2OwSqvxjP2", "title": "Boosting Semi-Supervised Learning via Variational Confidence Calibration and Unlabeled Sample Elimination", "track": "main", "status": "Reject", "tldr": "", "abstract": "Despite the recent progress of Semi-supervised Learning (SSL), we argue that the existing methods may not employ unlabeled examples effectively and efficiently. Many pseudo-label-based methods select unlabeled examples into the training stage based on the inaccurate confidence scores provided by the output layer of the classifier network. Additionally, most prior work typically adpots all the available unlabeled examples without data pruning, which is incapable of learning from massive unlabeled data. To address these issues, this paper proposes two methods called VCC (Variational Confidence Calibration) and INFUSE (INfluence-Function-based Unlabeled Sample Elimination). VCC is a general-purpose plugin of confidence calibration for SSL. By approximating the calibrated confidence through three types of consistency scores, a variational autoencoder is leveraged to reconstruct the confidence score for selecting more accurate pseudo-labels. Based on the influence function, INFUSE is a data pruning method for constructing a core dataset of unlabeled examples. The effectiveness of our methods is demonstrated through experiments on multiple datasets and in various settings. For example, on the CIFAR-100 dataset with 400 labeled examples, VCC reduces the classification error rate of FixMatch from 46.47\\% to 43.31\\% (with improvement of 3.16\\%). On the SVHN dataset with 250 labeled examples, INFUSE achieves 2.61\\% error rate using only 10\\% unlabeled data, which is better than RETRIEVE (2.90\\%) and the baseline with full unlabeled data (3.80\\%). 
Putting all the pieces together, the combined VCC-INFUSE plugins can reduce the error rate of FlexMatch from 26.49\\% to 25.41\\% on the CIFAR100 dataset (with improvement of 1.08\\%) while saving nearly half of the original training time (from 223.96 GPU hours to 115.47 GPU hours).", "keywords": "Semi-Supervised Learning;Calibration;Sample Elimination", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Qianhan Feng;Shijie Fang;Tong Lin", "authorids": "~Qianhan_Feng1;~Shijie_Fang1;~Tong_Lin1", "gender": "M;M;M", "homepage": "https://fqhank.github.io/fengqianhan.github.io/;;https://sai.pku.edu.cn/szdw/zzjs/lt.htm", "dblp": "300/5376;;74/5719-2", "google_scholar": "HtigWVwAAAAJ;;", "orcid": "0009-0009-4552-0046;;0000-0002-0000-834X", "linkedin": ";%E4%BB%95%E6%9D%B0-%E6%96%B9-35259817a/;", "or_profile": "~Qianhan_Feng1;~Shijie_Fang1;~Tong_Lin1", "aff": "Peking University;;Peking University", "aff_domain": "stu.pku.edu.cn;;pku.edu.cn", "position": "MS student;;Associate Professor", "bibtex": "@misc{\nfeng2024boosting,\ntitle={Boosting Semi-Supervised Learning via Variational Confidence Calibration and Unlabeled Sample Elimination},\nauthor={Qianhan Feng and Shijie Fang and Tong Lin},\nyear={2024},\nurl={https://openreview.net/forum?id=2OwSqvxjP2}\n}", "github": "", "project": "", "reviewers": "iR75;LFY9;5hwM;o4va", "site": "https://openreview.net/forum?id=2OwSqvxjP2", "pdf_size": 1387865, "rating": "5;5;6;6", "confidence": "5;4;4;3", "soundness": "2;2;3;4", "contribution": "2;2;3;3", "presentation": "3;3;2;4", "wc_summary": "71;111;43;160", "wc_strengths": "67;43;145;82", "wc_weaknesses": "77;144;198;37", "wc_questions": "113;5;89;39", "wc_review": "328;303;475;318", "wc_reply_reviewers": "37;109;0;0", "wc_reply_authors": "481;390;764;391", "reply_reviewers": "1;1;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 5.5, 0.5 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.75, 0.82915619758885 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 96.25, 44.030529181466804 ], "wc_strengths_avg": [ 84.25, 37.7317836843158 ], "wc_weaknesses_avg": [ 114.0, 61.75354240851289 ], "wc_questions_avg": [ 61.5, 42.1515124283815 ], "wc_review_avg": [ 356.0, 69.27842376959799 ], "wc_reply_reviewers_avg": [ 36.5, 44.5 ], "wc_reply_authors_avg": [ 506.5, 153.19024120354402 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.7071067811865475, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:N2y3YCLFpJsJ:scholar.google.com/&scioq=Boosting+Semi-Supervised+Learning+via+Variational+Confidence+Calibration+and+Unlabeled+Sample+Elimination&hl=en&as_sdt=0,10", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "Peking University", "aff_unique_dep": "", "aff_unique_url": "http://www.pku.edu.cn", "aff_unique_abbr": "Peking U", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "China" }, { "id": "2PKZtPMyvI", "title": "An Intrinsic Dimension Perspective of Transformers for Sequential Modeling", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Transformers have become immensely popular for sequential modeling, particularly in domains like natural language processing (NLP).\nRecent innovations have introduced various 
architectures based on the Transformer framework, resulting in significant advancements in applications.\nHowever, the underlying mechanics of these architectures are still somewhat enigmatic.\nIn this study, we explore the geometrical characteristics of data representations learned by Transformers using a mathematical metric known as intrinsic dimension (ID). This can be conceptualized as the minimum parameter count needed for effective modeling.\nA sequence of experiments, predominantly centered on text classification, support the ensuing empirical observations regarding the correlation between embedding dimension, layer depth, individual layer ID, and task performance.\nInterestingly, we note that a higher terminal feature ID, when obtained from Transformers, generally correlates with a lower classification error rate. \nThis stands in contrast to the behavior observed in CNNs (and other models) during image classification tasks. Furthermore, our data suggests that the ID for each layer tends to diminish as layer depth increases, with this decline being notably steeper in more intricate architectures.\nWe also present numerical evidence highlighting the geometrical constructs of data representations as interpreted by Transformers, indicating that only nonlinear dimension reduction is achievable.\nLastly, we delve into how varying sequence lengths impact both ID and task performance, confirming the efficacy of data reduction during training.\nOur ambition is for these insights to offer direction in the choice of hyper-parameters and the application of dimension/data reduction when using Transformers for text classification and other prevalent NLP tasks.", "keywords": "Transformers;Intrinsic Dimension;Hyperparameter Optimization;Natural Language Processing", "primary_area": "visualization or interpretation of learned representations", "supplementary_material": "", "author": "Zeping Min;Qian Ge;Zhong Li", "authorids": "~Zeping_Min1;~Qian_Ge4;~Zhong_Li2", "gender": ";M;M", "homepage": ";;https://www.microsoft.com/en-us/research/people/lzhong/", "dblp": ";153/5844;", "google_scholar": ";;https://scholar.google.com/citations?view_op=list_works", "orcid": ";;", "linkedin": ";;", "or_profile": "~Zeping_Min1;~Qian_Ge4;~Zhong_Li2", "aff": ";Peking University;Microsoft Research Asia", "aff_domain": ";pku.edu.cn;microsoft.com", "position": ";MS student;Researcher", "bibtex": "@misc{\nmin2024an,\ntitle={An Intrinsic Dimension Perspective of Transformers for Sequential Modeling},\nauthor={Zeping Min and Qian Ge and Zhong Li},\nyear={2024},\nurl={https://openreview.net/forum?id=2PKZtPMyvI}\n}", "github": "", "project": "", "reviewers": "K7iN;LFkQ;rhBS;wsLx;h8wB", "site": "https://openreview.net/forum?id=2PKZtPMyvI", "pdf_size": 2383678, "rating": "1;3;3;3;5", "confidence": "4;5;4;4;4", "soundness": "2;2;1;2;2", "contribution": "1;2;2;2;2", "presentation": "2;3;1;3;3", "wc_summary": "41;84;74;35;99", "wc_strengths": "1;30;33;63;84", "wc_weaknesses": "41;116;47;428;151", "wc_questions": "2;228;488;26;122", "wc_review": "85;458;642;552;456", "wc_reply_reviewers": "0;0;0;0;0", "wc_reply_authors": "0;0;0;0;0", "reply_reviewers": "0;0;0;0;0", "reply_authors": "0;0;0;0;0", "rating_avg": [ 3.0, 1.2649110640673518 ], "confidence_avg": [ 4.2, 0.39999999999999997 ], "soundness_avg": [ 1.8, 0.4 ], "contribution_avg": [ 1.8, 0.4000000000000001 ], "presentation_avg": [ 2.4, 0.8 ], "wc_summary_avg": [ 66.6, 24.743483990739865 ], "wc_strengths_avg": [ 42.2, 28.67333255831976 ], "wc_weaknesses_avg": [ 156.6, 
141.92476880375744 ], "wc_questions_avg": [ 173.2, 176.46574738458455 ], "wc_review_avg": [ 438.6, 189.706721019578 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:hSxBdp0VlzoJ:scholar.google.com/&scioq=An+Intrinsic+Dimension+Perspective+of+Transformers+for+Sequential+Modeling&hl=en&as_sdt=0,5", "gs_version_total": 3, "aff_unique_index": "0;1", "aff_unique_norm": "Peking University;Microsoft", "aff_unique_dep": ";Research", "aff_unique_url": "http://www.pku.edu.cn;https://www.microsoft.com/en-us/research/group/asia", "aff_unique_abbr": "Peking U;MSR Asia", "aff_campus_unique_index": "1", "aff_campus_unique": ";Asia", "aff_country_unique_index": "0;0", "aff_country_unique": "China" }, { "id": "2Pup7olzxj", "title": "Differentiable Optimization in Plane-Wave Density Functional Theory for Solid States", "track": "main", "status": "Reject", "tldr": "", "abstract": "Plane-wave density functional theory is a computational quantum mechanical modeling method used to investigate the electronic structure of solids. It employs plane-waves as the basis set for representing electronic wave functions and leverages density functional theory to compute the electronic structure properties of many-body systems. Traditionally, the Self-Consistent Field (SCF) method is predominantly adopted for optimization in current DFT computations. However, this method encounters notable convergence and computational challenges, and its iterative nature obstructs the incorporation of emergent deep learning enhancements. To address these challenges, we introduce a fully differentiable optimization method tailored to resolve the intrinsic challenges associated with the optimization of plane-wave density functional methods. This methodology includes a direct total energy minimization approach for solving Kohn-Sham equations in periodic crystalline systems, which is coherent with deep learning infrastructures. The efficacy of our approach is illustrated through its two applications in solid-state physics: electron band structure prediction and geometry optimization. Our enhancements potentially pave the way for various gradient-based applications within deep learning paradigms in solid-state physics, extending the boundaries of material innovation and design. We illustrate the utility and diverse applications of our method on real crystal structures and compare its effectiveness with several established SCF-based packages, demonstrating its accuracy and robust convergence property.", "keywords": "AI for Science;Quantum Chemisty;Density Functional Theory;Deep Learning;Kohn-Sham Equation;Solid-State Physics", "primary_area": "applications to physical sciences (physics, chemistry, biology, etc.)", "supplementary_material": "", "author": "Tianbo Li;Stephen Gregory Dale;Zekun Shi;Jingshu Li;Giovanni Vignale;A. H. Castro Neto;Kostya S. 
Novoselov;Min Lin", "authorids": "~Tianbo_Li1;~Stephen_Gregory_Dale1;~Zekun_Shi3;~Jingshu_Li1;~Giovanni_Vignale1;~A._H._Castro_Neto1;~Kostya_S._Novoselov1;~Min_Lin1", "gender": "M;Not Specified;M;M;M;M;M;M", "homepage": ";https://ifim.nus.edu.sg/people/stephen-dale/;https://jasonleejsl.github.io/;;https://graphene.nus.edu.sg/blog/peoples/antonio-castro-neto/;https://ifim.nus.edu.sg/;https://linmin.me;https://zekun-shi.github.io/", "dblp": "153/7013;;;;;;;", "google_scholar": ";gS3ihw0AAAAJ;;;4kNDbNEAAAAJ;;BGONmkIAAAAJ;X9vcv1oAAAAJ", "orcid": ";0000-0002-6867-711X;0009-0006-1576-8487;0000-0003-3851-5790;0000-0003-0613-4010;;;", "linkedin": ";;;;https://sg.linkedin.com/in/antonio-h-castro-neto-ba8187ab;;min-lin-08a3a422/;", "or_profile": "~Tianbo_Li1;~Stephen_Gregory_Dale1;~Jingshu_Li1;~Giovanni_Vignale1;~A._H._Castro_Neto1;~Kostya_S._Novoselov1;~Min_Lin1;~ZEKUN_SHI2", "aff": "Sea AI Lab;;National University of Singapore;National University of Singapore;;;Sea AI Lab;Sea AI Lab", "aff_domain": "sea.com;;u.nus.edu;nus.edu;;;sea.com;sea.com", "position": "Researcher;;PhD student;Researcher;;;Principal Researcher;Researcher", "bibtex": "@misc{\nli2024differentiable,\ntitle={Differentiable Optimization in Plane-Wave Density Functional Theory for Solid States},\nauthor={Tianbo Li and Stephen Gregory Dale and Zekun Shi and Jingshu Li and Giovanni Vignale and A. H. Castro Neto and Kostya S. Novoselov and Min Lin},\nyear={2024},\nurl={https://openreview.net/forum?id=2Pup7olzxj}\n}", "github": "", "project": "", "reviewers": "Arv3;Npa9;AFLR;TgFK", "site": "https://openreview.net/forum?id=2Pup7olzxj", "pdf_size": 2235674, "rating": "3;5;5;6", "confidence": "3;4;3;2", "soundness": "3;2;3;4", "contribution": "3;2;3;3", "presentation": "3;3;3;4", "wc_summary": "208;55;131;124", "wc_strengths": "22;97;179;113", "wc_weaknesses": "108;546;71;111", "wc_questions": "125;98;91;13", "wc_review": "463;796;472;361", "wc_reply_reviewers": "0;35;21;0", "wc_reply_authors": "1365;1081;992;411", "reply_reviewers": "0;1;1;0", "reply_authors": "2;2;3;1", "rating_avg": [ 4.75, 1.0897247358851685 ], "confidence_avg": [ 3.0, 0.7071067811865476 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 129.5, 54.18717560456533 ], "wc_strengths_avg": [ 102.75, 55.840733340456765 ], "wc_weaknesses_avg": [ 209.0, 195.20373971827487 ], "wc_questions_avg": [ 81.75, 41.67358275934528 ], "wc_review_avg": [ 523.0, 163.53440005087614 ], "wc_reply_reviewers_avg": [ 14.0, 14.849242404917497 ], "wc_reply_authors_avg": [ 962.25, 346.796319905503 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 2.0, 0.7071067811865476 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": -0.3244428422615251, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:To3QkK3nRmcJ:scholar.google.com/&scioq=Differentiable+Optimization+in+Plane-Wave+Density+Functional+Theory+for+Solid+States&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1;1;0;0", "aff_unique_norm": "Sea AI Lab;National University of Singapore", "aff_unique_dep": ";", "aff_unique_url": ";https://www.nus.edu.sg", "aff_unique_abbr": ";NUS", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "1;1", "aff_country_unique": ";Singapore" }, { "title": "GOAt: Explaining Graph Neural Networks via Graph Output Attribution", "status": "Poster", "track": "main", "site": 
"https://iclr.cc/virtual/2024/poster/19551", "id": "2Q8TZWAHv4", "author_site": "Shengyao Lu, Keith G Mills, Jiao He, Bang Liu, Di Niu", "tldr": "", "abstract": "Understanding the decision-making process of Graph Neural Networks (GNNs) is crucial to their interpretability. Most existing methods for explaining GNNs typically rely on training auxiliary models, resulting in the explanations remain black-boxed. This paper introduces Graph Output Attribution (GOAt), a novel method to attribute graph outputs to input graph features, creating GNN explanations that are faithful, discriminative, as well as stable across similar samples. By expanding the GNN as a sum of scalar products involving node features, edge features and activation patterns, we propose an efficient analytical method to compute contribution of each node or edge feature to each scalar product and aggregate the contributions from all scalar products in the expansion form to derive the importance of each node and edge. Through extensive experiments on synthetic and real-world data, we show that our method not only outperforms various state-of-the-art GNN explainers in terms of the commonly used fidelity metric, but also exhibits stronger discriminability, and stability by a remarkable margin.", "keywords": "Graph Neural Networks;Explainability;Interpretability;Local-level explanation;Instance-level explanation", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/f5a45077f8cd166ffe99911b9a864127c65a66ea.zip", "author": "Shengyao Lu;Keith G. Mills;Jiao He;Bang Liu;Di Niu", "authorids": "~Shengyao_Lu1;~Keith_G._Mills1;~Jiao_He1;~Bang_Liu1;~Di_Niu1", "gender": "F;M;M;M;M", "homepage": "https://sluxsr.github.io/;https://kgmills.github.io/;https://github.com/JonHe878;http://www-labs.iro.umontreal.ca/~liubang/;https://www.ualberta.ca/~dniu", "dblp": "320/4184;299/5864;;;82/4953", "google_scholar": "https://scholar.google.ca/citations?user=MSsab9EAAAAJ;CBOD_ngAAAAJ;;lmfAnP4AAAAJ;https://scholar.google.ca/citations?user=3kC5OogAAAAJ", "orcid": ";0000-0001-6054-1798;;0000-0002-9483-8984;0000-0002-5250-7327", "linkedin": ";kgmills/;;bang-liu-12b66789/?originalSubdomain=ca;", "or_profile": "~Shengyao_Lu1;~Keith_G._Mills1;~Jiao_He1;~Bang_Liu1;~Di_Niu1", "aff": "University of Alberta;Huawei Technologies Ltd.;huawei;University of Montreal;University of Alberta", "aff_domain": "ualberta.ca;huawei.com;huawei.com;umontreal.ca;ualberta.ca", "position": "PhD student;Research Intern;Chief engineer;Assistant Professor;Full Professor", "bibtex": "@inproceedings{\nlu2024goat,\ntitle={{GOA}t: Explaining Graph Neural Networks via Graph Output Attribution},\nauthor={Shengyao Lu and Keith G. 
Mills and Jiao He and Bang Liu and Di Niu},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=2Q8TZWAHv4}\n}", "github": "", "project": "", "reviewers": "cqeJ;nBUo;PCGE;8TnY", "pdf_size": 2269280, "rating": "5;6;6;8", "confidence": "4;5;2;3", "soundness": "3;3;3;2", "contribution": "2;3;3;2", "presentation": "3;2;2;2", "wc_summary": "51;61;47;145", "wc_strengths": "33;72;29;61", "wc_weaknesses": "187;100;28;43", "wc_questions": "5;5;5;102", "wc_review": "276;238;109;351", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "671;750;309;319", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 6.25, 1.0897247358851685 ], "confidence_avg": [ 3.5, 1.118033988749895 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 76.0, 40.162171256046406 ], "wc_strengths_avg": [ 48.75, 18.226011631731172 ], "wc_weaknesses_avg": [ 89.5, 62.37186865887537 ], "wc_questions_avg": [ 29.25, 42.00223208354527 ], "wc_review_avg": [ 243.5, 87.65414993027997 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 512.25, 200.2390758568367 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 10, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.30779350562554625, "gs_citation": 10, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=13711532416544159943&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=2Q8TZWAHv4", "pdf": "https://openreview.net/pdf?id=2Q8TZWAHv4", "email": "ualberta.ca;huawei.com;huawei.com;umontreal.ca;ualberta.ca", "author_num": 5, "aff_unique_index": "0;1;1;2;0", "aff_unique_norm": "University of Alberta;Huawei;University of Montreal", "aff_unique_dep": ";Huawei Technologies;", "aff_unique_url": "https://www.ualberta.ca;https://www.huawei.com;https://wwwumontreal.ca", "aff_unique_abbr": "UAlberta;Huawei;UM", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;1;0;0", "aff_country_unique": "Canada;China" }, { "id": "2RGQwJEcAC", "title": "Visual Transformer with Differentiable Channel Selection: An Information Bottleneck Inspired Approach", "track": "main", "status": "Reject", "tldr": "", "abstract": "Self-attention and transformers have been widely used in deep learning. Recent efforts have been devoted to incorporating transformer blocks into different types of neural architectures, including those with convolutions, leading to various visual transformers for computer vision tasks. In this paper, we propose a novel and compact transformer block, Transformer with Differentiable Channel Selection, or DCS-Transformer. DCS-Transformer features channel selection in the computation of the attention weights and the input/output features of the MLP in the transformer block. Our DCS-Transformer is compatible with many popular and compact transformer networks, such as MobileViT and EfficientViT, and it reduces the FLOPs of the visual transformers while maintaining or even improving the prediction accuracy. In the experiments, we replace all the transformer blocks in MobileViT and EfficientViT with DCS-Transformer blocks, leading to DCS-Transformer networks with different backbones. 
The DCS-Transformer is motivated by reduction of Information Bottleneck, and a novel upper bound for the IB which can be optimized by SGD is derived and incorporated into the training loss of the network with DCS-Transformer. Extensive results on image classification and object detection evidence that DCS-Transformer renders compact and efficient visual transformers with comparable or much better prediction accuracy than the original visual transformers. The code of DCS-Transformer is available at \\url{https://anonymous.4open.science/r/IB-DCS-ViT-273C/}.", "keywords": "Differentiable Channel Selection;Information Bottleneck;Image Classification", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Yancheng Wang;Ping Li;Yingzhen Yang", "authorids": "~Yancheng_Wang2;~Ping_Li3;~Yingzhen_Yang1", "gender": "M;M;M", "homepage": ";http://www.stat.rutgers.edu/home/pingli/;http://yingzhenyang.com", "dblp": ";62/5860-1;66/3838.html", "google_scholar": "https://scholar.google.com/citations?hl=en;;", "orcid": ";;", "linkedin": ";;yingzhen-yang-9b869122", "or_profile": "~Yancheng_Wang2;~Ping_Li3;~Yingzhen_Yang1", "aff": "Arizona State University;LinkedIn;Arizona State University", "aff_domain": "asu.edu;linkedin.com;asu.edu", "position": "PhD student;Engineer;Assistant Professor", "bibtex": "@misc{\nwang2024visual,\ntitle={Visual Transformer with Differentiable Channel Selection: An Information Bottleneck Inspired Approach},\nauthor={Yancheng Wang and Ping Li and Yingzhen Yang},\nyear={2024},\nurl={https://openreview.net/forum?id=2RGQwJEcAC}\n}", "github": "", "project": "", "reviewers": "wQJ5;Q1sT;JKXw", "site": "https://openreview.net/forum?id=2RGQwJEcAC", "pdf_size": 7064627, "rating": "5;6;6", "confidence": "4;5;3", "soundness": "3;3;3", "contribution": "2;3;3", "presentation": "3;3;2", "wc_summary": "136;62;85", "wc_strengths": "17;63;71", "wc_weaknesses": "347;75;230", "wc_questions": "2;2;13", "wc_review": "502;202;399", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "1381;532;1469", "reply_reviewers": "0;0;0", "reply_authors": "2;1;2", "rating_avg": [ 5.666666666666667, 0.4714045207910317 ], "confidence_avg": [ 4.0, 0.816496580927726 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 94.33333333333333, 30.922843048824312 ], "wc_strengths_avg": [ 50.333333333333336, 23.79542439676633 ], "wc_weaknesses_avg": [ 217.33333333333334, 111.40416908217075 ], "wc_questions_avg": [ 5.666666666666667, 5.185449728701348 ], "wc_review_avg": [ 367.6666666666667, 124.4623994983581 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 1127.3333333333333, 422.49444440791825 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.6666666666666667, 0.4714045207910317 ], "replies_avg": [ 10, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:r-UPoEdjLugJ:scholar.google.com/&scioq=Visual+Transformer+with+Differentiable+Channel+Selection:+An+Information+Bottleneck+Inspired+Approach&hl=en&as_sdt=0,5", "gs_version_total": 6, "aff_unique_index": "0;1;0", "aff_unique_norm": "Arizona State University;LinkedIn Corporation", "aff_unique_dep": ";", "aff_unique_url": "https://www.asu.edu;https://www.linkedin.com", "aff_unique_abbr": "ASU;LinkedIn", "aff_campus_unique_index": "", 
"aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "2RJAzSphy9", "title": "Sample Efficient Reinforcement Learning from Human Feedback via Active Exploration", "track": "main", "status": "Reject", "tldr": "", "abstract": "Preference-based feedback is important for many applications in reinforcement learning where direct evaluation of a reward function is not feasible. A notable recent example arises in reinforcement learning from human feedback (RLHF) on large language models. For many applications of RLHF, the cost of acquiring the human feedback can be substantial. In this work, we take advantage of the fact that one can often choose contexts at which to obtain human feedback in order to most efficiently identify a good policy, and formalize this as an *offline contextual dueling bandit* problem. We give an upper-confidence-bound style algorithm for this problem and prove a polynomial worst-case regret bound. We then provide empirical confirmation in a synthetic setting that our approach outperforms existing methods. After, we extend the setting and methodology for practical use in RLHF training of large language models. Here, our method is able to reach better performance with fewer samples of human preferences than multiple baselines on three real-world datasets.", "keywords": "reinforcement learning;LLMs;contextual bandits;RLHF;exploration", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/3969dbbf0d8f0b1e2cf43c14be805bc3e043ae2e.zip", "author": "Viraj Mehta;Vikramjeet Das;Ojash Neopane;Yijia Dai;Ilija Bogunovic;Jeff Schneider;Willie Neiswanger", "authorids": "~Viraj_Mehta1;~Vikramjeet_Das1;~Ojash_Neopane1;~Yijia_Dai1;~Ilija_Bogunovic2;~Jeff_Schneider1;~Willie_Neiswanger2", "gender": "M;M;M;F;;M;M", "homepage": "http://virajm.com;;https://oneopane.github.io/;https://daiyijia02.github.io;https://www.cs.cmu.edu/~schneide;https://willieneis.github.io/;http://ilijabogunovic.com/", "dblp": "https://dblp.org/pers/m/Mehta:Viraj.html;323/0004;176/5399.html;;38/247;120/7593.html;142/2725", "google_scholar": "4pHjHBkAAAAJ;https://scholar.google.com/citations?hl=en;lmAQ1l8AAAAJ;https://scholar.google.com/citations?hl=en;3bSbb20AAAAJ;QwKHApEAAAAJ;xMvt3NEAAAAJ", "orcid": "0000-0002-2021-9718;0000-0001-8292-6752;;;0000-0002-5080-9073;;", "linkedin": "virajrmehta/;linkedin.com/in/vikramjeetd;;yijia-dai/;jeff-schneider-1593b322/;;", "or_profile": "~Viraj_Mehta1;~Vikramjeet_Das1;~Ojash_Neopane1;~Yijia_Dai1;~Jeff_Schneider1;~Willie_Neiswanger2;~Ilija_Bogunovic1", "aff": "Carnegie Mellon University;Carnegie Mellon University;Carnegie Mellon University;Cornell University;Carnegie Mellon University;University of Southern California;Swiss Federal Institute of Technology", "aff_domain": "cmu.edu;andrew.cmu.edu;cmu.edu;cornell.edu;cs.cmu.edu;usc.edu;ethz.ch", "position": "PhD student;MS student;PhD student;Undergrad student;Researcher;Assistant Professor;Postdoc", "bibtex": "@misc{\nmehta2024sample,\ntitle={Sample Efficient Reinforcement Learning from Human Feedback via Active Exploration},\nauthor={Viraj Mehta and Vikramjeet Das and Ojash Neopane and Yijia Dai and Ilija Bogunovic and Jeff Schneider and Willie Neiswanger},\nyear={2024},\nurl={https://openreview.net/forum?id=2RJAzSphy9}\n}", "github": "", "project": "", "reviewers": "aHAt;NrDs;vRQm;7uH1;DPyN", "site": "https://openreview.net/forum?id=2RJAzSphy9", "pdf_size": 2399934, "rating": "3;5;5;5;6", "confidence": "5;3;3;2;2", "soundness": "2;3;3;2;3", 
"contribution": "2;2;2;2;3", "presentation": "2;3;3;3;3", "wc_summary": "389;71;86;50;50", "wc_strengths": "2;30;37;33;20", "wc_weaknesses": "2;92;309;78;119", "wc_questions": "2;239;5;3;51", "wc_review": "395;432;437;164;240", "wc_reply_reviewers": "0;0;0;0;0", "wc_reply_authors": "909;528;486;538;351", "reply_reviewers": "0;0;0;0;0", "reply_authors": "2;1;1;1;1", "rating_avg": [ 4.8, 0.9797958971132712 ], "confidence_avg": [ 3.0, 1.0954451150103321 ], "soundness_avg": [ 2.6, 0.4898979485566356 ], "contribution_avg": [ 2.2, 0.39999999999999997 ], "presentation_avg": [ 2.8, 0.39999999999999997 ], "wc_summary_avg": [ 129.2, 130.60995367888316 ], "wc_strengths_avg": [ 24.4, 12.531560158256434 ], "wc_weaknesses_avg": [ 120.0, 102.17044582461212 ], "wc_questions_avg": [ 60.0, 91.3892772703669 ], "wc_review_avg": [ 333.6, 111.05782277714614 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 562.4, 185.7079427488227 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.2, 0.4000000000000001 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.9316949906249125, "gs_citation": 6, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6091476061033864192&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "aff_unique_index": "0;0;0;1;0;2;3", "aff_unique_norm": "Carnegie Mellon University;Cornell University;University of Southern California;Swiss Federal Institute of Technology", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.cmu.edu;https://www.cornell.edu;https://www.usc.edu;https://www.ethz.ch", "aff_unique_abbr": "CMU;Cornell;USC;ETH Zurich", "aff_campus_unique_index": "1", "aff_campus_unique": ";Los Angeles", "aff_country_unique_index": "0;0;0;0;0;0;1", "aff_country_unique": "United States;Switzerland" }, { "title": "Time Travel in LLMs: Tracing Data Contamination in Large Language Models", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19550", "id": "2Rwq6c3tvr", "author_site": "Shahriar Golchin, Mihai Surdeanu", "tldr": "", "abstract": "Data contamination, i.e., the presence of test data from downstream tasks in the training data of large language models (LLMs), is a potential major issue in measuring LLMs' real effectiveness on other tasks. We propose a straightforward yet effective method for identifying data contamination within LLMs. At its core, our approach starts by identifying potential contamination at the instance level; using this information, our approach then assesses wider contamination at the partition level. To estimate contamination of individual instances, we employ \"guided instruction:\" a prompt consisting of the dataset name, partition type, and the random-length initial segment of a reference instance, asking the LLM to complete it. An instance is flagged as contaminated if the LLM's output either exactly or nearly matches the latter segment of the reference. To understand if an entire partition is contaminated, we propose two ideas. The first idea marks a dataset partition as contaminated if the average overlap score with the reference instances (as measured by ROUGE-L or BLEURT) is statistically significantly better with the completions from guided instruction compared to a \"general instruction\" that does not include the dataset and partition name. 
The second idea marks a dataset partition as contaminated if a classifier based on GPT-4 with few-shot in-context learning prompt marks multiple generated completions as exact/near-exact matches of the corresponding reference instances. Our best method achieves an accuracy between 92% and 100% in detecting if an LLM is contaminated with seven datasets, containing train and test/validation partitions, when contrasted with manual evaluation by human experts. Further, our findings indicate that GPT-4 is contaminated with AG News, WNLI, and XSum datasets.", "keywords": "Data Contamination;Large Language Models (LLMs);Guided Instruction;Memorization", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Shahriar Golchin;Mihai Surdeanu", "authorids": "~Shahriar_Golchin1;~Mihai_Surdeanu1", "gender": "M;", "homepage": ";http://surdeanu.info/mihai/", "dblp": ";18/3479", "google_scholar": "iBl-Yc8AAAAJ;https://scholar.google.com/citations?hl=en", "orcid": ";", "linkedin": "shahriar-golchin;", "or_profile": "~Shahriar_Golchin1;~Mihai_Surdeanu1", "aff": "University of Arizona;University of Arizona", "aff_domain": "arizona.edu;arizona.edu", "position": "PhD student;Full Professor", "bibtex": "@inproceedings{\ngolchin2024time,\ntitle={Time Travel in {LLM}s: Tracing Data Contamination in Large Language Models},\nauthor={Shahriar Golchin and Mihai Surdeanu},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=2Rwq6c3tvr}\n}", "github": "", "project": "", "reviewers": "NUVj;HqCE;KgsM;6REU", "pdf_size": 259469, "rating": "6;6;8;8", "confidence": "3;4;3;2", "soundness": "3;2;3;3", "contribution": "2;3;3;3", "presentation": "3;3;3;3", "wc_summary": "63;94;93;120", "wc_strengths": "51;13;122;37", "wc_weaknesses": "88;284;19;110", "wc_questions": "101;2;38;94", "wc_review": "303;393;272;361", "wc_reply_reviewers": "0;32;0;168", "wc_reply_authors": "768;1196;368;955", "reply_reviewers": "0;1;0;2", "reply_authors": "1;2;1;2", "rating_avg": [ 7.0, 1.0 ], "confidence_avg": [ 3.0, 0.7071067811865476 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 92.5, 20.180436070610565 ], "wc_strengths_avg": [ 55.75, 40.59171713539598 ], "wc_weaknesses_avg": [ 125.25, 97.60987398823953 ], "wc_questions_avg": [ 58.75, 40.861809798392436 ], "wc_review_avg": [ 332.25, 47.441411235333206 ], "wc_reply_reviewers_avg": [ 50.0, 69.3685807840985 ], "wc_reply_authors_avg": [ 821.75, 302.7361681398508 ], "reply_reviewers_avg": [ 0.75, 0.82915619758885 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.7071067811865475, "gs_citation": 143, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=3876183311628258637&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=2Rwq6c3tvr", "pdf": "https://openreview.net/pdf?id=2Rwq6c3tvr", "email": "arizona.edu;arizona.edu", "author_num": 2, "aff_unique_index": "0;0", "aff_unique_norm": "University of Arizona", "aff_unique_dep": "", "aff_unique_url": "https://www.arizona.edu", "aff_unique_abbr": "UA", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "id": "2SuA42Mq1c", "title": "BMAD: Benchmarks for Medical Anomaly Detection", 
"track": "main", "status": "Reject", "tldr": "", "abstract": "Anomaly detection (AD) is a fundamental research problem in machine learning and computer vision, with practical applications in industrial inspection, video surveillance, and medical diagnosis. In medical imaging, AD is especially vital for identifying anomalies that may indicate rare diseases or conditions. Despite its significance, there is a lack of a universal and fair benchmark for evaluating AD methods on medical images, which hinders the development of more generalized and robust AD methods in this specific domain. To bridge this gap, we introduce a comprehensive evaluation benchmark for assessing AD methods on medical images. This benchmark encompasses six reorganized datasets from five medical domains (i.e. brain MRI, liver CT, retinal OCT, chest X-ray, and digital histopathology) and three key evaluation metrics, and includes a total of fifteen state-of-the-art AD algorithms. This standardized and well-curated medical benchmark with the well-structured codebase enables comprehensive comparisons among recently proposed anomaly detection methods. It will facilitate the community to conduct a fair comparison and advance the field of AD on medical imaging.", "keywords": "Anomaly detection;Medical benchmarks", "primary_area": "datasets and benchmarks", "supplementary_material": "", "author": "Jinan Bao;Hanshi Sun;Hanqiu Deng;Yinsheng He;Zhaoxiang Zhang;Xingyu Li", "authorids": "~Jinan_Bao1;~Hanshi_Sun1;~Hanqiu_Deng1;~Yinsheng_He1;~Zhaoxiang_Zhang4;~Xingyu_Li3", "gender": "F;M;M;M;M;", "homepage": "https://apps.ualberta.ca/directory/person/jbao1;https://preminstrel.com/;;;;https://apps.ualberta.ca/directory/person/xingyu", "dblp": ";314/7377.html;298/6509;;;", "google_scholar": ";BjQHEh8AAAAJ;nmNQjgIAAAAJ;;;V8OICzYAAAAJ", "orcid": ";0009-0005-4436-234X;;;;", "linkedin": ";hanshi-sun-5b74b8228/;;yinsheng-he-ab90b3183/?originalSubdomain=ca;zhaoxiangzhangnonozz/;", "or_profile": "~Jinan_Bao1;~Hanshi_Sun1;~Hanqiu_Deng1;~Yinsheng_He1;~Zhaoxiang_Zhang4;~Xingyu_Li3", "aff": "University of Alberta;Carnegie Mellon University;University of Alberta;University of Alberta;;University of Alberta", "aff_domain": "ualberta.ca;cmu.edu;ualberta.ca;ualberta.ca;;ualberta.ca", "position": "MS student;MS student;PhD student;PhD student;;Assistant Professor", "bibtex": "@misc{\nbao2024bmad,\ntitle={{BMAD}: Benchmarks for Medical Anomaly Detection},\nauthor={Jinan Bao and Hanshi Sun and Hanqiu Deng and Yinsheng He and Zhaoxiang Zhang and Xingyu Li},\nyear={2024},\nurl={https://openreview.net/forum?id=2SuA42Mq1c}\n}", "github": "", "project": "", "reviewers": "csZB;jY9s;Y82y;SMmX", "site": "https://openreview.net/forum?id=2SuA42Mq1c", "pdf_size": 28467196, "rating": "3;3;5;6", "confidence": "4;4;4;3", "soundness": "4;2;2;3", "contribution": "2;1;2;3", "presentation": "3;2;2;3", "wc_summary": "63;81;59;27", "wc_strengths": "23;27;205;20", "wc_weaknesses": "21;73;248;35", "wc_questions": "127;1;28;121", "wc_review": "234;182;540;203", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "339;261;194;116", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 4.25, 1.299038105676658 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.82915619758885 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 57.5, 19.461500456028563 ], "wc_strengths_avg": [ 68.75, 78.7031606735079 ], "wc_weaknesses_avg": [ 94.25, 90.78374028426015 ], "wc_questions_avg": [ 69.25, 
55.616431924387236 ], "wc_review_avg": [ 289.75, 145.6612079450119 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 227.5, 82.32405480781422 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 10, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.7777777777777777, "gs_citation": 40, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10416728347596820430&as_sdt=40005&sciodt=0,10&hl=en", "gs_version_total": 7, "aff_unique_index": "0;1;0;0;0", "aff_unique_norm": "University of Alberta;Carnegie Mellon University", "aff_unique_dep": ";", "aff_unique_url": "https://www.ualberta.ca;https://www.cmu.edu", "aff_unique_abbr": "UAlberta;CMU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;0;0;0", "aff_country_unique": "Canada;United States" }, { "title": "Towards Offline Opponent Modeling with In-context Learning", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19549", "id": "2SwHngthig", "author_site": "Yuheng Jing, Kai Li, Bingyun Liu, Yifan Zang, Haobo Fu, QIANG FU, Junliang Xing, Jian Cheng", "tldr": "", "abstract": "Opponent modeling aims at learning the opponent's behaviors, goals, or beliefs to reduce the uncertainty of the competitive environment and assist decision-making. Existing work has mostly focused on learning opponent models online, which is impractical and inefficient in practical scenarios. To this end, we formalize an Offline Opponent Modeling (OOM) problem with the objective of utilizing pre-collected offline datasets to learn opponent models that characterize the opponent from the viewpoint of the controlled agent, which aids in adapting to the unknown fixed policies of the opponent. Drawing on the promises of the Transformers for decision-making, we introduce a general approach, Transformer Against Opponent (TAO), for OOM. Essentially, TAO tackles the problem by harnessing the full potential of the supervised pre-trained Transformers' in-context learning capabilities. The foundation of TAO lies in three stages: an innovative offline policy embedding learning stage, an offline opponent-aware response policy training stage, and a deployment stage for opponent adaptation with in-context learning. Theoretical analysis establishes TAO's equivalence to Bayesian posterior sampling in opponent modeling and guarantees TAO's convergence in opponent policy recognition. Extensive experiments and ablation studies on competitive environments with sparse and dense rewards demonstrate the impressive performance of TAO. 
Our approach manifests remarkable prowess for fast adaptation, especially in the face of unseen opponent policies, confirming its in-context learning potency.", "keywords": "Opponent Modeling;Offline;Transformer", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/ea211856fbe4c2b8d7cb871c578d530ac4bcec5c.zip", "author": "Yuheng Jing;Kai Li;Bingyun Liu;Yifan Zang;Haobo Fu;QIANG FU;Junliang Xing;Jian Cheng", "authorids": "~Yuheng_Jing1;~Kai_Li2;~Bingyun_Liu1;~Yifan_Zang1;~Haobo_Fu2;~QIANG_FU8;~Junliang_Xing1;~Jian_Cheng7", "gender": "M;M;M;M;M;M;M;", "homepage": ";;;;;http://people.ucas.ac.cn/~jlxing?language=en;https://people.ucas.ac.cn/~chengjian?language=en;https://github.com/liuby26", "dblp": "382/3906;181/2853;269/4608;85/8571;;43/7659.html;14/6145-1;", "google_scholar": ";_cY_PXgAAAAJ;;LFdJXNcAAAAJ;gANaxT0AAAAJ;jSwNd3MAAAAJ;ZGCIUJ8AAAAJ;", "orcid": ";;;;;0000-0001-6801-0510;0000-0003-1289-2758;", "linkedin": "jingyuheng;;;haobo-fu-382b0784/;;https://www.linkedin.cn/incareer/in/ACoAAAvlU14B40ZWH1pxg5JJDtQ6LlgMYkp0e5s;;", "or_profile": "~Yuheng_Jing1;~Kai_Li2;~Yifan_Zang1;~Haobo_Fu2;~QIANG_FU8;~Junliang_Xing1;~Jian_Cheng7;~Liu_Bingyun1", "aff": "Institute of Automation, Chinese Academy of Sciences;Institute of Automation, Chinese Academy of Sciences;University of Chinese Academy of Sciences;Tencent AI Lab;Tencent AI Lab;Tsinghua University;Institute of Automation, Chinese Academy of Sciences;Institute of Automation, Chinese Academy of Sciences", "aff_domain": "ia.ac.cn;ia.ac.cn;ucas.ac.cn;tencent.com;tencent.com;tsinghua.edu.cn;ia.ac.cn;ia.ac.cn", "position": "PhD student;Associate Professor;PhD student;Principal Researcher;Principal Researcher;Full Professor;Full Professor;MS student", "bibtex": "@inproceedings{\njing2024towards,\ntitle={Towards Offline Opponent Modeling with In-context Learning},\nauthor={Yuheng Jing and Kai Li and Bingyun Liu and Yifan Zang and Haobo Fu and QIANG FU and Junliang Xing and Jian Cheng},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=2SwHngthig}\n}", "github": "", "project": "", "reviewers": "fLaD;F2KT;Z2nF;QAav", "pdf_size": 1562635, "rating": "5;6;6;6", "confidence": "3;3;4;4", "soundness": "1;2;3;3", "contribution": "2;2;2;3", "presentation": "1;2;3;2", "wc_summary": "120;83;114;98", "wc_strengths": "78;90;23;68", "wc_weaknesses": "267;252;61;188", "wc_questions": "17;805;274;45", "wc_review": "482;1230;472;399", "wc_reply_reviewers": "48;503;191;0", "wc_reply_authors": "1711;4570;2118;1140", "reply_reviewers": "1;1;2;0", "reply_authors": "4;8;6;4", "rating_avg": [ 5.75, 0.4330127018922193 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.25, 0.82915619758885 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.0, 0.7071067811865476 ], "wc_summary_avg": [ 103.75, 14.428704030508076 ], "wc_strengths_avg": [ 64.75, 25.33155147242269 ], "wc_weaknesses_avg": [ 192.0, 81.24346127535433 ], "wc_questions_avg": [ 285.25, 316.20592578255076 ], "wc_review_avg": [ 645.75, 338.83504467513393 ], "wc_reply_reviewers_avg": [ 185.5, 196.31161453159106 ], "wc_reply_authors_avg": [ 2384.75, 1308.6075376139327 ], "reply_reviewers_avg": [ 1.0, 0.7071067811865476 ], "reply_authors_avg": [ 5.5, 1.6583123951777 ], "replies_avg": [ 32, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": 0.5773502691896257, "gs_citation": 5, "gs_cited_by_link": 
"https://scholar.google.com/scholar?cites=9282177930204355332&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 2, "openreview": "https://openreview.net/forum?id=2SwHngthig", "pdf": "https://openreview.net/pdf?id=2SwHngthig", "email": "ia.ac.cn;ia.ac.cn;ucas.ac.cn;tencent.com;tencent.com;tsinghua.edu.cn;ia.ac.cn;ia.ac.cn", "author_num": 8, "aff_unique_index": "0;0;1;2;2;3;0;0", "aff_unique_norm": "Chinese Academy of Sciences;University of Chinese Academy of Sciences;Tencent;Tsinghua University", "aff_unique_dep": "Institute of Automation;;Tencent AI Lab;", "aff_unique_url": "http://www.ia.cas.cn;http://www.ucas.ac.cn;https://ai.tencent.com;https://www.tsinghua.edu.cn", "aff_unique_abbr": "CAS;UCAS;Tencent AI Lab;THU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0;0;0", "aff_country_unique": "China" }, { "id": "2TFfLiTGBS", "title": "DART: A Principled Approach to Adversarially Robust Unsupervised Domain Adaptation", "track": "main", "status": "Reject", "tldr": "", "abstract": "Distribution shifts and adversarial examples are two major challenges for deploying machine learning models. While these challenges have been studied individually, their combination is an important topic that remains relatively under-explored. In this work, we study the problem of adversarial robustness under a common setting of distribution shift \u2013 unsupervised domain adaptation (UDA). Specifically, given a labeled source domain $\\mathcal{D}_S$ and an unlabeled target domain $\\mathcal{D}_T$ with related but different distributions, the goal is to obtain an adversarially robust model for $\\mathcal{D}_T$. The absence of target domain labels poses a unique challenge, as conventional adversarial robustness defenses cannot be directly applied to $\\mathcal{D}_T$. To address this challenge, we first establish a generalization bound for the adversarial target loss, which consists of (i) terms related to the loss on the data, and (ii) a measure of worst-case domain divergence. Motivated by this bound, we develop a novel unified defense framework called *Divergence Aware adveRsarial Training* (DART), which can be used in conjunction with a variety of standard UDA methods; e.g., DANN (Ganin & Lempitsky, 2015). DART is applicable to general threat models, including the popular $\\ell_p$-norm model, and does not require heuristic regularizers or architectural changes. We also release DomainRobust: a testbed for evaluating robustness of UDA models to adversarial attacks. DomainRobust consists of 4 multi-domain benchmark datasets (with 46 source-target pairs) and 7 meta-algorithms with a total of 11 variants. Our large-scale experiments demonstrate that on average, DART significantly enhances model robustness on all benchmarks compared to the state of the art, while maintaining competitive standard accuracy. 
The relative improvement in robustness from DART reaches up to 29.2% on the source-target domain pairs considered.", "keywords": "Unsupervised Domain Adaptation;Adversarial Robustness", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "/attachment/2b121ce5b467f20c612b9cac2cd9bc67cb561fcd.pdf", "author": "Yunjuan Wang;Hussein Hazimeh;Natalia Ponomareva;Alexey Kurakin;Ibrahim Hammoud;Raman Arora", "authorids": "~Yunjuan_Wang1;~Hussein_Hazimeh1;~Natalia_Ponomareva1;~Alexey_Kurakin1;~Ibrahim_Hammoud1;~Raman_Arora1", "gender": "F;;F;M;M;M", "homepage": "https://yunjuanwang.github.io/;http://www.mit.edu/~hazimeh;;http://kurakin.me;https://ibrahmd.github.io/;http://www.cs.jhu.edu/~raman/Home.html", "dblp": "31/560;165/0820-1;71/6768-1;56/9834;;", "google_scholar": "t_VSEEwAAAAJ;;eIdQR5oAAAAJ;nCh4qyMAAAAJ;KVsJ87cAAAAJ;Spe0xdkAAAAJ", "orcid": ";0000-0003-4501-0678;0009-0005-6761-1468;;;", "linkedin": "yunjuan-wang-12ab85169/;;;;;", "or_profile": "~Yunjuan_Wang1;~Hussein_Hazimeh1;~Natalia_Ponomareva1;~Alexey_Kurakin1;~Ibrahim_Hammoud1;~Raman_Arora1", "aff": "Johns Hopkins University;Google;Google;Research, Google;Google;Johns Hopkins University", "aff_domain": "jhu.edu;google.com;google.com;research.google.com;google.com;jhu.edu", "position": "PhD student;Research Scientist;Software Engineer in Research;Research Software Engineer;Researcher;Associate Professor", "bibtex": "@misc{\nwang2024dart,\ntitle={{DART}: A Principled Approach to Adversarially Robust Unsupervised Domain Adaptation},\nauthor={Yunjuan Wang and Hussein Hazimeh and Natalia Ponomareva and Alexey Kurakin and Ibrahim Hammoud and Raman Arora},\nyear={2024},\nurl={https://openreview.net/forum?id=2TFfLiTGBS}\n}", "github": "", "project": "", "reviewers": "vW45;ag53;d4Ff;qNjr", "site": "https://openreview.net/forum?id=2TFfLiTGBS", "pdf_size": 686187, "rating": "3;3;6;6", "confidence": "4;5;3;3", "soundness": "1;2;2;3", "contribution": "2;1;2;3", "presentation": "2;2;3;3", "wc_summary": "74;59;49;65", "wc_strengths": "55;29;65;63", "wc_weaknesses": "307;145;84;105", "wc_questions": "29;1;5;32", "wc_review": "465;234;203;265", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "1342;317;1382;1072", "reply_reviewers": "0;0;0;0", "reply_authors": "3;2;5;4", "rating_avg": [ 4.5, 1.5 ], "confidence_avg": [ 3.75, 0.82915619758885 ], "soundness_avg": [ 2.0, 0.7071067811865476 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 61.75, 9.093266739736606 ], "wc_strengths_avg": [ 53.0, 14.352700094407323 ], "wc_weaknesses_avg": [ 160.25, 87.51392746300442 ], "wc_questions_avg": [ 16.75, 13.863170633011771 ], "wc_review_avg": [ 291.75, 102.39964599548183 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 1028.25, 427.6004998827761 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 3.5, 1.118033988749895 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.9045340337332909, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=4090061530743553470&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 3, "aff_unique_index": "0;1;1;1;1;0", "aff_unique_norm": "Johns Hopkins University;Google", "aff_unique_dep": ";Google", "aff_unique_url": "https://www.jhu.edu;https://www.google.com", "aff_unique_abbr": "JHU;Google", "aff_campus_unique_index": "1;1;1;1", "aff_campus_unique": ";Mountain View", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "United States" }, 
{ "id": "2TOcJivjpt", "title": "Poor Teaching: Explore and Question Knowledge Distillation under Distribution Shift", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Knowledge distillation techniques transfer knowledge from a complex or large learning model into a small model, and have made remarkable achievements in recent decades. However, few studies has investigated and explored the mechanism of the knowledge distillation against distribution shifts in real scenarios. In this paper, we reconsider the knowledge distillation paradigm under the shift situations, by reformulating the objectives of distillation with multiple domains. Under the novel paradigm, we propose a unified and systematic evaluation framework to benchmark knowledge distillation against two general distributional shifts including diversity and correlation shift. \nThe evaluation benchmark covers more than 20 methods from algorithmic, data-driven, and optimization perspectives for five benchmark datasets. Extensive experiments are constructed and some constructive findings are summarized to explain when and how the existing knowledge distillation methods work against distribution shifts.", "keywords": "Knowledge Distillation;Distribution Shift", "primary_area": "datasets and benchmarks", "supplementary_material": "/attachment/6693baad034702ac4a71dc4dfc60ffe0ea4ce3c3.zip", "author": "Songming Zhang;Ziyu Lyu;Xiaofeng Chen", "authorids": "~Songming_Zhang2;~Ziyu_Lyu1;~Xiaofeng_Chen5", "gender": "M;;M", "homepage": ";;", "dblp": "315/4171-2;;c/XiaofengChen9", "google_scholar": "ITQNuIIAAAAJ;;", "orcid": "0000-0001-7695-5880;;0000-0003-4062-4515", "linkedin": "songming-zhang-987589321/;;", "or_profile": "~Songming_Zhang2;~Ziyu_Lyu1;~Xiaofeng_Chen5", "aff": "Chongqing Jiaotong Universiity;;Chongqing Jiaotong Universiity", "aff_domain": "cqjtu.edu.cn;;cqjtu.edu.cn", "position": "MS student;;Full Professor", "bibtex": "@misc{\nzhang2024poor,\ntitle={Poor Teaching: Explore and Question Knowledge Distillation under Distribution Shift},\nauthor={Songming Zhang and Ziyu Lyu and Xiaofeng Chen},\nyear={2024},\nurl={https://openreview.net/forum?id=2TOcJivjpt}\n}", "github": "", "project": "", "reviewers": "Uh6z;ditG;Ywf2;m1kT", "site": "https://openreview.net/forum?id=2TOcJivjpt", "pdf_size": 750173, "rating": "1;3;3;5", "confidence": "5;5;4;3", "soundness": "2;2;1;3", "contribution": "1;2;2;2", "presentation": "1;3;2;3", "wc_summary": "100;52;58;69", "wc_strengths": "62;26;38;57", "wc_weaknesses": "442;229;287;233", "wc_questions": "3;3;2;6", "wc_review": "607;310;385;365", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 3.0, 1.4142135623730951 ], "confidence_avg": [ 4.25, 0.82915619758885 ], "soundness_avg": [ 2.0, 0.7071067811865476 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 2.25, 0.82915619758885 ], "wc_summary_avg": [ 69.75, 18.498310733685926 ], "wc_strengths_avg": [ 45.75, 14.49784466739798 ], "wc_weaknesses_avg": [ 297.75, 86.37527134544933 ], "wc_questions_avg": [ 3.5, 1.5 ], "wc_review_avg": [ 416.75, 113.22185080628209 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.8528028654224418, "gs_citation": 0, "gs_cited_by_link": 
"https://scholar.google.com/scholar?q=related:Ou7d6aYqByEJ:scholar.google.com/&scioq=Poor+Teaching:+Explore+and+Question+Knowledge+Distillation+under+Distribution+Shift&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "Chongqing Jiao Tong University", "aff_unique_dep": "", "aff_unique_url": "http://www.cqjtu.edu.cn", "aff_unique_abbr": "CQJTU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "China" }, { "id": "2UlfvGU6rL", "title": "Equivariant Graph Neural Operator for Modeling 3D Dynamics", "track": "main", "status": "Reject", "tldr": "", "abstract": "Modeling the complex three-dimensional (3D) dynamics of relational systems is an important problem in the natural sciences, with applications ranging from molecular simulations to particle mechanics. Machine learning methods have achieved good success by learning graph neural networks to model spatial interactions. However, these approaches do not faithfully capture temporal correlations since they only model next-step predictions. In this work, we propose Equivariant Graph Neural Operator (EGNO), a novel and principled method that directly models dynamics as trajectories instead of just as next-step prediction. Different from existing methods, EGNO explicitly learns the temporal evolution of 3D dynamics where we formulate the dynamics as a function over time and learn neural operators to approximate it. To capture the temporal correlations while keeping the intrinsic SE(3)-equivariance, we develop equivariant temporal convolutions parameterized in the Fourier space and build EGNO by stacking the Fourier layers over equivariant networks. Comprehensive experiments in multiple domains, including particle simulations, human motion capture, and molecular dynamics, demonstrate the significantly superior performance of EGNO against existing methods, thanks to the equivariant temporal modeling.", "keywords": "Equivariant Graph Neural Network;Neural Operator;3D Dynamics", "primary_area": "applications to physical sciences (physics, chemistry, biology, etc.)", "supplementary_material": "/attachment/32ad867085ddb16eb5fc67e72aca0bd98bf9f8d1.zip", "author": "Minkai Xu;Jiaqi Han;Aaron Lou;Kamyar Azizzadenesheli;Stefano Ermon;Anima Anandkumar", "authorids": "~Minkai_Xu1;~Jiaqi_Han2;~Aaron_Lou1;~Kamyar_Azizzadenesheli1;~Stefano_Ermon1;~Anima_Anandkumar1", "gender": "M;M;M;M;M;F", "homepage": "https://minkaixu.com;https://hanjq17.github.io;https://aaronlou.com;https://kamyar.page/;http://cs.stanford.edu/~ermon/;http://tensorlab.cms.caltech.edu/users/anima/", "dblp": "257/3355;235/0412;232/3858;176/5584;47/8135;", "google_scholar": "https://scholar.google.com/citations?hl=en;AKppgMAAAAAJ;;CxAS4SQAAAAJ;;bEcLezcAAAAJ", "orcid": ";;;;;", "linkedin": ";;;;;anima-anandkumar-35171b1/", "or_profile": "~Minkai_Xu1;~Jiaqi_Han2;~Aaron_Lou1;~Kamyar_Azizzadenesheli1;~Stefano_Ermon1;~anima_anandkumar1", "aff": "Stanford University;Computer Science Department, Stanford University;Stanford University;NVIDIA;Stanford University;California Institute of Technology", "aff_domain": "stanford.edu;cs.stanford.edu;stanford.edu;nvidia.com;stanford.edu;caltech.edu", "position": "PhD student;PhD student;PhD student;Researcher;Associate Professor;Full Professor", "bibtex": "@misc{\nxu2024equivariant,\ntitle={Equivariant Graph Neural Operator for Modeling 3D Dynamics},\nauthor={Minkai Xu and Jiaqi Han and Aaron Lou and Kamyar Azizzadenesheli and Stefano Ermon and Anima 
Anandkumar},\nyear={2024},\nurl={https://openreview.net/forum?id=2UlfvGU6rL}\n}", "github": "", "project": "", "reviewers": "kxN5;vFqH;mHw8;AtkK", "site": "https://openreview.net/forum?id=2UlfvGU6rL", "pdf_size": 3142918, "rating": "5;5;6;8", "confidence": "3;4;3;3", "soundness": "2;3;3;3", "contribution": "2;4;3;3", "presentation": "2;3;3;3", "wc_summary": "57;153;47;76", "wc_strengths": "51;43;81;118", "wc_weaknesses": "92;84;126;3", "wc_questions": "120;76;90;22", "wc_review": "320;356;344;219", "wc_reply_reviewers": "0;107;18;0", "wc_reply_authors": "1240;1312;944;101", "reply_reviewers": "0;1;1;0", "reply_authors": "3;3;3;1", "rating_avg": [ 6.0, 1.224744871391589 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 3.0, 0.7071067811865476 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 83.25, 41.595522595587134 ], "wc_strengths_avg": [ 73.25, 29.46502163583119 ], "wc_weaknesses_avg": [ 76.25, 45.135213525583325 ], "wc_questions_avg": [ 77.0, 35.510561809129406 ], "wc_review_avg": [ 309.75, 53.97395205096621 ], "wc_reply_reviewers_avg": [ 31.25, 44.347350540928595 ], "wc_reply_authors_avg": [ 899.25, 481.06100184903784 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 2.5, 0.8660254037844386 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.4714045207910316, "gs_citation": 20, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10943342957164133565&as_sdt=5,31&sciodt=0,31&hl=en", "gs_version_total": 10, "aff_unique_index": "0;0;0;1;0;2", "aff_unique_norm": "Stanford University;NVIDIA;California Institute of Technology", "aff_unique_dep": ";NVIDIA Corporation;", "aff_unique_url": "https://www.stanford.edu;https://www.nvidia.com;https://www.caltech.edu", "aff_unique_abbr": "Stanford;NVIDIA;Caltech", "aff_campus_unique_index": "0;0;0;0;2", "aff_campus_unique": "Stanford;;Pasadena", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "United States" }, { "title": "Unbalancedness in Neural Monge Maps Improves Unpaired Domain Translation", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19548", "id": "2UnCj3jeao", "author_site": "Luca Eyring, Dominik Klein, Th\u00e9o Uscidda, Giovanni Palla, Niki Kilbertus, Zeynep Akata, Fabian Theis", "tldr": "", "abstract": "In optimal transport (OT), a Monge map is known as a mapping that transports a source distribution to a target distribution in the most cost-efficient way. Recently, multiple neural estimators for Monge maps have been developed and applied in diverse unpaired domain translation tasks, e.g. in single-cell biology and computer vision. However, the classic OT framework enforces mass conservation, which\nmakes it prone to outliers and limits its applicability in real-world scenarios. The latter can be particularly harmful in OT domain translation tasks, where the relative position of a sample within a distribution is explicitly taken into account. While unbalanced OT tackles this challenge in the discrete setting, its integration into neural Monge map estimators has received limited attention. We propose a theoretically\ngrounded method to incorporate unbalancedness into any Monge map estimator. We improve existing estimators to model cell trajectories over time and to predict cellular responses to perturbations. Moreover, our approach seamlessly integrates with the OT flow matching (OT-FM) framework. 
While we show that OT-FM performs competitively in image translation, we further improve performance by\nincorporating unbalancedness (UOT-FM), which better preserves relevant features. We hence establish UOT-FM as a principled method for unpaired image translation.", "keywords": "optimal transport;domain translation;image translation;flow matching", "primary_area": "generative models", "supplementary_material": "", "author": "Luca Eyring;Dominik Klein;Th\u00e9o Uscidda;Giovanni Palla;Niki Kilbertus;Zeynep Akata;Fabian J Theis", "authorids": "~Luca_Eyring1;~Dominik_Klein1;~Th\u00e9o_Uscidda1;~Giovanni_Palla1;~Niki_Kilbertus1;~Zeynep_Akata1;~Fabian_J_Theis1", "gender": "M;M;M;;F;;M", "homepage": "https://scholar.google.com/citations?user=Zs1w-ukAAAAJ&hl=en&oi=ao;https://theouscidda6.github.io/;https://giovannipalla.com/;;https://eml-unitue.de/people/zeynep-akata;https://www.helmholtz-munich.de/en/icb/pi/fabian-theis;https://lucaeyring.com/", "dblp": ";;;202/1966;117/4838;t/FabianJTheis;361/7132", "google_scholar": "Zs1w-ukAAAAJ;xnQZonMAAAAJ;20uwxzkAAAAJ;uQZjTq4AAAAJ;jQl9RtkAAAAJ;sqWpn2AAAAAJ;", "orcid": ";;0000-0002-8004-4462;;0000-0002-1432-7747;0000-0002-2419-1943;", "linkedin": ";th\u00e9o-uscidda-926335174/;;;zeynep-akata-36182045/?ppe=1;;luca-eyring-74abb01b2/", "or_profile": "~Dominik_Klein1;~Th\u00e9o_Uscidda1;~Giovanni_Palla1;~Niki_Kilbertus1;~Zeynep_Akata1;~Fabian_J._Theis1;~Luca_Vincent_Eyring1", "aff": ";Ecole Nationale de la Statistique et de l'Administration Economique;Technische Universit\u00e4t M\u00fcnchen;Helmholtz AI;Helmholtz Munich;Technical University Munich;Eberhard-Karls-Universit\u00e4t T\u00fcbingen", "aff_domain": ";ensae.fr;tum.de;helmholtz-muenchen.de;helmholtz-munich.de;tum.de;uni-tuebingen.de", "position": ";PhD student;PhD student;Group Leader;Researcher;Full Professor;PhD student", "bibtex": "@inproceedings{\neyring2024unbalancedness,\ntitle={Unbalancedness in Neural Monge Maps Improves Unpaired Domain Translation},\nauthor={Luca Eyring and Dominik Klein and Th{\\'e}o Uscidda and Giovanni Palla and Niki Kilbertus and Zeynep Akata and Fabian J Theis},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=2UnCj3jeao}\n}", "github": "", "project": "", "reviewers": "1iBx;Rczx;qjsW;LDyN", "pdf_size": 10584155, "rating": "6;6;6;6", "confidence": "3;3;3;4", "soundness": "2;3;3;3", "contribution": "2;3;3;3", "presentation": "3;3;3;3", "wc_summary": "60;120;117;33", "wc_strengths": "46;64;131;54", "wc_weaknesses": "41;37;78;144", "wc_questions": "162;288;40;6", "wc_review": "309;509;366;237", "wc_reply_reviewers": "42;48;0;0", "wc_reply_authors": "993;943;561;439", "reply_reviewers": "1;1;0;0", "reply_authors": "2;2;1;1", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 82.5, 37.259227045122664 ], "wc_strengths_avg": [ 73.75, 33.662850443775554 ], "wc_weaknesses_avg": [ 75.0, 42.924352062669506 ], "wc_questions_avg": [ 124.0, 111.04053313993049 ], "wc_review_avg": [ 355.25, 99.84581864054198 ], "wc_reply_reviewers_avg": [ 22.5, 22.599778759979046 ], "wc_reply_authors_avg": [ 734.0, 238.5979882563975 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 12, "gs_cited_by_link": 
"https://scholar.google.com/scholar?cites=16466905825496249577&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=2UnCj3jeao", "pdf": "https://openreview.net/pdf?id=2UnCj3jeao", "email": ";ensae.fr;tum.de;helmholtz-muenchen.de;helmholtz-munich.de;tum.de;uni-tuebingen.de", "author_num": 7, "aff_unique_index": "0;1;2;3;4;5", "aff_unique_norm": "Ecole Nationale de la Statistique et de l'Administration Economique;Technische Universit\u00e4t M\u00fcnchen;Helmholtz Association of German Research Centres;Helmholtz Zentrum M\u00fcnchen;Technical University of Munich;Eberhard Karls University of T\u00fcbingen", "aff_unique_dep": ";;Helmholtz AI;;;", "aff_unique_url": "https://ensae.fr;https://www.tum.de;https://www.helmholtz-ai.de;https://www.helmholtz-muenchen.de;https://www.tum.de;https://www.uni-tuebingen.de/", "aff_unique_abbr": "ENSAE;TUM;Helmholtz AI;HMGU;TUM;Uni T\u00fcbingen", "aff_campus_unique_index": "1", "aff_campus_unique": ";T\u00fcbingen", "aff_country_unique_index": "0;1;1;1;1;1", "aff_country_unique": "France;Germany" }, { "id": "2UxSXuzrap", "title": "Learning the Unlearnable: Adversarial Augmentations Suppress Unlearnable Example Attacks", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Unlearnable example attacks are data poisoning techniques that can be used to safeguard public data against unauthorized use for training deep learning models. These methods add stealthy perturbations to the original image, thereby making it difficult for deep learning models to learn from these training data effectively. Current research suggests that adversarial training can, to a certain degree, mitigate the impact of unlearnable example attacks, while common data augmentation methods are not effective against such poisons. Adversarial training, however, demands considerable computational resources and can result in non-trivial accuracy loss. In this paper, we introduce the UEraser method, which outperforms current defenses against different types of state-of-the-art unlearnable example attacks through a combination of effective data augmentation policies and loss-maximizing adversarial augmentations. In stark contrast to the current SOTA adversarial training methods, UEraser uses adversarial augmentations, which extends beyond the confines of $\\ell_p$ perturbation budget assumed by current unlearning attacks and defenses. It also helps to improve the model's generalization ability, thus protecting against accuracy loss. UEraser wipes out the unlearning effect with loss-maximizing adversarial augmentations, thus restoring trained model accuracies. Interestingly, UEraser-Lite, a fast variant without adversarial augmentations, is also highly effective in preserving clean accuracies. On challenging unlearnable CIFAR-10, CIFAR-100, SVHN, and ImageNet-subset datasets produced with various attacks, it achieves results that are comparable to those obtained during clean training. We also demonstrate its efficacy against possible adaptive attacks. 
Our code is open source and available to the deep learning community.", "keywords": "Availability Attacks;Unlearnable Examples;Adversarial Machine Learning", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/cb66b6bd43a3dc69768c49799caf6defcb95f2d5.zip", "author": "Tianrui Qin;Xitong Gao;Juanjuan Zhao;Kejiang Ye;Cheng-zhong Xu", "authorids": "~Tianrui_Qin1;~Xitong_Gao1;~Juanjuan_Zhao1;~Kejiang_Ye1;~Cheng-zhong_Xu1", "gender": "M;M;F;;", "homepage": "https://github.com/Tianyue818;https://github.com/admk;https://people.ucas.ac.cn/~zhaojuanjuan?language=cn;;", "dblp": "294/4992;140/2071;;;", "google_scholar": "_bOMXMkAAAAJ;-YIUCL8AAAAJ;;;", "orcid": "0009-0002-8386-2003;0000-0002-2063-2051;;;", "linkedin": ";;;;", "or_profile": "~Tianrui_Qin1;~Xitong_Gao1;~Juanjuan_Zhao1;~Kejiang_Ye1;~Cheng-zhong_Xu1", "aff": "Shenzhen Institutes of Advanced Technology, Chinese Academy of Sciences, Chinese Academy of Sciences;Shenzhen Institute of Advanced Technology, Chinese Academy of Sciences;Shenzhen Institutes of Advanced Technology, Chinese Academy of Sciences, Chinese Academy of Sciences;;", "aff_domain": "siat.ac.cn;siat.ac.cn;siat.ac.cn;;", "position": "MS student;Researcher;Associate Professor;;", "bibtex": "@misc{\nqin2024learning,\ntitle={Learning the Unlearnable: Adversarial Augmentations Suppress Unlearnable Example Attacks},\nauthor={Tianrui Qin and Xitong Gao and Juanjuan Zhao and Kejiang Ye and Cheng-zhong Xu},\nyear={2024},\nurl={https://openreview.net/forum?id=2UxSXuzrap}\n}", "github": "", "project": "", "reviewers": "iWnX;3r2o;E5wZ;6kgo", "site": "https://openreview.net/forum?id=2UxSXuzrap", "pdf_size": 3562476, "rating": "1;3;6;6", "confidence": "5;4;2;3", "soundness": "2;2;3;3", "contribution": "2;2;3;3", "presentation": "2;3;3;3", "wc_summary": "181;77;72;72", "wc_strengths": "29;55;50;109", "wc_weaknesses": "547;365;112;103", "wc_questions": "3;210;11;2", "wc_review": "760;707;245;286", "wc_reply_reviewers": "402;0;0;0", "wc_reply_authors": "808;657;191;210", "reply_reviewers": "1;0;0;0", "reply_authors": "2;1;1;1", "rating_avg": [ 4.0, 2.1213203435596424 ], "confidence_avg": [ 3.5, 1.118033988749895 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 100.5, 46.521500405726385 ], "wc_strengths_avg": [ 60.75, 29.51588555337617 ], "wc_weaknesses_avg": [ 281.75, 185.77859806769993 ], "wc_questions_avg": [ 56.5, 88.69188237939254 ], "wc_review_avg": [ 499.5, 235.19619469710815 ], "wc_reply_reviewers_avg": [ 100.5, 174.07110616067217 ], "wc_reply_authors_avg": [ 466.5, 271.38763789089586 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 10, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.9486832980505139, "gs_citation": 28, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12527428757192423846&as_sdt=40005&sciodt=0,10&hl=en", "gs_version_total": 4, "aff_unique_index": "0;1;0", "aff_unique_norm": "Chinese Academy of Sciences;Shenzhen Institute of Advanced Technology", "aff_unique_dep": "Shenzhen Institutes of Advanced Technology;", "aff_unique_url": "http://www.cas.cn;http://www.siat.cas.cn", "aff_unique_abbr": "CAS;SIAT", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Shenzhen", "aff_country_unique_index": "0;0;0", "aff_country_unique": "China" }, { "title": "On the Over-Memorization During Natural, 
Robust and Catastrophic Overfitting", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19547", "id": "2V1Z0Jdmss", "author_site": "Runqi Lin, Chaojian Yu, Bo Han, Tongliang Liu", "tldr": "", "abstract": "Overfitting negatively impacts the generalization ability of deep neural networks (DNNs) in both natural and adversarial training. Existing methods struggle to consistently address different types of overfitting, typically designing strategies that focus separately on either natural or adversarial patterns. In this work, we adopt a unified perspective by solely focusing on natural patterns to explore different types of overfitting. Specifically, we examine the memorization effect in DNNs and reveal a shared behaviour termed over-memorization, which impairs their generalization capacity. This behaviour manifests as DNNs suddenly becoming high-confidence in predicting certain training patterns and retaining a persistent memory for them. Furthermore, when DNNs over-memorize an adversarial pattern, they tend to simultaneously exhibit high-confidence prediction for the corresponding natural pattern. These findings motivate us to holistically mitigate different types of overfitting by hindering the DNNs from over-memorization training patterns. To this end, we propose a general framework, $\\textit{Distraction Over-Memorization}$ (DOM), which explicitly prevents over-memorization by either removing or augmenting the high-confidence natural patterns. Extensive experiments demonstrate the effectiveness of our proposed method in mitigating overfitting across various training paradigms.", "keywords": "overfitting;natural overfitting;robust overfitting;catastrophic overfitting", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Runqi Lin;Chaojian Yu;Bo Han;Tongliang Liu", "authorids": "~Runqi_Lin1;~Chaojian_Yu1;~Bo_Han1;~Tongliang_Liu1", "gender": "M;M;M;M", "homepage": "https://runqilin.github.io;;https://tongliang-liu.github.io/;https://bhanml.github.io/", "dblp": "359/1108;223/9872;150/6667;241/0472-3", "google_scholar": "Zg7PKbcAAAAJ;b3ltuG8AAAAJ;https://scholar.google.com.au/citations?user=EiLdZ_YAAAAJ;nTNjqHwAAAAJ", "orcid": "0009-0000-6607-7754;;;", "linkedin": ";;;", "or_profile": "~Runqi_Lin1;~Chaojian_Yu1;~Tongliang_Liu1;~bo_han2", "aff": "University of Sydney;The University of Sydney;Mohamed bin Zayed University of Artificial Intelligence;MBZUAI", "aff_domain": "usyd.edu.au;uni.sydney.edu.au;mbzuai.ac.ae;mbzuai.ac.ae", "position": "PhD student;PhD student;Affiliated Associate Professor;Researcher", "bibtex": "@inproceedings{\nlin2024on,\ntitle={On the Over-Memorization During Natural, Robust and Catastrophic Overfitting},\nauthor={Runqi Lin and Chaojian Yu and Bo Han and Tongliang Liu},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=2V1Z0Jdmss}\n}", "github": "", "project": "", "reviewers": "uFwf;mcnh;3ew1;2dX7", "pdf_size": 12791991, "rating": "5;6;6;8", "confidence": "4;4;4;4", "soundness": "2;3;3;3", "contribution": "2;3;3;3", "presentation": "3;3;3;3", "wc_summary": "162;44;121;79", "wc_strengths": "107;40;105;42", "wc_weaknesses": "253;128;140;126", "wc_questions": "114;5;87;2", "wc_review": "636;217;453;249", "wc_reply_reviewers": "348;0;0;0", "wc_reply_authors": "1246;1087;575;709", "reply_reviewers": "2;0;0;0", "reply_authors": "6;4;3;3", "rating_avg": [ 6.25, 
1.0897247358851685 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 101.5, 44.30857704779064 ], "wc_strengths_avg": [ 73.5, 32.515380975778214 ], "wc_weaknesses_avg": [ 161.75, 52.954579594214515 ], "wc_questions_avg": [ 52.0, 49.441885077330944 ], "wc_review_avg": [ 388.75, 169.03309587178484 ], "wc_reply_reviewers_avg": [ 87.0, 150.68842025849233 ], "wc_reply_authors_avg": [ 904.25, 272.35948211876155 ], "reply_reviewers_avg": [ 0.5, 0.8660254037844386 ], "reply_authors_avg": [ 4.0, 1.224744871391589 ], "replies_avg": [ 25, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 14, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14175200537487355709&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=2V1Z0Jdmss", "pdf": "https://openreview.net/pdf?id=2V1Z0Jdmss", "email": "usyd.edu.au;uni.sydney.edu.au;mbzuai.ac.ae;mbzuai.ac.ae", "author_num": 4, "aff_unique_index": "0;0;1;1", "aff_unique_norm": "University of Sydney;Mohamed bin Zayed University of Artificial Intelligence", "aff_unique_dep": ";", "aff_unique_url": "https://www.sydney.edu.au;https://mbzuai.ac.ae", "aff_unique_abbr": "USYD;MBZUAI", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;1;1", "aff_country_unique": "Australia;United Arab Emirates" }, { "id": "2VAi5F9BOJ", "title": "PLPP: PROMPT LEARNING WITH PERPLEXITY FOR VISION-LANGUAGE MODELS", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Pre-trained vision-language (VL) models such as CLIP have demonstrated their excellent performance across numerous downstream tasks. A recent method, called Context Optimization (CoOp), further improves the performance of CLIP on downstream tasks by introducing prompt learning. CoOp optimizes a set of learnable vectors, aka prompt and freezes the whole CLIP model, instead of using manually crafted templates (e.g., a template ``a photo of a \\{category\\}'') to fine-tune the CLIP model. Nonetheless, we observed that the resulting prompts are always incomprehensible, which is counter-intuitive, and existing CoOp-based methods overlook this issue. As the first work aiming at learning comprehensible prompts, this paper proposes to use Perplexity to supervise the process of prompt learning in the CoOp framework. Perplexity is a metric to evaluate the quality of a language model (LM) in Natural Language Processing field, and we design a two-step operation to compute the perplexity for prompts. The first step is a calculation of cosine similarity to obtain the labels of vectors, and the second step is a training-free LM Head to output word probability distribution. Our proposed method, i.e., \\textbf{P}rompt \\textbf{L}earning with \\textbf{P}er\\textbf{P}lexity (PLPP), can be integrated in any CoOp-based method and the experiments show that the learned prompts are much more comprehensible compared with the original and an improved CoOp methods, without sacrificing model accuracy. 
Codes are available at \\href{https://github.com}{https://github.com}.", "keywords": "Vision-Language Models;Prompt Learning;Perplexity.", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/d0440dfa3c5eaa5e0e5608f7abe900e2d2e07894.pdf", "author": "Biao Liu;Wenyi Fang;Xiaoyu Wu;YANG ZHENG;zheng hu;Bo Yuan", "authorids": "~Biao_Liu2;~Wenyi_Fang2;~Xiaoyu_Wu3;~YANG_ZHENG5;~zheng_hu3;~Bo_Yuan14", "gender": "M;M;F;M;;M", "homepage": ";https://www.researchgate.net/profile/Wenyi-Fang-2;;;http://www.none.com;http://cse.sustech.edu.cn/faculty/~yuanb", "dblp": ";;;;;", "google_scholar": "https://scholar.google.com/citations?hl=zh-CN;;bNn7VkEAAAAJ;Vi5OPpoAAAAJ;;", "orcid": ";;;0000-0002-3775-6739;;", "linkedin": ";;;;;", "or_profile": "~Biao_Liu2;~Wenyi_Fang2;~Xiaoyu_Wu3;~YANG_ZHENG5;~zheng_hu3;~Bo_Yuan14", "aff": "Southern University of Science and Technology;;;Huawei Technologies Ltd.;Huawei Technologies Ltd.;", "aff_domain": "sustech.edu.cn;;;huawei.com;huawei.com;", "position": "MS student;;;Researcher;Principal Researcher;", "bibtex": "@misc{\nliu2024plpp,\ntitle={{PLPP}: {PROMPT} {LEARNING} {WITH} {PERPLEXITY} {FOR} {VISION}-{LANGUAGE} {MODELS}},\nauthor={Biao Liu and Wenyi Fang and Xiaoyu Wu and YANG ZHENG and zheng hu and Bo Yuan},\nyear={2024},\nurl={https://openreview.net/forum?id=2VAi5F9BOJ}\n}", "github": "", "project": "", "reviewers": "6oUS;NG2C;42yP;hPSs", "site": "https://openreview.net/forum?id=2VAi5F9BOJ", "pdf_size": 1268300, "rating": "1;3;3;3", "confidence": "4;5;5;5", "soundness": "1;2;2;2", "contribution": "1;2;1;2", "presentation": "2;3;2;2", "wc_summary": "58;67;45;84", "wc_strengths": "7;30;31;118", "wc_weaknesses": "263;305;224;426", "wc_questions": "86;5;5;250", "wc_review": "414;407;305;878", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "392;338;447;171", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 2.5, 0.8660254037844386 ], "confidence_avg": [ 4.75, 0.4330127018922193 ], "soundness_avg": [ 1.75, 0.4330127018922193 ], "contribution_avg": [ 1.5, 0.5 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 63.5, 14.186260959111108 ], "wc_strengths_avg": [ 46.5, 42.38218965556169 ], "wc_weaknesses_avg": [ 304.5, 75.77103668289091 ], "wc_questions_avg": [ 86.5, 100.02124774266716 ], "wc_review_avg": [ 501.0, 221.89524555519435 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 337.0, 103.29811227704019 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 8, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 1.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:w-vWvHN_dSEJ:scholar.google.com/&scioq=PLPP:+PROMPT+LEARNING+WITH+PERPLEXITY+FOR+VISION-LANGUAGE+MODELS&hl=en&as_sdt=0,47", "gs_version_total": 0, "aff_unique_index": "0;1;1", "aff_unique_norm": "Southern University of Science and Technology;Huawei", "aff_unique_dep": ";Huawei Technologies", "aff_unique_url": "https://www.sustech.edu.cn;https://www.huawei.com", "aff_unique_abbr": "SUSTech;Huawei", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "China" }, { "title": "sRGB Real Noise Modeling via Noise-Aware Sampling with Normalizing Flows", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19546", "id": "2XBBumBGeP", "author_site": "Dongjin Kim, Donggoo Jung, Sungyong Baik, Tae Hyun Kim", 
"tldr": "", "abstract": "Noise poses a widespread challenge in signal processing, particularly when it comes to denoising images. Although convolutional neural networks (CNNs) have exhibited remarkable success in this field, they are predicated upon the belief that noise follows established distributions, which restricts their practicality when dealing with real-world noise. To overcome this limitation, several efforts have been taken to collect noisy image datasets from the real world. Generative methods, employing techniques such as generative adversarial networks (GANs) and normalizing flows (NFs), have emerged as a solution for generating realistic noisy images. Recent works model noise using camera metadata, however requiring metadata even for sampling phase. In contrast, in this work, we aim to estimate the underlying camera settings, enabling us to improve noise modeling and generate diverse noise distributions. To this end, we introduce a new NF framework that allows us to both classify noise based on camera settings and generate various noisy images. Through experimental results, our model demonstrates exceptional noise quality and leads in denoising performance on benchmark datasets.", "keywords": "sRGB real noise modeling;Normalizing flow;Low-level vision", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Dongjin Kim;Donggoo Jung;Sungyong Baik;Tae Hyun Kim", "authorids": "~Dongjin_Kim3;~Donggoo_Jung1;~Sungyong_Baik1;~Tae_Hyun_Kim2", "gender": ";M;M;M", "homepage": "https://sites.google.com/view/lliger9/;https://donggoo-jung.github.io;https://dsybaik-hy.github.io/;https://sites.google.com/view/lliger9/", "dblp": "16/9611-4;;243/2775;43/11343-6", "google_scholar": "https://scholar.google.co.kr/citations?user=6I9aJxYAAAAJ;https://scholar.google.co.kr/citations?user=yXJ05SwAAAAJ;lQ4gotkAAAAJ;https://scholar.google.co.kr/citations?user=8soccsoAAAAJ", "orcid": ";;;0000-0002-7995-3984", "linkedin": ";;;", "or_profile": "~Dongjin_Kim3;~Donggoo_Jung1;~Sungyong_Baik1;~Tae_Hyun_Kim2", "aff": "Hanyang University;Hanyang University;Hanyang University;Hanyang University", "aff_domain": "hanyang.ac.kr;hanyang.ac.kr;hanyang.ac.kr;hanyang.ac.kr", "position": "PhD student;PhD student;Assistant Professor;Associate Professor", "bibtex": "@inproceedings{\nkim2024srgb,\ntitle={s{RGB} Real Noise Modeling via Noise-Aware Sampling with Normalizing Flows},\nauthor={Dongjin Kim and Donggoo Jung and Sungyong Baik and Tae Hyun Kim},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=2XBBumBGeP}\n}", "github": "", "project": "", "reviewers": "VvGJ;EqxC;YHPu;s3bG", "pdf_size": 2920526, "rating": "6;6;6;8", "confidence": "5;4;4;5", "soundness": "3;3;3;3", "contribution": "3;3;3;3", "presentation": "3;3;4;3", "wc_summary": "67;67;92;46", "wc_strengths": "57;45;98;78", "wc_weaknesses": "32;69;213;329", "wc_questions": "61;2;5;20", "wc_review": "217;183;408;473", "wc_reply_reviewers": "10;16;0;0", "wc_reply_authors": "339;264;304;1629", "reply_reviewers": "1;1;0;0", "reply_authors": "2;2;1;3", "rating_avg": [ 6.5, 0.8660254037844386 ], "confidence_avg": [ 4.5, 0.5 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 68.0, 16.294170736800325 ], "wc_strengths_avg": [ 69.5, 20.254629100529094 ], "wc_weaknesses_avg": [ 160.75, 118.3561891072875 ], 
"wc_questions_avg": [ 22.0, 23.526580712037184 ], "wc_review_avg": [ 320.25, 123.01498892411445 ], "wc_reply_reviewers_avg": [ 6.5, 6.837397165588672 ], "wc_reply_authors_avg": [ 634.0, 575.0760819230791 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 2.0, 0.7071067811865476 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.5773502691896257, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:pp5KzMwhRq8J:scholar.google.com/&scioq=sRGB+Real+Noise+Modeling+via+Noise-Aware+Sampling+with+Normalizing+Flows&hl=en&as_sdt=0,5", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=2XBBumBGeP", "pdf": "https://openreview.net/pdf?id=2XBBumBGeP", "email": "hanyang.ac.kr;hanyang.ac.kr;hanyang.ac.kr;hanyang.ac.kr", "author_num": 4, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "Hanyang University", "aff_unique_dep": "", "aff_unique_url": "https://www.hanyang.ac.kr", "aff_unique_abbr": "HYU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "South Korea" }, { "title": "Efficient and Scalable Graph Generation through Iterative Local Expansion", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19545", "id": "2XkTz7gdpc", "author_site": "Andreas Bergmeister, Karolis Martinkus, Nathana\u00ebl Perraudin, Roger Wattenhofer", "tldr": "", "abstract": "In the realm of generative models for graphs, extensive research has been conducted. However, most existing methods struggle with large graphs due to the complexity of representing the entire joint distribution across all node pairs and capturing both global and local graph structures simultaneously.\nTo overcome these issues, we introduce a method that generates a graph by progressively expanding a single node to a target graph. In each step, nodes and edges are added in a localized manner through denoising diffusion, building first the global structure, and then refining the local details. The local generation avoids modeling the entire joint distribution over all node pairs, achieving substantial computational savings with subquadratic runtime relative to node count while maintaining high expressivity through multiscale generation.\nOur experiments show that our model achieves state-of-the-art performance on well-established benchmark datasets while successfully scaling to graphs with at least 5000 nodes. 
Our method is also the first to successfully extrapolate to graphs outside of the training distribution, showcasing a much better generalization capability over existing methods.", "keywords": "Graph Generation;Denoising Diffusion;Spectral Graph Theory", "primary_area": "generative models", "supplementary_material": "/attachment/0ee2694b3749856225c65d6a4b2b7ca91de6a422.zip", "author": "Andreas Bergmeister;Karolis Martinkus;Nathana\u00ebl Perraudin;Roger Wattenhofer", "authorids": "~Andreas_Bergmeister1;~Karolis_Martinkus1;~Nathana\u00ebl_Perraudin1;~Roger_Wattenhofer1", "gender": "M;M;M;Not Specified", "homepage": "https://bergmeister.ai/;https://disco.ethz.ch/members/mkarolis;;https://disco.ethz.ch/members/wroger", "dblp": ";276/5531;139/7579;w/RogerWattenhofer", "google_scholar": "CvdjBd8AAAAJ;https://scholar.google.ch/citations?user=Sr6ho54AAAAJ;;https://scholar.google.ch/citations?user=EG3VPm4AAAAJ", "orcid": "0009-0000-8039-3577;0000-0002-5344-4321;;", "linkedin": "andreas-bergmeister;;;roger-wattenhofer-4466731/", "or_profile": "~Andreas_Bergmeister1;~Karolis_Martinkus1;~Nathana\u00ebl_Perraudin1;~Roger_Wattenhofer1", "aff": "Technische Universit\u00e4t M\u00fcnchen;Prescient Design / Genentech / Roche;ETHZ - ETH Zurich;Swiss Federal Institute of Technology", "aff_domain": "tum.de;roche.com;ethz.ch;ethz.ch", "position": "PhD student;Researcher;Researcher;Full Professor", "bibtex": "@inproceedings{\nbergmeister2024efficient,\ntitle={Efficient and Scalable Graph Generation through Iterative Local Expansion},\nauthor={Andreas Bergmeister and Karolis Martinkus and Nathana{\\\"e}l Perraudin and Roger Wattenhofer},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=2XkTz7gdpc}\n}", "github": "", "project": "", "reviewers": "HbqV;sNQQ;38QF;mLXw", "pdf_size": 2488113, "rating": "5;5;6;8", "confidence": "4;4;2;3", "soundness": "3;2;3;3", "contribution": "3;2;2;3", "presentation": "2;2;2;2", "wc_summary": "156;65;39;134", "wc_strengths": "174;68;25;62", "wc_weaknesses": "314;699;209;178", "wc_questions": "205;318;24;152", "wc_review": "849;1150;297;526", "wc_reply_reviewers": "41;256;221;21", "wc_reply_authors": "1472;1611;652;350", "reply_reviewers": "1;1;1;1", "reply_authors": "3;3;2;1", "rating_avg": [ 6.0, 1.224744871391589 ], "confidence_avg": [ 3.25, 0.82915619758885 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.0, 0.0 ], "wc_summary_avg": [ 98.5, 48.03384223648989 ], "wc_strengths_avg": [ 82.25, 55.472403048723244 ], "wc_weaknesses_avg": [ 350.0, 207.70291283465428 ], "wc_questions_avg": [ 174.75, 105.68674230952527 ], "wc_review_avg": [ 705.5, 322.98026255485024 ], "wc_reply_reviewers_avg": [ 134.75, 104.72434053265745 ], "wc_reply_authors_avg": [ 1021.25, 533.3626228936557 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 2.25, 0.82915619758885 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.4923659639173309, "gs_citation": 21, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=1056667947435683956&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 7, "openreview": "https://openreview.net/forum?id=2XkTz7gdpc", "pdf": "https://openreview.net/pdf?id=2XkTz7gdpc", "email": "tum.de;roche.com;ethz.ch;ethz.ch", "author_num": 4, "aff_unique_index": "0;1;2;3", "aff_unique_norm": "Technische Universit\u00e4t M\u00fcnchen;Roche;ETH Zurich;Swiss Federal Institute of Technology", "aff_unique_dep": 
";;;", "aff_unique_url": "https://www.tum.de;https://www.roche.com;https://www.ethz.ch;https://www.ethz.ch", "aff_unique_abbr": "TUM;Roche;ETHZ;ETH Zurich", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;1;1", "aff_country_unique": "Germany;Switzerland" }, { "id": "2XwBIcywWM", "title": "Learning Variational Neighbor Labels for Test-Time Domain Generalization", "track": "main", "status": "Reject", "tldr": "", "abstract": "This paper strives for domain generalization, where models are trained exclusively on source domains before being deployed on unseen target domains. We follow the strict separation of source training and target testing, but exploit the value of the unlabeled target data itself during inference. We make three contributions. First, we propose probabilistic pseudo-labeling of target samples to generalize the source-trained model to the target domain at test time. We formulate the generalization at test time as a variational inference problem, by modeling pseudo labels as distributions, to consider the uncertainty during generalization and alleviate the misleading signal of inaccurate pseudo labels. Second, we learn variational neighbor labels that incorporate the information of neighboring target samples to generate more robust pseudo labels. Third, to learn the ability to incorporate more representative target information and generate more precise and robust variational neighbor labels, we introduce a meta-generalization stage during training to simulate the generalization procedure. Experiments on seven widely-used datasets demonstrate the benefits, abilities, and effectiveness of our proposal.", "keywords": "test-time generalization;domain generalization;variational inference", "primary_area": "probabilistic methods (Bayesian methods, variational inference, sampling, UQ, etc.)", "supplementary_material": "/attachment/b10340de65b51f95d799e346fae7e3c996a05b02.zip", "author": "Sameer Ambekar;Zehao Xiao;Jiayi Shen;Xiantong Zhen;Cees G. M. Snoek", "authorids": "~Sameer_Ambekar1;~Zehao_Xiao1;~Jiayi_Shen3;~Xiantong_Zhen1;~Cees_G._M._Snoek1", "gender": "M;M;F;M;M", "homepage": "https://ambekarsameer.com;https://zzzx1224.github.io/;https://autumn9999.github.io/;;http://www.ceessnoek.info", "dblp": "267/5374;225/5426;;78/10651;s/CeesSnoek", "google_scholar": "bf8p2wMAAAAJ;https://scholar.google.com/citations?hl=zh-CN;https://scholar.google.com/citations?hl=zh-CN;https://scholar.google.ca/citations?user=DnBb3e0AAAAJ;https://scholar.google.nl/citations?user=0uKdbscAAAAJ", "orcid": "0000-0002-8650-3180;;;;0000-0001-9092-1556", "linkedin": "ambekarsameer/;;;;cgmsnoek/", "or_profile": "~Sameer_Ambekar1;~Zehao_Xiao1;~Jiayi_Shen3;~Xiantong_Zhen1;~Cees_Snoek1", "aff": "Technische Universit\u00e4t M\u00fcnchen;University of Amsterdam;University of Amsterdam;United Imaging Healthcare, Co., Ltd.;University of Amsterdam", "aff_domain": "tum.de;uva.nl;uva.nl;cri-united-imaging.com;uva.nl", "position": "PhD student;PhD student;PhD student;Principal Researcher;Full Professor", "bibtex": "@misc{\nambekar2024learning,\ntitle={Learning Variational Neighbor Labels for Test-Time Domain Generalization},\nauthor={Sameer Ambekar and Zehao Xiao and Jiayi Shen and Xiantong Zhen and Cees G. M. 
Snoek},\nyear={2024},\nurl={https://openreview.net/forum?id=2XwBIcywWM}\n}", "github": "", "project": "", "reviewers": "4tVC;CA6h;JCc1;Hsmr", "site": "https://openreview.net/forum?id=2XwBIcywWM", "pdf_size": 1947754, "rating": "5;5;5;5", "confidence": "4;3;3;3", "soundness": "2;3;2;3", "contribution": "2;2;2;3", "presentation": "1;2;2;3", "wc_summary": "76;199;50;106", "wc_strengths": "24;29;21;65", "wc_weaknesses": "237;210;112;27", "wc_questions": "4;525;5;2", "wc_review": "341;963;188;200", "wc_reply_reviewers": "0;26;0;0", "wc_reply_authors": "662;666;580;117", "reply_reviewers": "0;1;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 5.0, 0.0 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.0, 0.7071067811865476 ], "wc_summary_avg": [ 107.75, 56.286654723833074 ], "wc_strengths_avg": [ 34.75, 17.69710428290459 ], "wc_weaknesses_avg": [ 146.5, 83.20606949015198 ], "wc_questions_avg": [ 134.0, 225.74653928687368 ], "wc_review_avg": [ 423.0, 317.52086545611456 ], "wc_reply_reviewers_avg": [ 6.5, 11.258330249197702 ], "wc_reply_authors_avg": [ 506.25, 227.33936636667218 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=17881603264637544125&as_sdt=8005&sciodt=0,7&hl=en", "gs_version_total": 0, "aff_unique_index": "0;1;1;2;1", "aff_unique_norm": "Technische Universit\u00e4t M\u00fcnchen;University of Amsterdam;United Imaging Healthcare", "aff_unique_dep": ";;", "aff_unique_url": "https://www.tum.de;https://www.uva.nl;https://www.united-imaging.com", "aff_unique_abbr": "TUM;UvA;", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;1;2;1", "aff_country_unique": "Germany;Netherlands;China" }, { "id": "2Y5Gseybzp", "title": "Imprecise Label Learning: A Unified Framework for Learning with Various Imprecise Label Configurations", "track": "main", "status": "Reject", "tldr": "", "abstract": "Learning with reduced labeling standards, such as noisy label, partial label, and multiple label candidates, which we generically refer to as imprecise labels, is a commonplace challenge in machine learning tasks. Previous methods tend to propose specific designs for every emerging imprecise label configuration, which is usually unsustainable when multiple configurations of imprecision coexist. In this paper, we introduce imprecise label learning (ILL), a framework towards the unification of learning with various imprecise label configurations.\nILL leverages expectation-maximization (EM) for modeling the imprecise label information, treating the precise labels as latent variables.\nInstead of approximating the correct labels for training, it considers the entire distribution of all possible labeling entailed by the imprecise information. We demonstrate that ILL can seamlessly adapt to partial label learning, semi-supervised learning, noisy label learning, and more importantly, a mixture of these settings. Notably, ILL surpasses the existing specified techniques for handling imprecise labels, marking the first unified framework with robust and effective performance across various challenging settings. 
We hope our work will inspire further research on this topic, unleashing the full potential of ILL in wider scenarios where precise labels are expensive and complicated to obtain.", "keywords": "Imprecise Label Learning; Partial Label Learning; Noisy Label Learning; Semi-Supervised Learning; Expectation-Maximization", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/e25f7b08b1c6086eea0ac0095c71559ffe465b91.zip", "author": "Hao Chen;Ankit Shah;Jindong Wang;Ran Tao;Yidong Wang;Xing Xie;Masashi Sugiyama;Rita Singh;Bhiksha Raj", "authorids": "~Hao_Chen15;~Ankit_Shah1;~Jindong_Wang1;~Ran_Tao2;~Yidong_Wang1;~Xing_Xie3;~Masashi_Sugiyama1;~Rita_Singh1;~Bhiksha_Raj1", "gender": "M;M;F;M;M;M;F;M;M", "homepage": "https://hhhhhhao.github.io/;https://ankitshah009.github.io/;;https://qianlanwyd.github.io/;http://research.microsoft.com/en-us/people/xingx/;http://www.ms.k.u-tokyo.ac.jp/sugi/;http://mlsp.cs.cmu.edu/people/rsingh/index.html;https://www.cs.cmu.edu/directory/bhikshar/;https://jd92.wang/", "dblp": ";04/1935-1.html;99/955;59/6759.html;08/6809-1;35/1228;;60/3996;19/2969-1", "google_scholar": "tktqkhwAAAAJ;https://scholar.google.co.in/citations?user=TqG1H4cAAAAJ;7xW2y6EAAAAJ;;5EQfAFIAAAAJ;https://scholar.google.co.jp/citations?user=GkYIrlIAAAAJ;;;hBZ_tKsAAAAJ", "orcid": ";0000-0002-8838-5421;;;0000-0002-8608-8482;0000-0001-6658-6743;;;0000-0002-4833-0880", "linkedin": "haochen97/;ankpsh01/;;;xingx/;;;;jindong-wang/", "or_profile": "~Hao_Chen15;~Ankit_Shah1;~Ran_Tao2;~Yidong_Wang1;~Xing_Xie3;~Masashi_Sugiyama1;~Rita_Singh1;~Bhiksha_Raj1;~Jindong_Wang4", "aff": "Carnegie Mellon University;Accenture;;Peking University;Microsoft Research Asia;The University of Tokyo;School of Computer Science, Carnegie Mellon University;Mohamed bin Zayed University of Artificial Intelligence;Microsoft Research", "aff_domain": "andrew.cmu.edu;accenture.com;;pku.edu.cn;microsoft.com;u-tokyo.ac.jp;cs.cmu.edu;mbzuai.ac.ae;microsoft.com", "position": "PhD student;Principal Researcher;;PhD student;Senior Principal Researcher;Full Professor;Research Professor;Full Professor;Researcher", "bibtex": "@misc{\nchen2024imprecise,\ntitle={Imprecise Label Learning: A Unified Framework for Learning with Various Imprecise Label Configurations},\nauthor={Hao Chen and Ankit Shah and Jindong Wang and Ran Tao and Yidong Wang and Xing Xie and Masashi Sugiyama and Rita Singh and Bhiksha Raj},\nyear={2024},\nurl={https://openreview.net/forum?id=2Y5Gseybzp}\n}", "github": "", "project": "", "reviewers": "yf7f;AiQR;torK;QeBS", "site": "https://openreview.net/forum?id=2Y5Gseybzp", "pdf_size": 825344, "rating": "5;5;6;8", "confidence": "4;2;4;4", "soundness": "2;3;3;3", "contribution": "2;3;3;1", "presentation": "2;2;2;3", "wc_summary": "108;138;155;53", "wc_strengths": "42;68;181;66", "wc_weaknesses": "367;144;140;144", "wc_questions": "80;71;181;2", "wc_review": "597;421;657;265", "wc_reply_reviewers": "77;229;0;0", "wc_reply_authors": "1513;1513;1249;511", "reply_reviewers": "1;1;0;0", "reply_authors": "4;3;3;2", "rating_avg": [ 6.0, 1.224744871391589 ], "confidence_avg": [ 3.5, 0.8660254037844386 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.82915619758885 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 113.5, 38.771768079364136 ], "wc_strengths_avg": [ 89.25, 53.9507877606991 ], "wc_weaknesses_avg": [ 198.75, 97.15290783090335 ], "wc_questions_avg": [ 83.5, 63.869006568131304 ], 
"wc_review_avg": [ 485.0, 153.80507143784303 ], "wc_reply_reviewers_avg": [ 76.5, 93.4893042010689 ], "wc_reply_authors_avg": [ 1196.5, 410.18623818943513 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 3.0, 0.7071067811865476 ], "replies_avg": [ 22, 0 ], "authors#_avg": [ 9, 0 ], "corr_rating_confidence": 0.4714045207910316, "gs_citation": 16, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11537090440769158708&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 6, "aff_unique_index": "0;1;2;3;4;0;5;3", "aff_unique_norm": "Carnegie Mellon University;Accenture;Peking University;Microsoft;University of Tokyo;Mohamed bin Zayed University of Artificial Intelligence", "aff_unique_dep": ";;;Research;;", "aff_unique_url": "https://www.cmu.edu;https://www.accenture.com;http://www.pku.edu.cn;https://www.microsoft.com/en-us/research/group/asia;https://www.u-tokyo.ac.jp;https://mbzuai.ac.ae", "aff_unique_abbr": "CMU;Accenture;Peking U;MSR Asia;UTokyo;MBZUAI", "aff_campus_unique_index": "1;2", "aff_campus_unique": ";Asia;Pittsburgh", "aff_country_unique_index": "0;0;1;1;2;0;3;0", "aff_country_unique": "United States;China;Japan;United Arab Emirates" }, { "title": "MEND: Meta Demonstration Distillation for Efficient and Effective In-Context Learning", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19544", "id": "2Y5kBPtU0o", "author_site": "Yichuan Li, Xiyao Ma, Sixing Lu, Kyumin Lee, Xiaohu Liu, Chenlei Guo", "tldr": "", "abstract": "Large Language models (LLMs) have demonstrated impressive in-context learning (ICL) capabilities, \nwhere a LLM makes predictions for a given test input together with a few input-output pairs (demonstrations).\nNevertheless, the inclusion of demonstrations poses a challenge, leading to a quadratic increase in the computational overhead of the self-attention mechanism.\nExisting solutions attempt to condense lengthy demonstrations into compact vectors. \nHowever, they often require task-specific retraining or compromise LLM's in-context learning performance. \nTo mitigate these challenges, we present Meta Demonstration Distillation (MEND), where a language model learns to distill any lengthy demonstrations into vectors without retraining for a new downstream task. \nWe exploit the knowledge distillation to enhance alignment between MEND and MEND, achieving both efficiency and effectiveness concurrently. \nMEND is endowed with the meta-knowledge of distilling demonstrations through a two-stage training process, which includes meta-distillation pretraining and fine-tuning.\nComprehensive evaluations across seven diverse ICL settings using decoder-only (GPT-2) and encoder-decoder (T5) attest to MEND's prowess.\nIt not only matches but often outperforms the Vanilla ICL as well as other state-of-the-art distillation models, while significantly reducing the computational demands. 
\nThis innovation promises enhanced scalability and efficiency for the practical deployment of large language models.", "keywords": "in-context learning;language modeling;data distillation;knowledge distillation", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/f315aa78126a99535a58cf174e1f3f45b6db588c.zip", "author": "Yichuan Li;Xiyao Ma;Sixing Lu;Kyumin Lee;Xiaohu Liu;Chenlei Guo", "authorids": "~Yichuan_Li3;~Xiyao_Ma1;~Sixing_Lu1;~Kyumin_Lee1;~Xiaohu_Liu1;~Chenlei_Guo1", "gender": ";;;M;;M", "homepage": ";;https://www.linkedin.com/in/sixinglu/;https://web.cs.wpi.edu/~kmlee/;;", "dblp": "216/7478-1.html;;;https://dblp.uni-trier.de/pid/22/8024.html;18/2453;03/5480", "google_scholar": "lLvYmOwAAAAJ;;https://scholar.google.com/citations?hl=en;zQKRsSEAAAAJ;;gRFsEm4AAAAJ", "orcid": ";;;;;", "linkedin": ";;;;;clguo/", "or_profile": "~Yichuan_Li3;~Xiyao_Ma1;~Sixing_Lu1;~Kyumin_Lee1;~Xiaohu_Liu1;~Chenlei_Guo1", "aff": "Worcester Polytechnic Institute;;University of Arizona;Worcester Polytechnic Institute;;", "aff_domain": "wpi.edu;;arizona.edu;wpi.edu;;", "position": "PhD student;;PhD student;Associate Professor;;", "bibtex": "@inproceedings{\nli2024mend,\ntitle={{MEND}: Meta Demonstration Distillation for Efficient and Effective In-Context Learning},\nauthor={Yichuan Li and Xiyao Ma and Sixing Lu and Kyumin Lee and Xiaohu Liu and Chenlei Guo},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=2Y5kBPtU0o}\n}", "github": "", "project": "", "reviewers": "RDfP;RPCQ;Dw9E;Uu3b", "pdf_size": 744151, "rating": "5;6;6;8", "confidence": "5;4;4;4", "soundness": "2;3;3;3", "contribution": "3;2;3;3", "presentation": "3;2;2;3", "wc_summary": "51;54;82;172", "wc_strengths": "60;20;40;79", "wc_weaknesses": "139;45;188;134", "wc_questions": "2;169;50;146", "wc_review": "252;288;360;531", "wc_reply_reviewers": "0;0;0;44", "wc_reply_authors": "442;922;735;545", "reply_reviewers": "0;0;0;1", "reply_authors": "1;2;2;1", "rating_avg": [ 6.25, 1.0897247358851685 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 89.75, 49.00191322795468 ], "wc_strengths_avg": [ 49.75, 22.02697210240209 ], "wc_weaknesses_avg": [ 126.5, 51.56791638218477 ], "wc_questions_avg": [ 91.75, 68.38996636934398 ], "wc_review_avg": [ 357.75, 107.31816015940639 ], "wc_reply_reviewers_avg": [ 11.0, 19.05255888325765 ], "wc_reply_authors_avg": [ 661.0, 183.72125625523032 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.6622661785325219, "gs_citation": 7, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11600534499645052239&as_sdt=400005&sciodt=0,14&hl=en", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=2Y5kBPtU0o", "pdf": "https://openreview.net/pdf?id=2Y5kBPtU0o", "email": "wpi.edu;;arizona.edu;wpi.edu;;", "author_num": 6, "aff_unique_index": "0;1;0", "aff_unique_norm": "Worcester Polytechnic Institute;University of Arizona", "aff_unique_dep": ";", "aff_unique_url": "https://www.wpi.edu;https://www.arizona.edu", "aff_unique_abbr": "WPI;UA", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" 
}, { "id": "2aebB2mf0q", "title": "SemiAugIR: Semi-supervised Infrared Small Target Detection via Thermodynamics-Inspired Data Augmentation", "track": "main", "status": "Reject", "tldr": "", "abstract": "Convolutional neural networks have shown promising results in single-frame infrared small target detection (SIRST) through supervised learning. Nevertheless, this approach requires a substantial number of accurate manual annotations on a per-pixel basis, incurring significant labor costs. To mitigate this, we pioneer the integration of semi-supervised learning into SIRST by exploiting the consistency of paired training samples obtained from data augmentation. Unlike prevalent data augmentation techniques that often rely on standard image processing pipelines designed for visible light natural images, we introduce a novel Thermodynamics-inspired data augmentation technique tailored for infrared images. It enhances infrared images by simulating energy distribution using the thermodynamic radiation pattern of infrared imaging and employing unlabeled images as references. Additionally, to replicate spatial distortions caused by variations in angle and distance during infrared imaging, we design a non-uniform mapping in positional space. This introduces non-uniform offsets in chromaticity and position, inducing desired changes in chromaticity and target configuration. This approach substantially diversifies the training samples, enabling the network to extract more robust features. We also devise an adaptive exponentially weighted loss function to address the challenge of training collapse due to imbalanced and inaccurately labeled samples. Integrating them together, we present SemiAugIR, which delivers promising results on two widely used benchmarks, e.g., with only 1/8 of the labeled samples, it achieves over 94\\% performance of the state-of-the-art fully supervised learning method. 
The source code will be released.", "keywords": "single-frame infrared small target detection;semi-supervised learning;non-uniform data augmentation;adaptive exponentially weighted loss function", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Mingjin Zhang;Wenteng Shang;Haichen Bai;Yunsong Li;Xinbo Gao;Jing Zhang", "authorids": "~Mingjin_Zhang2;~Wenteng_Shang1;~Haichen_Bai1;~Yunsong_Li1;~Xinbo_Gao3;~Jing_Zhang17", "gender": "F;M;M;M;M;M", "homepage": "https://web.xidian.edu.cn/mjinzhang/index.html;;;https://web.xidian.edu.cn/ysli/;http://see.xidian.edu.cn/faculty/xbgao/;", "dblp": "136/8003;;;;;05/3499-37.html", "google_scholar": "https://scholar.google.com/citations?hl=zh-CN;;q8eamah50lwC;aY_2RzkAAAAJ;;https://scholar.google.com/citations?hl=en", "orcid": "0000-0002-1473-9784;0009-0004-9174-4132;0000-0002-5547-9958;;0000-0003-1443-0776;0000-0001-6595-7661", "linkedin": ";;;;;", "or_profile": "~Mingjin_Zhang2;~Wenteng_Shang1;~Haichen_Bai1;~Yunsong_Li1;~Xinbo_Gao3;~Jing_Zhang17", "aff": "Xidian University;Xi'an University of Electronic Science and Technology;Xi'an University of Electronic Science and Technology;Xidian University ;Xidian University;The University of Sydney", "aff_domain": "xidian.edu.cn;xidian.edu.cn;xidian.edu.cn;xidian.edu.cn;xidian.edu.cn;sydney.edu.au", "position": "Full Professor;MS student;MS student;Full Professor;Full Professor;Research Fellow", "bibtex": "@misc{\nzhang2024semiaugir,\ntitle={SemiAug{IR}: Semi-supervised Infrared Small Target Detection via Thermodynamics-Inspired Data Augmentation},\nauthor={Mingjin Zhang and Wenteng Shang and Haichen Bai and Yunsong Li and Xinbo Gao and Jing Zhang},\nyear={2024},\nurl={https://openreview.net/forum?id=2aebB2mf0q}\n}", "github": "", "project": "", "reviewers": "ARSd;5Vyd;kGGx", "site": "https://openreview.net/forum?id=2aebB2mf0q", "pdf_size": 1374918, "rating": "3;5;10", "confidence": "2;3;5", "soundness": "1;3;4", "contribution": "1;4;4", "presentation": "2;2;3", "wc_summary": "50;43;98", "wc_strengths": "30;48;85", "wc_weaknesses": "340;15;251", "wc_questions": "1;7;62", "wc_review": "421;113;496", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "1850;772;1500", "reply_reviewers": "0;0;0", "reply_authors": "3;1;3", "rating_avg": [ 6.0, 2.943920288775949 ], "confidence_avg": [ 3.3333333333333335, 1.247219128924647 ], "soundness_avg": [ 2.6666666666666665, 1.247219128924647 ], "contribution_avg": [ 3.0, 1.4142135623730951 ], "presentation_avg": [ 2.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 63.666666666666664, 24.44494948973214 ], "wc_strengths_avg": [ 54.333333333333336, 22.89589968143253 ], "wc_weaknesses_avg": [ 202.0, 137.1301085344377 ], "wc_questions_avg": [ 23.333333333333332, 27.450966386551052 ], "wc_review_avg": [ 343.3333333333333, 165.72333034977973 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 1374.0, 449.0196729171971 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 2.3333333333333335, 0.9428090415820634 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.9986254289035241, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10782864233969299252&as_sdt=400005&sciodt=0,14&hl=en", "gs_version_total": 0, "aff_unique_index": "0;1;1;0;0;2", "aff_unique_norm": "Xidian University;Xi'an University of Electronic Science and Technology;University of Sydney", "aff_unique_dep": ";;", "aff_unique_url": 
"http://www.xidian.edu.cn/;http://www.xidian.edu.cn/;https://www.sydney.edu.au", "aff_unique_abbr": "Xidian;Xidian University;USYD", "aff_campus_unique_index": "1;1", "aff_campus_unique": ";Xi'an", "aff_country_unique_index": "0;0;0;0;0;1", "aff_country_unique": "China;Australia" }, { "id": "2bF381xEke", "title": "MapSelect: Sparse & Interpretable Graph Attention Networks", "track": "main", "status": "Reject", "tldr": "", "abstract": "Graph Attention Networks (GATs) have shown remarkable performance in capturing complex graph structures by assigning dense attention weights over all neighbours of a node. Attention weights can act as an inherent explanation for the model output, by highlighting the most important neighbours for a given input graph. However, the dense nature of the attention layer causes a lack of focus as all edges receive some probability mass. To overcome this, we introduce MapSelect, a new method providing a fully differentiable sparse attention mechanism. Through user-defined constraints, MapSelect enables precise control over the attention density, acting as a continuous relaxation of the popular top-k operator. We propose two distinct variants of MapSelect: a local approach maintaining a fixed degree per node, and a global approach preserving a percentage of the full graph. Upon conducting a comprehensive evaluation of five sparse GATs in terms of sparsity, performance, and interpretability, we provide insights on the sparsity-accuracy and sparsity-interpretability trade-offs. Our results show that MapSelect outperforms robust baselines in terms of interpretability, especially in the local context, while also leading to competitive task performance on real-world datasets.", "keywords": "Graph attention networks;interpretability;sparsity;self-interpretable methods", "primary_area": "visualization or interpretation of learned representations", "supplementary_material": "", "author": "Titus Naber;Marcos Vinicius Treviso;Andre Martins;Elvin Isufi", "authorids": "~Titus_Naber1;~Marcos_Vinicius_Treviso1;~Andre_Martins1;~Elvin_Isufi1", "gender": "M;M;M;M", "homepage": ";;https://andre-martins.github.io/;https://sites.google.com/site/elvinisufihp/", "dblp": ";188/5938;m/AndreFTMartins;156/9608", "google_scholar": ";puR_FskAAAAJ;https://scholar.google.pt/citations?user=mT7ppvwAAAAJ;wvywFdwAAAAJ", "orcid": ";;;", "linkedin": "titus-naber/;;;", "or_profile": "~Titus_Naber1;~Marcos_Vinicius_Treviso1;~Andre_Martins1;~Elvin_Isufi1", "aff": ";Instituto de Telecomunica\u00e7\u00f5es, Portugal;Unbabel;Delft University of Technology", "aff_domain": ";it.pt;unbabel.com;tudelft.nl", "position": ";Postdoc;Research Scientist;Associate Professor", "bibtex": "@misc{\nnaber2024mapselect,\ntitle={MapSelect: Sparse \\& Interpretable Graph Attention Networks},\nauthor={Titus Naber and Marcos Vinicius Treviso and Andre Martins and Elvin Isufi},\nyear={2024},\nurl={https://openreview.net/forum?id=2bF381xEke}\n}", "github": "", "project": "", "reviewers": "b971;EqGL;iHh7;WU6w", "site": "https://openreview.net/forum?id=2bF381xEke", "pdf_size": 849635, "rating": "3;3;3;3", "confidence": "4;3;5;4", "soundness": "2;2;3;2", "contribution": "2;1;2;2", "presentation": "2;2;3;4", "wc_summary": "166;97;76;73", "wc_strengths": "84;17;34;34", "wc_weaknesses": "103;104;202;272", "wc_questions": "89;8;3;75", "wc_review": "442;226;315;454", "wc_reply_reviewers": "0;0;0;123", "wc_reply_authors": "328;305;330;478", "reply_reviewers": "0;0;0;1", "reply_authors": "1;1;1;1", "rating_avg": [ 3.0, 0.0 ], 
"confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.82915619758885 ], "wc_summary_avg": [ 103.0, 37.52998800959041 ], "wc_strengths_avg": [ 42.25, 25.083610186733488 ], "wc_weaknesses_avg": [ 170.25, 71.19120381058323 ], "wc_questions_avg": [ 43.75, 38.6094224251024 ], "wc_review_avg": [ 359.25, 94.25862029544035 ], "wc_reply_reviewers_avg": [ 30.75, 53.26056233274298 ], "wc_reply_authors_avg": [ 360.25, 68.68906390394325 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:lAsUqR-ONNAJ:scholar.google.com/&scioq=MapSelect:+Sparse+%26+Interpretable+Graph+Attention+Networks&hl=en&as_sdt=0,44", "gs_version_total": 0, "aff_unique_index": "0;1;2", "aff_unique_norm": "Instituto de Telecomunica\u00e7\u00f5es;Unbabel;Delft University of Technology", "aff_unique_dep": ";;", "aff_unique_url": "https://www.it.pt;https://www.unbabel.com;https://www.tudelft.nl", "aff_unique_abbr": ";;TU Delft", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;1", "aff_country_unique": "Portugal;Netherlands" }, { "id": "2boLXjsHsB", "title": "Multi-Objective Reinforcement Learning for Forward-Backward Markov Decision Processes", "track": "main", "status": "Reject", "tldr": "", "abstract": "This work introduces the notion of Forward-Backward Markov Decision Process (FB-MDP)\nfor multi-task control problems. In this context, we devise a novel approach called Forward-Backward Multi-Objective Reinforcement Learning (FB-MORL).\nSpecifically, we analytically characterize its convergence towards a Pareto-optimal solution and also empirically evaluate its effectiveness.\nFor the latter, we consider a use case in wireless caching and perform several experiments to characterize performance in that context. 
Finally, an ablation study demonstrates that FB-MDP is instrumental to optimize rewards for systems with forward-backward dynamics.\nThe outcomes of this work pave the way for further understanding of multi-objective RL algorithms for FB-MDPs.", "keywords": "Forward-Backward Markov Decision Process;Multi-Objective Reinforcement Learning Algorithm", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Mohsen Amidzadeh;Mario Di Francesco", "authorids": "~Mohsen_Amidzadeh1;~Mario_Di_Francesco1", "gender": "M;", "homepage": "https://research.aalto.fi/en/persons/mohsen-amidzade;", "dblp": ";", "google_scholar": ";", "orcid": ";", "linkedin": ";", "or_profile": "~Mohsen_Amidzadeh1;~Mario_Di_Francesco1", "aff": "Aalto University;", "aff_domain": "aalto.fi;", "position": "Postdoc;", "bibtex": "@misc{\namidzadeh2024multiobjective,\ntitle={Multi-Objective Reinforcement Learning for Forward-Backward Markov Decision Processes},\nauthor={Mohsen Amidzadeh and Mario Di Francesco},\nyear={2024},\nurl={https://openreview.net/forum?id=2boLXjsHsB}\n}", "github": "", "project": "", "reviewers": "EeKJ;g9Ad;AwDv", "site": "https://openreview.net/forum?id=2boLXjsHsB", "pdf_size": 1878236, "rating": "5;5;5", "confidence": "4;4;3", "soundness": "3;3;3", "contribution": "2;2;2", "presentation": "2;2;3", "wc_summary": "44;101;132", "wc_strengths": "23;50;111", "wc_weaknesses": "26;139;504", "wc_questions": "256;108;138", "wc_review": "349;398;885", "wc_reply_reviewers": "23;325;0", "wc_reply_authors": "766;1146;750", "reply_reviewers": "1;2;0", "reply_authors": "1;2;1", "rating_avg": [ 5.0, 0.0 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 92.33333333333333, 36.44478319625763 ], "wc_strengths_avg": [ 61.333333333333336, 36.80881536926839 ], "wc_weaknesses_avg": [ 223.0, 203.98202535190856 ], "wc_questions_avg": [ 167.33333333333334, 63.88183535942662 ], "wc_review_avg": [ 544.0, 241.9517858307036 ], "wc_reply_reviewers_avg": [ 116.0, 148.0833098855731 ], "wc_reply_authors_avg": [ 887.3333333333334, 183.0215530720054 ], "reply_reviewers_avg": [ 1.0, 0.816496580927726 ], "reply_authors_avg": [ 1.3333333333333333, 0.4714045207910317 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:n52GeLK86McJ:scholar.google.com/&scioq=Multi-Objective+Reinforcement+Learning+for+Forward-Backward+Markov+Decision+Processes&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0", "aff_unique_norm": "Aalto University", "aff_unique_dep": "", "aff_unique_url": "https://www.aalto.fi", "aff_unique_abbr": "Aalto", "aff_country_unique_index": "0", "aff_country_unique": "Finland" }, { "title": "Beyond Reverse KL: Generalizing Direct Preference Optimization with Diverse Divergence Constraints", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19543", "id": "2cRzmWXK9N", "author_site": "Chaoqi Wang, Yibo Jiang, Chenghao Yang, Han Liu, Yuxin Chen", "tldr": "", "abstract": "The increasing capabilities of large language models (LLMs) raise opportunities for artificial general intelligence but concurrently amplify safety concerns, such as potential misuse of AI systems, necessitating effective AI alignment. 
Reinforcement Learning from Human Feedback (RLHF) has emerged as a promising pathway towards AI alignment but brings forth challenges due to its complexity and dependence on a separate reward model. Direct Preference Optimization (DPO) has been proposed as an alternative; and it remains equivalent to RLHF under the reverse KL regularization constraint. This paper presents $f$-DPO, a generalized approach to DPO by incorporating diverse divergence constraints. We show that under certain $f$-divergences, including Jensen-Shannon divergence, forward KL divergences and $\\alpha$-divergences, the complex relationship between the reward and optimal policy can also be simplified by addressing the Karush\u2013Kuhn\u2013Tucker conditions. This eliminates the need for estimating the normalizing constant in the Bradley-Terry model and enables a tractable mapping between the reward function and the optimal policy. Our approach optimizes LLMs to align with human preferences in a more efficient and supervised manner under a broad set of divergence constraints. Empirically, adopting these divergences ensures a balance between alignment performance and generation diversity. Importantly, our $f$-DPO outperforms PPO-based methods in divergence efficiency, and divergence constraints directly influence expected calibration error (ECE).", "keywords": "Large language models;Preference optimization;AI Alignment", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Chaoqi Wang;Yibo Jiang;Chenghao Yang;Han Liu;Yuxin Chen", "authorids": "~Chaoqi_Wang1;~Yibo_Jiang2;~Chenghao_Yang1;~Han_Liu12;~Yuxin_Chen1", "gender": "M;M;M;M;", "homepage": "https://alecwangcq.github.io;;https://yangalan123.github.io/;https://hanliuai.github.io;http://yuxinchen.org/", "dblp": "210/1073;54/2193;229/4179;35/2899;11/5123-1", "google_scholar": "https://scholar.google.ca/citations?user=yN2iRpwAAAAJ;hvQo2gQAAAAJ;B28fiOAAAAAJ;stdJOHwAAAAJ;-k1N7HAAAAAJ", "orcid": ";;;0009-0001-0434-9141;", "linkedin": ";;chenghao-yang-857b51178/;han-liu-347270ba/;", "or_profile": "~Chaoqi_Wang1;~Yibo_Jiang2;~Chenghao_Yang1;~Han_Liu12;~Yuxin_Chen1", "aff": "University of Chicago;University of Chicago;Google;University of Chicago;University of Chicago", "aff_domain": "uchicago.edu;uchicago.edu;google.com;uchicago.edu;uchicago.edu", "position": "PhD student;PhD student;Student Researcher;PhD student;Assistant Professor", "bibtex": "@inproceedings{\nwang2024beyond,\ntitle={Beyond Reverse {KL}: Generalizing Direct Preference Optimization with Diverse Divergence Constraints},\nauthor={Chaoqi Wang and Yibo Jiang and Chenghao Yang and Han Liu and Yuxin Chen},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=2cRzmWXK9N}\n}", "github": "", "project": "", "reviewers": "sLFR;AH62;GUwk;Lpy5", "pdf_size": 691534, "rating": "5;8;8;8", "confidence": "3;2;4;3", "soundness": "3;3;3;4", "contribution": "2;3;3;4", "presentation": "2;4;3;3", "wc_summary": "90;103;50;361", "wc_strengths": "122;73;32;50", "wc_weaknesses": "108;27;35;54", "wc_questions": "37;130;130;40", "wc_review": "357;333;247;505", "wc_reply_reviewers": "0;9;17;0", "wc_reply_authors": "905;414;550;88", "reply_reviewers": "0;1;1;0", "reply_authors": "2;1;1;1", "rating_avg": [ 7.25, 1.299038105676658 ], "confidence_avg": [ 3.0, 0.7071067811865476 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 3.0, 0.7071067811865476 ], "presentation_avg": [ 3.0, 
0.7071067811865476 ], "wc_summary_avg": [ 151.0, 122.80675877165719 ], "wc_strengths_avg": [ 69.25, 33.74444398712179 ], "wc_weaknesses_avg": [ 56.0, 31.583223394707513 ], "wc_questions_avg": [ 84.25, 45.7622934302904 ], "wc_review_avg": [ 360.5, 92.9125933337349 ], "wc_reply_reviewers_avg": [ 6.5, 7.088723439378913 ], "wc_reply_authors_avg": [ 489.25, 292.91754385833565 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 79, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=18160314555054778595&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=2cRzmWXK9N", "pdf": "https://openreview.net/pdf?id=2cRzmWXK9N", "email": "uchicago.edu;uchicago.edu;google.com;uchicago.edu;uchicago.edu", "author_num": 5, "aff_unique_index": "0;0;1;0;0", "aff_unique_norm": "University of Chicago;Google", "aff_unique_dep": ";Google", "aff_unique_url": "https://www.uchicago.edu;https://www.google.com", "aff_unique_abbr": "UChicago;Google", "aff_campus_unique_index": "1", "aff_campus_unique": ";Mountain View", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "2dHmhoWweE", "title": "Lookbehind Optimizer: k steps back, 1 step forward", "track": "main", "status": "Reject", "tldr": "", "abstract": "Sharpness-aware minimization (SAM) methods have gained increasing popularity by formulating the problem of minimizing both loss value and loss sharpness as a minimax objective. In this work, we increase the efficiency of the maximization and minimization parts of SAM's objective to achieve a better loss-sharpness trade-off. By taking inspiration from the Lookahead optimizer, which uses multiple descent steps ahead, we propose Lookbehind, which performs multiple ascent steps behind to enhance the maximization step of SAM and find a worst-case perturbation with higher loss. Then, to mitigate the variance in the descent step arising from the gathered gradients across the multiple ascent steps, we employ linear interpolation to refine the minimization step. Lookbehind leads to a myriad of benefits across a variety of tasks. 
Particularly, we show increased generalization performance, greater robustness against noisy weights, as well as improved learning and less catastrophic forgetting in lifelong learning settings.", "keywords": "Optimization;sharpness-aware minimization", "primary_area": "optimization", "supplementary_material": "", "author": "Goncalo Mordido;Pranshu Malviya;Aristide Baratin;Sarath Chandar", "authorids": "~Goncalo_Mordido1;~Pranshu_Malviya1;~Aristide_Baratin1;~Sarath_Chandar1", "gender": ";M;;M", "homepage": ";https://pranshu28.github.io/about/;;http://sarathchandar.in/", "dblp": ";;;45/8542", "google_scholar": ";;;https://scholar.google.co.in/citations?user=yxWtZLAAAAAJ", "orcid": ";;;", "linkedin": ";pranshumalviya2/;;", "or_profile": "~Goncalo_Mordido1;~Pranshu_Malviya1;~Aristide_Baratin1;~Sarath_Chandar1", "aff": ";\u00c9cole Polytechnique de Montr\u00e9al, Universit\u00e9 de Montr\u00e9al;;\u00c9cole Polytechnique de Montr\u00e9al", "aff_domain": ";polymtl.ca;;polymtl.ca", "position": ";PhD student;;Assistant Professor", "bibtex": "@misc{\nmordido2024lookbehind,\ntitle={Lookbehind Optimizer: k steps back, 1 step forward},\nauthor={Goncalo Mordido and Pranshu Malviya and Aristide Baratin and Sarath Chandar},\nyear={2024},\nurl={https://openreview.net/forum?id=2dHmhoWweE}\n}", "github": "", "project": "", "reviewers": "1aPq;aoaQ;tnTm;sgRK", "site": "https://openreview.net/forum?id=2dHmhoWweE", "pdf_size": 846970, "rating": "3;3;5;8", "confidence": "4;4;4;4", "soundness": "3;2;3;4", "contribution": "2;2;2;3", "presentation": "3;2;3;4", "wc_summary": "25;57;68;62", "wc_strengths": "11;50;144;77", "wc_weaknesses": "83;396;133;36", "wc_questions": "1;2;96;126", "wc_review": "120;505;441;301", "wc_reply_reviewers": "10;50;0;11", "wc_reply_authors": "294;784;441;331", "reply_reviewers": "1;1;0;1", "reply_authors": "1;2;1;1", "rating_avg": [ 4.75, 2.0463381929681126 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 53.0, 16.62828914831589 ], "wc_strengths_avg": [ 70.5, 48.48968962573384 ], "wc_weaknesses_avg": [ 162.0, 139.38615426217913 ], "wc_questions_avg": [ 56.25, 55.76905503951094 ], "wc_review_avg": [ 341.75, 147.76226683426322 ], "wc_reply_reviewers_avg": [ 17.75, 19.109879643786353 ], "wc_reply_authors_avg": [ 462.5, 193.33196838598627 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=18091060575552247786&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "\u00c9cole Polytechnique de Montr\u00e9al", "aff_unique_dep": "", "aff_unique_url": "https://www.polymtl.ca", "aff_unique_abbr": "Polytechnique Montr\u00e9al", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Montr\u00e9al", "aff_country_unique_index": "0;0", "aff_country_unique": "Canada" }, { "id": "2dLMPOY0HW", "title": "When Do MLPs Excel in Node Classification? An Information-Theoretic Perspective", "track": "main", "status": "Reject", "tldr": "", "abstract": "Recent research has shed light on the competitiveness of MLP-structured methods in node-level tasks. Nevertheless, there remains a gap in our understanding regarding why MLPs perform well and how their performance varies across different datasets. 
This paper addresses this lacuna by emphasizing mutual information\u2019s pivotal role in MLPs vs. GNNs performance variations. We first introduce a\ntractable metric to quantify the mutual information between node features and graph structure, based on which we observe different characteristics of various datasets, aligning with empirical results. Subsequently, we present InfoMLP, which optimizes node embeddings\u2019 mutual information with the graph\u2019s structure, i.e., the adjacency matrix. Our info-max objective comprises two sub-objectives: the first focuses on non-parametric reprocessing to identify the optimal graph-augmented node feature matrix that encapsulates the most graph-related information. The second sub-objective aims to enhance mutual information between node embeddings derived from the original node features and those from the graph-augmented features. This integration of message-passing during preprocessing maintains the efficiency of InfoMLP, ensuring it remains as efficient as a standard MLP during both training and testing. We validate the effectiveness of our approach through experiments on real-world datasets of varying scales supplemented by comprehensive ablation studies. Our results affirm our analysis and underscore the success of our innovative approach.", "keywords": "Node Representation Learning;Node Classification;Graph Neural Networks", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/5342fd19e23fbefff38906d822e4ce2323047093.zip", "author": "Hengrui Zhang;Qitian Wu;Chenxiao Yang;Junchi Yan;Philip S. Yu", "authorids": "~Hengrui_Zhang1;~Qitian_Wu1;~Chenxiao_Yang1;~Junchi_Yan2;~Philip_S._Yu1", "gender": "M;;;;M", "homepage": "https://hengruizhang98.github.io;;;;https://cs.uic.edu/profiles/philip-yu/", "dblp": ";;;;y/PhilipSYu", "google_scholar": "iwffiD0AAAAJ;;;;D0lL1r0AAAAJ", "orcid": "0009-0006-1330-0899;;;;0000-0002-3491-5968", "linkedin": ";;;;", "or_profile": "~Hengrui_Zhang1;~Qitian_Wu1;~Chenxiao_Yang1;~Junchi_Yan2;~Philip_S._Yu1", "aff": "University of Illinois, Chicago;;;;University of Illinois Chicago", "aff_domain": "uic.edu;;;;uic.edu", "position": "PhD student;;;;Full Professor", "bibtex": "@misc{\nzhang2024when,\ntitle={When Do {MLP}s Excel in Node Classification? An Information-Theoretic Perspective},\nauthor={Hengrui Zhang and Qitian Wu and Chenxiao Yang and Junchi Yan and Philip S. 
Yu},\nyear={2024},\nurl={https://openreview.net/forum?id=2dLMPOY0HW}\n}", "github": "", "project": "", "reviewers": "zabj;YPT6;o93U", "site": "https://openreview.net/forum?id=2dLMPOY0HW", "pdf_size": 4695346, "rating": "3;3;8", "confidence": "4;4;3", "soundness": "1;2;4", "contribution": "2;2;4", "presentation": "2;3;3", "wc_summary": "125;272;95", "wc_strengths": "117;12;101", "wc_weaknesses": "752;35;126", "wc_questions": "126;44;5", "wc_review": "1120;363;327", "wc_reply_reviewers": "203;0;78", "wc_reply_authors": "2207;1540;430", "reply_reviewers": "1;0;1", "reply_authors": "4;3;1", "rating_avg": [ 4.666666666666667, 2.357022603955158 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.3333333333333335, 1.247219128924647 ], "contribution_avg": [ 2.6666666666666665, 0.9428090415820634 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 164.0, 77.34339015067803 ], "wc_strengths_avg": [ 76.66666666666667, 46.19042709864843 ], "wc_weaknesses_avg": [ 304.3333333333333, 318.72070671496834 ], "wc_questions_avg": [ 58.333333333333336, 50.427065043376146 ], "wc_review_avg": [ 603.3333333333334, 365.6340003640556 ], "wc_reply_reviewers_avg": [ 93.66666666666667, 83.61153562092308 ], "wc_reply_authors_avg": [ 1392.3333333333333, 732.933072585 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 2.6666666666666665, 1.247219128924647 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.9999999999999998, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:UC-sMQy_S6wJ:scholar.google.com/&scioq=When+Do+MLPs+Excel+in+Node+Classification%3F+An+Information-Theoretic+Perspective&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "University of Illinois at Chicago", "aff_unique_dep": "", "aff_unique_url": "https://www.uic.edu", "aff_unique_abbr": "UIC", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Chicago", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "id": "2dYAbdXgpu", "title": "SimSCOOD: Systematic Analysis of Out-of-Distribution Generalization in Fine-tuned Source Code Models", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Large code datasets have become increasingly accessible for pre-training source code models. However, for the fine-tuning phase, obtaining representative training data that fully covers the code distribution for specific downstream tasks remains challenging due to the task-specific nature and limited labeling resources. Moreover, fine-tuning pretrained models can result in forgetting previously acquired pre-training knowledge. These lead to out-of-distribution (OOD) generalization issues with unexpected model inference behaviors that have not been systematically studied yet.\nIn this paper, we contribute the first systematic approach that simulates various OOD scenarios along different dimensions of source code data properties and study the fine-tuned model behaviors in such scenarios. We investigate the behaviors of models under different fine-tuning methodologies, including full fine-tuning and Low-Rank Adaptation (LoRA) fine-tuning methods. Our comprehensive analysis, conducted on four state-of-the-art pretrained models and applied to two code generation tasks, exposes multiple failure modes attributed to OOD generalization issues. 
Additionally, our analysis uncovers that LoRA fine-tuning consistently exhibits significantly better OOD generalization performance than full fine-tuning across various scenarios.", "keywords": "LLM for code generation;Out-of-distribution generalization;Pre-trained code models;Fine-tuned codeLLM", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "", "author": "Hossein Hajipour;Ning Yu;Cristian-Alexandru Staicu;Mario Fritz", "authorids": "~Hossein_Hajipour1;~Ning_Yu2;~Cristian-Alexandru_Staicu2;~Mario_Fritz1", "gender": "M;;M;M", "homepage": "https://cispa.de/en/people/hossein.hajipour;;http://www.staicu.org/;https://cispa.saarland/group/fritz/", "dblp": "125/1613;;;", "google_scholar": ";;JmpDeRQAAAAJ;https://scholar.google.de/citations?user=4V1nNm4AAAAJ", "orcid": ";;0000-0002-6542-2226;", "linkedin": ";;crstaicu/;", "or_profile": "~Hossein_Hajipour1;~Ning_Yu2;~Cristian-Alexandru_Staicu2;~Mario_Fritz1", "aff": "CISPA Helmholtz Center for Information Security;;CISPA Helmholtz Center for Information Security;Saarland University", "aff_domain": "cispa.saarland;;cispa.saarland;uni-saarland.de", "position": "PhD student;;Researcher;Full Professor", "bibtex": "@misc{\nhajipour2024simscood,\ntitle={Sim{SCOOD}: Systematic Analysis of Out-of-Distribution Generalization in Fine-tuned Source Code Models},\nauthor={Hossein Hajipour and Ning Yu and Cristian-Alexandru Staicu and Mario Fritz},\nyear={2024},\nurl={https://openreview.net/forum?id=2dYAbdXgpu}\n}", "github": "", "project": "", "reviewers": "fJQ1;9kMw;cCst;HtnZ", "site": "https://openreview.net/forum?id=2dYAbdXgpu", "pdf_size": 1056307, "rating": "5;5;5;5", "confidence": "4;4;3;3", "soundness": "3;2;2;3", "contribution": "2;1;2;2", "presentation": "3;3;3;3", "wc_summary": "53;33;117;96", "wc_strengths": "64;18;66;63", "wc_weaknesses": "191;88;160;262", "wc_questions": "4;25;7;21", "wc_review": "312;164;350;442", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "929;387;269;821", "reply_reviewers": "0;0;0;0", "reply_authors": "3;1;1;2", "rating_avg": [ 5.0, 0.0 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 74.75, 33.36446462930284 ], "wc_strengths_avg": [ 52.75, 20.09197601033806 ], "wc_weaknesses_avg": [ 175.25, 62.48749874974994 ], "wc_questions_avg": [ 14.25, 8.926785535678562 ], "wc_review_avg": [ 317.0, 100.18482919085105 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 601.5, 279.28614358754 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.75, 0.82915619758885 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 5, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=8603687437464787116&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 9, "aff_unique_index": "0;0;1", "aff_unique_norm": "CISPA Helmholtz Center for Information Security;Saarland University", "aff_unique_dep": ";", "aff_unique_url": "https://www.cispa.de/;https://www.uni-saarland.de", "aff_unique_abbr": "CISPA;UdS", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "Germany" }, { "title": "Function-space Parameterization of Neural Networks for Sequential Learning", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19542", "id": "2dhxxIKhqz", "author_site": "Aidan Scannell, Riccardo Mereu, Paul Chang, Ella Tamir, Joni 
Pajarinen, Arno Solin", "tldr": "", "abstract": "Sequential learning paradigms pose challenges for gradient-based deep learning due to difficulties incorporating new data and retaining prior knowledge. While Gaussian processes elegantly tackle these problems, they struggle with scalability and handling rich inputs, such as images. To address these issues, we introduce a technique that converts neural networks from weight space to function space, through a dual parameterization. Our parameterization offers: (*i*) a way to scale function-space methods to large data sets via sparsification, (*ii*) retention of prior knowledge when access to past data is limited, and (*iii*) a mechanism to incorporate new data without retraining. Our experiments demonstrate that we can retain knowledge in continual learning and incorporate new data efficiently. We further show its strengths in uncertainty quantification and guiding exploration in model-based RL. Further information and code is available on the project website.", "keywords": "Neural networks;Bayesian deep learning;deep learning;Gaussian processes;Laplace approximation;sequential learning", "primary_area": "probabilistic methods (Bayesian methods, variational inference, sampling, UQ, etc.)", "supplementary_material": "", "author": "Aidan Scannell;Riccardo Mereu;Paul Edmund Chang;Ella Tamir;Joni Pajarinen;Arno Solin", "authorids": "~Aidan_Scannell1;~Riccardo_Mereu1;~Paul_Edmund_Chang1;~Ella_Tamir1;~Joni_Pajarinen2;~Arno_Solin1", "gender": "M;M;M;;;", "homepage": "https://www.aidanscannell.com/;;https://research.aalto.fi/en/persons/paul-chang;;;http://arno.solin.fi", "dblp": "304/4471;318/1146;270/0387;;23/8355;98/11225", "google_scholar": "https://scholar.google.co.uk/citations?user=piA0zS4AAAAJ;UVziXI0AAAAJ;CLzK5SkAAAAJ;;https://scholar.google.fi/citations?user=-2fJStwAAAAJ;U_fJCnAAAAAJ", "orcid": ";0000-0002-8932-9341;;;0000-0003-4469-8191;0000-0002-0958-7886", "linkedin": "aidan-scannell-82522789/;riccardo-mereu-050248a1/;;;;asolin/", "or_profile": "~Aidan_Scannell1;~Riccardo_Mereu1;~Paul_Edmund_Chang1;~Ella_Tamir1;~Joni_Pajarinen2;~Arno_Solin1", "aff": "Aalto University;Aalto University;;;Aalto University;Aalto University", "aff_domain": "aalto.fi;aalto.fi;;;aalto.fi;aalto.fi", "position": "Postdoc;PhD student;;;Assistant Professor;Assistant Professor", "bibtex": "@inproceedings{\nscannell2024functionspace,\ntitle={Function-space Parameterization of Neural Networks for Sequential Learning},\nauthor={Aidan Scannell and Riccardo Mereu and Paul Edmund Chang and Ella Tamir and Joni Pajarinen and Arno Solin},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=2dhxxIKhqz}\n}", "github": "", "project": "", "reviewers": "C2Qu;7JfH;V1B4", "pdf_size": 2126191, "rating": "6;6;8", "confidence": "3;3;2", "soundness": "3;2;4", "contribution": "3;2;3", "presentation": "3;1;3", "wc_summary": "208;38;104", "wc_strengths": "77;20;83", "wc_weaknesses": "370;224;89", "wc_questions": "551;8;57", "wc_review": "1206;290;333", "wc_reply_reviewers": "54;85;0", "wc_reply_authors": "1289;824;336", "reply_reviewers": "1;1;0", "reply_authors": "3;2;1", "rating_avg": [ 6.666666666666667, 0.9428090415820634 ], "confidence_avg": [ 2.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 3.0, 0.816496580927726 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.3333333333333335, 0.9428090415820634 ], "wc_summary_avg": [ 116.66666666666667, 
69.97777424932069 ], "wc_strengths_avg": [ 60.0, 28.39013913315678 ], "wc_weaknesses_avg": [ 227.66666666666666, 114.74706483779396 ], "wc_questions_avg": [ 205.33333333333334, 245.2404715557546 ], "wc_review_avg": [ 609.6666666666666, 422.0365966227205 ], "wc_reply_reviewers_avg": [ 46.333333333333336, 35.122009560324926 ], "wc_reply_authors_avg": [ 816.3333333333334, 389.09838801459404 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 2.0, 0.816496580927726 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.9999999999999998, "gs_citation": 6, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11704751970787674703&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 8, "openreview": "https://openreview.net/forum?id=2dhxxIKhqz", "pdf": "https://openreview.net/pdf?id=2dhxxIKhqz", "email": "aalto.fi;aalto.fi;;;aalto.fi;aalto.fi", "author_num": 6, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "Aalto University", "aff_unique_dep": "", "aff_unique_url": "https://www.aalto.fi", "aff_unique_abbr": "Aalto", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "Finland" }, { "title": "Vision Transformers Need Registers", "status": "Oral", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19541", "id": "2dnO3LLiJ1", "author_site": "Timoth\u00e9e Darcet, Maxime Oquab, Julien Mairal, Piotr Bojanowski", "tldr": "", "abstract": "Transformers have recently emerged as a powerful tool for learning visual representations. In this paper, we identify and characterize artifacts in feature maps of both supervised and self-supervised ViT networks. The artifacts correspond to high-norm tokens appearing during inference primarily in low-informative background areas of images, that are repurposed for internal computations. We propose a simple yet effective solution based on providing additional tokens to the input sequence of the Vision Transformer to fill that role. 
We show that this solution fixes that problem entirely for both supervised and self-supervised models, sets a new state of the art for self-supervised visual models on dense visual prediction tasks, enables object discovery methods with larger models, and most importantly leads to smoother feature maps and attention maps for downstream visual processing.", "keywords": "representation;vision;transformer;register;SSL;CLIP;attention;attention map;interpretability;DINO;DINOv2", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Timoth\u00e9e Darcet;Maxime Oquab;Julien Mairal;Piotr Bojanowski", "authorids": "~Timoth\u00e9e_Darcet1;~Maxime_Oquab1;~Julien_Mairal1;~Piotr_Bojanowski1", "gender": "M;;;M", "homepage": "https://tim.darcet.fr;;http://julien.mairal.org;", "dblp": "344/5814;151/8880;49/6555;142/2542", "google_scholar": "G4qOJQEAAAAJ;https://scholar.google.fr/citations?user=5vteYV8AAAAJ;https://scholar.google.fr/citations?user=Bx9WGD6lBFEC;https://scholar.google.fr/citations?user=lJ_oh2EAAAAJ", "orcid": ";;;", "linkedin": "timdarcet/;;;piotr-bojanowski-9a94402a", "or_profile": "~Timoth\u00e9e_Darcet1;~Maxime_Oquab1;~Julien_Mairal1;~Piotr_Bojanowski1", "aff": "Meta;Meta;Inria;Meta", "aff_domain": "meta.com;meta.com;inria.fr;meta.com", "position": "PhD student;Research Scientist;Research Scientist;Researcher", "bibtex": "@inproceedings{\ndarcet2024vision,\ntitle={Vision Transformers Need Registers},\nauthor={Timoth{\\'e}e Darcet and Maxime Oquab and Julien Mairal and Piotr Bojanowski},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=2dnO3LLiJ1}\n}", "github": "", "project": "", "reviewers": "mTMB;KSLu;GGy7;eoPK", "pdf_size": 5953026, "rating": "8;8;8;8", "confidence": "4;4;4;3", "soundness": "3;3;3;3", "contribution": "4;3;4;3", "presentation": "4;4;4;3", "wc_summary": "169;91;160;118", "wc_strengths": "88;67;208;69", "wc_weaknesses": "179;257;127;56", "wc_questions": "393;3;83;42", "wc_review": "829;418;578;285", "wc_reply_reviewers": "591;0;0;0", "wc_reply_authors": "1164;658;780;316", "reply_reviewers": "1;0;0;0", "reply_authors": "2;1;1;1", "rating_avg": [ 8.0, 0.0 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 3.5, 0.5 ], "presentation_avg": [ 3.75, 0.4330127018922193 ], "wc_summary_avg": [ 134.5, 31.64253466459348 ], "wc_strengths_avg": [ 108.0, 58.31380625546578 ], "wc_weaknesses_avg": [ 154.75, 73.42470633240558 ], "wc_questions_avg": [ 130.25, 154.31360115038467 ], "wc_review_avg": [ 527.5, 202.63822442964704 ], "wc_reply_reviewers_avg": [ 147.75, 255.91050681830163 ], "wc_reply_authors_avg": [ 729.5, 303.082084590957 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 360, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=7001609497646764111&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 11, "openreview": "https://openreview.net/forum?id=2dnO3LLiJ1", "pdf": "https://openreview.net/pdf?id=2dnO3LLiJ1", "email": "meta.com;meta.com;inria.fr;meta.com", "author_num": 4, "aff_unique_index": "0;0;1;0", "aff_unique_norm": "Meta;INRIA", "aff_unique_dep": "Meta Platforms, Inc.;", "aff_unique_url": "https://meta.com;https://www.inria.fr", "aff_unique_abbr": "Meta;Inria", 
"aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;1;0", "aff_country_unique": "United States;France" }, { "id": "2drC319yHQ", "title": "RepoFusion: Training Code Models to Understand Your Repository", "track": "main", "status": "Reject", "tldr": "", "abstract": "Despite the huge success of Large Language Models (LLMs) in coding assistants like GitHub Copilot, these models struggle to understand the context present in the repository (e.g., imports, parent classes, files with similar names, etc.), thereby producing inaccurate code completions. This effect is more pronounced when using these assistants for repositories that the model has not seen during training, such as proprietary software or work-in-progress code projects. Recent work has shown the promise of using context from the repository during inference. In this work, we extend this idea and propose \\emph{RepoFusion}, a framework to train models to incorporate relevant repository context. Experiments on single-line code completion show that our models trained with repository context significantly outperform much larger code models as CodeGen-16B-multi ($\\sim73\\times$ larger) and closely match the performance of the $\\sim 70\\times$ larger StarCoderBase model that was trained with the Fill-in-the-Middle objective. We find these results to be a novel and compelling demonstration of the gains that training with repository context can bring. We carry out extensive ablation studies to investigate the impact of design choices such as context type, number of contexts, context length, and initialization within our framework. Lastly, we release a dataset for code completion with repository context to facilitate further research in this domain.", "keywords": "large language models of code;long context;repository;code completion;source code;LLM;retrieval", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/6de0d88c748b9c572e7a27a6f1dd2b4ba9b4d32d.pdf", "author": "Disha Shrivastava;Denis Kocetkov;Harm de Vries;Dzmitry Bahdanau;Torsten Scholak", "authorids": "~Disha_Shrivastava1;~Denis_Kocetkov1;~Harm_de_Vries1;~Dzmitry_Bahdanau1;~Torsten_Scholak1", "gender": "F;M;M;M;M", "homepage": "https://shrivastavadisha.github.io/;;;https://tscholak.github.com;https://uk.linkedin.com/in/denis-kochetkov-14290213", "dblp": "203/9100;;151/6504;277/0957;", "google_scholar": "https://scholar.google.co.in/citations?user=7R8dnlUAAAAJ;LWrdpCsAAAAJ;https://scholar.google.ca/citations?user=Nq0dVMcAAAAJ;https://scholar.google.ca/citations?user=BgkjtKgAAAAJ;", "orcid": ";;;;", "linkedin": "disha-shrivastava-8398a212/;;;tscholak;", "or_profile": "~Disha_Shrivastava1;~Harm_de_Vries1;~Dzmitry_Bahdanau1;~Torsten_Scholak1;~Denis_Kochetkov1", "aff": "Google;ServiceNow Research;ServiceNow Research;ServiceNow Research;ServiceNow Research", "aff_domain": "deepmind.com;elementai.com;servicenow.com;servicenow.com;servicenow.com", "position": "Researcher;Researcher;Research Scientist;Researcher;Software engineer", "bibtex": "@misc{\nshrivastava2024repofusion,\ntitle={RepoFusion: Training Code Models to Understand Your Repository},\nauthor={Disha Shrivastava and Denis Kocetkov and Harm de Vries and Dzmitry Bahdanau and Torsten Scholak},\nyear={2024},\nurl={https://openreview.net/forum?id=2drC319yHQ}\n}", "github": "", "project": "", "reviewers": "U4U4;hziX;Ar6w", "site": "https://openreview.net/forum?id=2drC319yHQ", "pdf_size": 632352, "rating": 
"3;3;6", "confidence": "3;4;4", "soundness": "1;3;3", "contribution": "2;1;3", "presentation": "4;3;3", "wc_summary": "257;204;107", "wc_strengths": "83;48;77", "wc_weaknesses": "194;120;268", "wc_questions": "65;150;9", "wc_review": "599;522;461", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 4.0, 1.4142135623730951 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.3333333333333335, 0.9428090415820634 ], "contribution_avg": [ 2.0, 0.816496580927726 ], "presentation_avg": [ 3.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 189.33333333333334, 62.10922278982048 ], "wc_strengths_avg": [ 69.33333333333333, 15.2825245151302 ], "wc_weaknesses_avg": [ 194.0, 60.42074698865172 ], "wc_questions_avg": [ 74.66666666666667, 57.96742380184082 ], "wc_review_avg": [ 527.3333333333334, 56.46434469842205 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.5, "gs_citation": 30, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14668583810301525263&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 4, "aff_unique_index": "0;1;1;1;1", "aff_unique_norm": "Google;ServiceNow", "aff_unique_dep": "Google;Research", "aff_unique_url": "https://www.google.com;https://www.servicenow.com", "aff_unique_abbr": "Google;ServiceNow", "aff_campus_unique_index": "0", "aff_campus_unique": "Mountain View;", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "2eBx1b9C4y", "title": "Detecting Deepfakes Without Seeing Any", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Deepfake attacks, malicious manipulation of media containing people, are a serious concern for society. Conventional deepfake detection methods train supervised classifiers to distinguish real media from previously encountered deepfakes. Such techniques can only detect deepfakes similar to those previously seen, but not zero-day (previously unseen) attack types. As current deepfake generation techniques are changing at a breathtaking pace, new attack types are proposed frequently, making this a major issue. Our main observations are that: i) in many effective deepfake attacks, the fake media must be accompanied by false facts i.e. claims about the identity, speech, motion, or appearance of the person. For instance, when impersonating Obama, the attacker explicitly or implicitly claims that the fake media show Obama; ii) current generative techniques cannot perfectly synthesize the false facts claimed by the attacker. We therefore introduce the concept of \u201cfact checking\u201d, adapted from fake news detection, for detecting zero-day deepfake attacks. Fact checking verifies that the claimed facts (e.g. identity is Obama), agree with the observed media (e.g. is the face really Obama\u2019s?), and thus can differentiate between real and fake media. Consequently, we introduce FACTOR, a practical recipe for deepfake fact checking and demonstrate its power in critical attack settings: face swapping and audio-visual synthesis. 
Although it is training-free, relies exclusively on off-the-shelf features, is very easy to implement, and does not see any deepfakes, it achieves better than state-of-the-art accuracy.", "keywords": "deepfake detection", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/9d0f343ff294b32e2d6bbeef144963c75cc0ad29.zip", "author": "Tal Reiss;Bar Cavia;Yedid Hoshen", "authorids": "~Tal_Reiss1;~Bar_Cavia1;~Yedid_Hoshen3", "gender": "M;M;M", "homepage": ";;https://www.cs.huji.ac.il/~ydidh/", "dblp": "276/6114;;136/0280", "google_scholar": "sgMIT6EAAAAJ;https://scholar.google.com/citations?hl=en;https://scholar.google.co.il/citations?user=6y1-qS4AAAAJ", "orcid": ";;", "linkedin": ";bar-cavia;", "or_profile": "~Tal_Reiss1;~Bar_Cavia1;~Yedid_Hoshen3", "aff": "Hebrew University of Jerusalem;Hebrew University, Hebrew University of Jerusalem;Google", "aff_domain": "huji.ac.il;cs.huji.ac.il;google.com", "position": "PhD student;Undergrad student;Researcher", "bibtex": "@misc{\nreiss2024detecting,\ntitle={Detecting Deepfakes Without Seeing Any},\nauthor={Tal Reiss and Bar Cavia and Yedid Hoshen},\nyear={2024},\nurl={https://openreview.net/forum?id=2eBx1b9C4y}\n}", "github": "", "project": "", "reviewers": "y1v2;pkUE;cJQS", "site": "https://openreview.net/forum?id=2eBx1b9C4y", "pdf_size": 3296304, "rating": "3;5;8", "confidence": "4;4;5", "soundness": "1;2;3", "contribution": "2;2;3", "presentation": "1;3;3", "wc_summary": "88;149;149", "wc_strengths": "16;143;107", "wc_weaknesses": "329;455;119", "wc_questions": "6;154;101", "wc_review": "439;901;476", "wc_reply_reviewers": "553;0;0", "wc_reply_authors": "1150;980;415", "reply_reviewers": "1;0;0", "reply_authors": "4;3;1", "rating_avg": [ 5.333333333333333, 2.0548046676563256 ], "confidence_avg": [ 4.333333333333333, 0.4714045207910317 ], "soundness_avg": [ 2.0, 0.816496580927726 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.3333333333333335, 0.9428090415820634 ], "wc_summary_avg": [ 128.66666666666666, 28.75567576825293 ], "wc_strengths_avg": [ 88.66666666666667, 53.443635937520405 ], "wc_weaknesses_avg": [ 301.0, 138.59292911256333 ], "wc_questions_avg": [ 87.0, 61.22635598062869 ], "wc_review_avg": [ 605.3333333333334, 209.612870682016 ], "wc_reply_reviewers_avg": [ 184.33333333333334, 260.6866999974405 ], "wc_reply_authors_avg": [ 848.3333333333334, 314.1744030877683 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 2.6666666666666665, 1.247219128924647 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.9176629354822472, "gs_citation": 17, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=2813304515057723632&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "aff_unique_index": "0;0;1", "aff_unique_norm": "Hebrew University of Jerusalem;Google", "aff_unique_dep": ";Google", "aff_unique_url": "https://www.huji.ac.il;https://www.google.com", "aff_unique_abbr": "HUJI;Google", "aff_campus_unique_index": "0;2", "aff_campus_unique": "Jerusalem;;Mountain View", "aff_country_unique_index": "0;0;1", "aff_country_unique": "Israel;United States" }, { "id": "2eG9w9CeSY", "title": "EventCLIP: Adapting CLIP for Event-based Object Recognition", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Recent advances in zero-shot and few-shot classification heavily rely on the success of pre-trained vision-language models (VLMs) such 
as CLIP.\nDue to a shortage of large-scale datasets, training such models for event camera data remains infeasible.\nThus, adapting existing models across modalities is an important research challenge.\nIn this work, we introduce EventCLIP, a novel approach that utilizes CLIP for zero-shot and few-shot event-based object recognition.\nWe first generalize CLIP's image encoder to event data by converting raw events to 2D grid-based representations.\nTo further enhance performance, we propose a feature adapter to aggregate temporal information over event frames and refine text embeddings to better align with the visual inputs.\nWe evaluate EventCLIP on N-Caltech, N-Cars, and N-ImageNet datasets, achieving state-of-the-art few-shot performance.\nWhen fine-tuned on the entire dataset, our method outperforms all existing event classifiers.\nMoreover, we explore practical applications of EventCLIP including robust event classification and label-free event recognition, where our approach surpasses previous baselines designed specifically for these tasks.", "keywords": "event-based vision;CLIP;few-shot learning", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "", "author": "Ziyi Wu;Xudong Liu;Igor Gilitschenski", "authorids": "~Ziyi_Wu1;~Xudong_Liu10;~Igor_Gilitschenski1", "gender": "M;M;M", "homepage": "https://wuziyi616.github.io/;;https://www.gilitschenski.org/igor", "dblp": "217/8678;;129/1281", "google_scholar": "iopH6wIAAAAJ;VK2CEbgAAAAJ;Nuw1Y4oAAAAJ", "orcid": "0000-0002-8247-5872;0000-0002-5286-4826;", "linkedin": ";xudong-frank-liu-566513198/;igorgilitschenski/", "or_profile": "~Ziyi_Wu1;~Xudong_Liu10;~Igor_Gilitschenski1", "aff": "Google;University of Toronto;University of Toronto", "aff_domain": "google.com;utoronto.ca;toronto.edu", "position": "Intern;MS student;Assistant Professor", "bibtex": "@misc{\nwu2024eventclip,\ntitle={Event{CLIP}: Adapting {CLIP} for Event-based Object Recognition},\nauthor={Ziyi Wu and Xudong Liu and Igor Gilitschenski},\nyear={2024},\nurl={https://openreview.net/forum?id=2eG9w9CeSY}\n}", "github": "", "project": "", "reviewers": "rcqs;KXch;rCwv;RBgA;FLiL;4a2f", "site": "https://openreview.net/forum?id=2eG9w9CeSY", "pdf_size": 3998324, "rating": "3;3;3;3;5;6", "confidence": "4;4;5;3;2;4", "soundness": "3;2;3;3;3;3", "contribution": "2;1;2;3;2;3", "presentation": "3;1;2;3;3;3", "wc_summary": "160;74;49;66;67;42", "wc_strengths": "43;31;44;28;55;85", "wc_weaknesses": "123;129;163;47;174;55", "wc_questions": "70;268;16;13;80;46", "wc_review": "396;502;272;154;376;228", "wc_reply_reviewers": "0;0;0;0;0;0", "wc_reply_authors": "0;0;0;0;0;0", "reply_reviewers": "0;0;0;0;0;0", "reply_authors": "0;0;0;0;0;0", "rating_avg": [ 3.8333333333333335, 1.2133516482134197 ], "confidence_avg": [ 3.6666666666666665, 0.9428090415820634 ], "soundness_avg": [ 2.8333333333333335, 0.3726779962499649 ], "contribution_avg": [ 2.1666666666666665, 0.6871842709362768 ], "presentation_avg": [ 2.5, 0.7637626158259734 ], "wc_summary_avg": [ 76.33333333333333, 38.99857547255911 ], "wc_strengths_avg": [ 47.666666666666664, 18.91795149821695 ], "wc_weaknesses_avg": [ 115.16666666666667, 48.76616541095772 ], "wc_questions_avg": [ 82.16666666666667, 86.75332206255212 ], "wc_review_avg": [ 321.3333333333333, 115.72188883506679 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 6, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 
-0.33995005182504245, "gs_citation": 21, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=8551387232150929775&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 3, "aff_unique_index": "0;1;1", "aff_unique_norm": "Google;University of Toronto", "aff_unique_dep": "Google;", "aff_unique_url": "https://www.google.com;https://www.utoronto.ca", "aff_unique_abbr": "Google;U of T", "aff_campus_unique_index": "0", "aff_campus_unique": "Mountain View;", "aff_country_unique_index": "0;1;1", "aff_country_unique": "United States;Canada" }, { "id": "2eIembMRQJ", "title": "Active Teacher Selection for Reinforcement Learning from Human Feedback", "track": "main", "status": "Reject", "tldr": "", "abstract": "Reinforcement learning from human feedback (RLHF) enables machine learning systems to learn objectives from human feedback. A core limitation of these systems is their assumption that all feedback comes from a single human teacher, despite querying a range of distinct teachers. We propose the Hidden Utility Bandit (HUB) framework to model differences in teacher rationality, expertise, and costliness, formalizing the problem of learning from multiple teachers. We develop a variety of solution algorithms and apply them to two real-world domains: paper recommendation systems and COVID-19 vaccine testing. We find that the Active Teacher Selection (ATS) algorithm outperforms baseline algorithms by actively selecting when and which teacher to query. The HUB framework and ATS algorithm demonstrate the importance of leveraging differences between teachers to learn accurate reward models, facilitating future research on active teacher selection for robust reward modeling.", "keywords": "reward modeling;preference learning;active learning", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/6fe8d4fb1d66fb183f9cec01091d7878bf5e8524.pdf", "author": "Rachel Freedman;Justin Svegliato;Kyle Hollins Wray;Stuart Russell", "authorids": "~Rachel_Freedman1;~Justin_Svegliato2;~Kyle_Hollins_Wray1;~Stuart_Russell1", "gender": "F;M;;M", "homepage": "https://rachelfreedman.github.io/;https://www.justinsvegliato.com/;;https://people.eecs.berkeley.edu/~russell/", "dblp": "218/7198;133/5067.html;;", "google_scholar": "Mj1fmhsAAAAJ;3Orv6wUAAAAJ;;https://scholar.google.com.tw/citations?user=KJGrjCAAAAAJ", "orcid": "0000-0003-3299-4313;;;", "linkedin": "rachelalexfreedman/;;;", "or_profile": "~Rachel_Freedman1;~Justin_Svegliato2;~Kyle_Hollins_Wray1;~Stuart_Russell1", "aff": "University of California, Berkeley;Microsoft;;University of California, Berkeley", "aff_domain": "berkeley.edu;microsoft.com;;berkeley.edu", "position": "PhD student;Senior Research Scientist;;Full Professor", "bibtex": "@misc{\nfreedman2024active,\ntitle={Active Teacher Selection for Reinforcement Learning from Human Feedback},\nauthor={Rachel Freedman and Justin Svegliato and Kyle Hollins Wray and Stuart Russell},\nyear={2024},\nurl={https://openreview.net/forum?id=2eIembMRQJ}\n}", "github": "", "project": "", "reviewers": "eqU7;9GWq;szYk;WRYj", "site": "https://openreview.net/forum?id=2eIembMRQJ", "pdf_size": 4152774, "rating": "5;5;5;6", "confidence": "4;4;5;3", "soundness": "3;2;3;3", "contribution": "2;2;2;3", "presentation": "3;2;3;3", "wc_summary": "84;71;79;70", "wc_strengths": "81;107;42;186", "wc_weaknesses": "560;102;183;271", "wc_questions": "42;6;61;49", "wc_review": "767;286;365;576", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "697;238;378;278", 
"reply_reviewers": "0;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 5.25, 0.4330127018922193 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 76.0, 5.787918451395113 ], "wc_strengths_avg": [ 104.0, 52.69250421075089 ], "wc_weaknesses_avg": [ 279.0, 172.8944764878277 ], "wc_questions_avg": [ 39.5, 20.5 ], "wc_review_avg": [ 498.5, 187.80109158362205 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 397.75, 180.13935577768675 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.816496580927726, "gs_citation": 8, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=7957453272223164376&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 6, "aff_unique_index": "0;1;0", "aff_unique_norm": "University of California, Berkeley;Microsoft", "aff_unique_dep": ";Microsoft Corporation", "aff_unique_url": "https://www.berkeley.edu;https://www.microsoft.com", "aff_unique_abbr": "UC Berkeley;Microsoft", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Berkeley;", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "2fSyBPBfBs", "title": "Bilevel Optimization without Lower-Level Strong Convexity from the Hyper-Objective Perspective", "track": "main", "status": "Reject", "tldr": "", "abstract": "Bilevel optimization reveals the inner structure of otherwise oblique optimization problems, such as hyperparameter tuning, neural architecture search, and meta-learning. A common goal in bilevel optimization is to find stationary points of the hyper-objective function. \nAlthough this hyper-objective approach is widely used, its theoretical properties have not been thoroughly investigated in cases where the lower-level functions lack strong convexity. \nThis work takes a step forward when the typical lower-level strong convexity assumption is absent.\nOur hardness results show that bilevel optimization for general convex lower-level functions is intractable to solve. 
\nWe then identify several regularity conditions of the lower-level\nproblems that can provably confer tractability.\nUnder these conditions, we propose the Inexact Gradient-Free Method (IGFM), which uses the Switching Gradient Method (SGM) as an efficient sub-routine, to find an approximate stationary point of the hyper-objective in polynomial time.", "keywords": "Bilevel Optimization", "primary_area": "learning theory", "supplementary_material": "/attachment/c4595614af34254d30a971187804019f05351e45.pdf", "author": "Lesi Chen;Jing Xu;Jingzhao Zhang", "authorids": "~Lesi_Chen1;~Jing_Xu4;~Jingzhao_Zhang2", "gender": "M;M;M", "homepage": "https://truenobility303.github.io/;https://jingxuthu.github.io;https://sites.google.com/view/jingzhao/home", "dblp": "326/5433;07/1951-27;220/5559", "google_scholar": "ynGzhugAAAAJ;jlrroGQAAAAJ;8NudxYsAAAAJ", "orcid": ";;", "linkedin": ";;", "or_profile": "~Lesi_Chen1;~Jing_Xu4;~Jingzhao_Zhang2", "aff": "Tsinghua Univeristy;Tsinghua University;Tsinghua University", "aff_domain": "mails.tsinghua.edu.cn;thu.edu.cn;mail.tsinghua.edu.cn", "position": "PhD student;PhD student;Assistant Professor", "bibtex": "@misc{\nchen2024bilevel,\ntitle={Bilevel Optimization without Lower-Level Strong Convexity from the Hyper-Objective Perspective},\nauthor={Lesi Chen and Jing Xu and Jingzhao Zhang},\nyear={2024},\nurl={https://openreview.net/forum?id=2fSyBPBfBs}\n}", "github": "", "project": "", "reviewers": "f4Tk;y92G;ShQk;V1pU;9BLf;Z4XB", "site": "https://openreview.net/forum?id=2fSyBPBfBs", "pdf_size": 291045, "rating": "3;3;3;5;5;6", "confidence": "2;3;3;3;3;3", "soundness": "2;2;2;3;3;2", "contribution": "2;2;2;2;3;3", "presentation": "2;3;2;3;3;3", "wc_summary": "16;80;44;103;48;60", "wc_strengths": "23;69;22;169;32;56", "wc_weaknesses": "83;217;63;315;135;201", "wc_questions": "7;370;813;4;37;33", "wc_review": "129;736;942;591;252;350", "wc_reply_reviewers": "0;0;57;0;0;0", "wc_reply_authors": "203;349;323;162;276;87", "reply_reviewers": "0;0;1;0;0;0", "reply_authors": "1;1;1;1;1;1", "rating_avg": [ 4.166666666666667, 1.2133516482134197 ], "confidence_avg": [ 2.8333333333333335, 0.3726779962499649 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 58.5, 27.602838018339103 ], "wc_strengths_avg": [ 61.833333333333336, 50.91632569443932 ], "wc_weaknesses_avg": [ 169.0, 86.0542464572977 ], "wc_questions_avg": [ 210.66666666666666, 298.3592167542713 ], "wc_review_avg": [ 500.0, 283.1330664781726 ], "wc_reply_reviewers_avg": [ 9.5, 21.242645786248 ], "wc_reply_authors_avg": [ 233.33333333333334, 91.88882171165085 ], "reply_reviewers_avg": [ 0.16666666666666666, 0.372677996249965 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.43000658178376594, "gs_citation": 17, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5733103613312067356&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 2, "aff_unique_index": "0;0;0", "aff_unique_norm": "Tsinghua University", "aff_unique_dep": "", "aff_unique_url": "https://www.tsinghua.edu.cn", "aff_unique_abbr": "THU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "China" }, { "id": "2gMwe9Duc4", "title": "Neuroexplicit Diffusion Models for Inpainting of Optical Flow Fields", "track": "main", "status": "Withdraw", "tldr": "", "abstract": 
"Deep learning has revolutionized the field of computer vision by introducing large scale neural networks with millions of parameters. \nTraining these networks requires massive datasets and leads to intransparent models that can fail to generalize.\nAt the other extreme, models designed from partial differential equations (PDEs) embed specialized domain knowledge into mathematical equations and usually rely on few manually chosen hyperparameters.\nThis makes them transparent by construction and if designed and calibrated carefully, they can generalize well to unseen scenarios. In this paper, we show how to bring model- and data-driven approaches together by combining the explicit PDE-based approaches with convolutional neural networks to obtain the best of both worlds. \nWe illustrate a joint architecture for the task of inpainting optical flow fields and show that the combination of model- and data-driven modeling leads to an effective architecture.\nOur model outperforms both fully explicit and fully data-driven baselines in terms of reconstruction quality, robustness and amount of required training data. \nAveraging the endpoint error across different mask densities, our method outperforms the explicit baseline by $27.12$%, the GAN baseline by $46.72$% and the Probabilisitic Diffusion baseline by $42.38$%.", "keywords": "Deep Learning;Diffusion;Inpainting;Optical Flow;Neuroexplicit", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Tom Fischer;Pascal Peter;Joachim Weickert;Eddy Ilg", "authorids": "~Tom_Fischer1;~Pascal_Peter1;~Joachim_Weickert1;~Eddy_Ilg3", "gender": "M;M;M;M", "homepage": "https://cvmp.cs.uni-saarland.de/people/#tom-fischer;https://www.mia.uni-saarland.de/peter/index.shtml;https://www.mia.uni-saarland.de/weickert/index.shtml;https://www.utn.de/departments/department-engineering/cvmp-lab/", "dblp": ";134/3090;w/JoachimWeickert.html;151/9307", "google_scholar": "idj3nF4AAAAJ;y4TcrHUAAAAJ;IWwCuGAAAAAJ;MYvSvGsAAAAJ", "orcid": "0009-0009-6776-2767;;;", "linkedin": "https://linkedin.com/in/tom-fischer-6209a2239;pascal-peter/;;eddy-ilg/", "or_profile": "~Tom_Fischer1;~Pascal_Peter1;~Joachim_Weickert1;~Eddy_Ilg3", "aff": "Universit\u00e4t des Saarlandes;Universit\u00e4t des Saarlandes;Universit\u00e4t des Saarlandes;Universit\u00e4t des Saarlandes", "aff_domain": "uni-saarland.de;uni-saarland.de;uni-saarland.de;uni-saarland.de", "position": "PhD student;Lecturer;Professor;Associate Professor", "bibtex": "@misc{\nanonymous2024neuroexplicit,\ntitle={Neuroexplicit Diffusion Models for Inpainting of Optical Flow Fields},\nauthor={Anonymous},\nyear={2024},\nurl={https://openreview.net/forum?id=2gMwe9Duc4}\n}", "github": "", "project": "", "reviewers": "cyeS;3rtj;BStA", "site": "https://openreview.net/forum?id=2gMwe9Duc4", "pdf_size": 6585006, "rating": "3;5;6", "confidence": "3;3;4", "soundness": "2;3;4", "contribution": "2;3;4", "presentation": "2;3;4", "wc_summary": "39;66;65", "wc_strengths": "51;27;113", "wc_weaknesses": "187;48;141", "wc_questions": "14;286;7", "wc_review": "291;427;326", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "621;1053;618", "reply_reviewers": "0;0;0", "reply_authors": "1;2;1", "rating_avg": [ 4.666666666666667, 1.247219128924647 ], "confidence_avg": [ 3.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 3.0, 0.816496580927726 ], "contribution_avg": [ 3.0, 0.816496580927726 ], "presentation_avg": [ 3.0, 0.816496580927726 ], "wc_summary_avg": [ 
56.666666666666664, 12.498888839501783 ], "wc_strengths_avg": [ 63.666666666666664, 36.23380864453651 ], "wc_weaknesses_avg": [ 125.33333333333333, 57.81772123569805 ], "wc_questions_avg": [ 102.33333333333333, 129.90338290009578 ], "wc_review_avg": [ 348.0, 57.659922534345 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 764.0, 204.35752983435674 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.3333333333333333, 0.4714045207910317 ], "replies_avg": [ 10, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.7559289460184545, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:UscZFzNJEpgJ:scholar.google.com/&scioq=Neuroexplicit+Diffusion+Models+for+Inpainting+of+Optical+Flow+Fields&hl=en&as_sdt=0,5", "gs_version_total": 6, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "Universit\u00e4t des Saarlandes", "aff_unique_dep": "", "aff_unique_url": "https://www.uni-saarland.de", "aff_unique_abbr": "UDS", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "Germany" }, { "id": "2gwo9cjOEz", "title": "Neural Tangent Kernels Motivate Graph Neural Networks with Cross-Covariance Graphs", "track": "main", "status": "Reject", "tldr": "", "abstract": "Neural tangent kernels (NTKs) provide a theoretical regime to analyze the learning and generalization behavior of over-parametrized neural networks. For a supervised learning task, the association between the eigenvectors of the NTK kernel and given data (a concept referred to as \\emph{alignment} in this paper) can govern the rate of convergence of gradient descent, as well as generalization to unseen data. Building upon this concept, we investigate NTKs and alignment in the context of graph neural networks (GNNs), where our analysis reveals that optimizing alignment translates to optimizing the graph representation or the graph shift operator in a GNN. Our results further establish the theoretical guarantees on the optimality of the alignment for a two-layer GNN and these guarantees are characterized by the graph shift operator being a function of the \\emph{cross-covariance} between the input and the output data. The theoretical insights drawn from the analysis of NTKs are validated by our experiments focused on a multi-variate time series prediction task for a publicly available dataset. 
Specifically, they demonstrate that GNNs with cross-covariance as the graph shift operator indeed outperform those that operate on the covariance matrix from only the input data.", "keywords": "Neural Tangent Kernel;Graph Neural Networks;Cross-covariance;Convergence;Generalization", "primary_area": "learning theory", "supplementary_material": "/attachment/29a863ab7cf611de377bbd77b52ecbccb44bd74a.zip", "author": "Shervin Khalafi;Saurabh Sihag;Alejandro Ribeiro", "authorids": "~Shervin_Khalafi1;~Saurabh_Sihag1;~Alejandro_Ribeiro1", "gender": "M;M;M", "homepage": "https://shervinkhalafi.github.io/;https://sihags.github.io/;https://alelab.seas.upenn.edu", "dblp": ";172/0928;32/15", "google_scholar": "rdfxlq8AAAAJ;T8D94-QAAAAJ;7mrPM4kAAAAJ", "orcid": ";;0000-0003-4230-9906", "linkedin": "shervin-khalafi-316b03221/;;", "or_profile": "~Shervin_Khalafi1;~Saurabh_Sihag1;~Alejandro_Ribeiro1", "aff": "University of Pennsylvania;University of Pennsylvania;University of Pennsylvania", "aff_domain": "upenn.edu;upenn.edu;upenn.edu", "position": "PhD student;Postdoc;Full Professor", "bibtex": "@misc{\nkhalafi2024neural,\ntitle={Neural Tangent Kernels Motivate Graph Neural Networks with Cross-Covariance Graphs},\nauthor={Shervin Khalafi and Saurabh Sihag and Alejandro Ribeiro},\nyear={2024},\nurl={https://openreview.net/forum?id=2gwo9cjOEz}\n}", "github": "", "project": "", "reviewers": "bUqG;TKzH;GUVA", "site": "https://openreview.net/forum?id=2gwo9cjOEz", "pdf_size": 1975007, "rating": "5;5;8", "confidence": "3;4;3", "soundness": "3;2;3", "contribution": "3;2;3", "presentation": "2;3;3", "wc_summary": "126;122;76", "wc_strengths": "81;50;64", "wc_weaknesses": "104;238;60", "wc_questions": "67;202;33", "wc_review": "378;612;233", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "510;944;524", "reply_reviewers": "0;0;0", "reply_authors": "1;2;1", "rating_avg": [ 6.0, 1.4142135623730951 ], "confidence_avg": [ 3.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 108.0, 22.686266036231405 ], "wc_strengths_avg": [ 65.0, 12.675435561221029 ], "wc_weaknesses_avg": [ 134.0, 75.70116687784058 ], "wc_questions_avg": [ 100.66666666666667, 72.98553890250376 ], "wc_review_avg": [ 407.6666666666667, 156.141673560335 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 659.3333333333334, 201.37085743031992 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.3333333333333333, 0.4714045207910317 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.5, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:2cSkFMEzNBsJ:scholar.google.com/&scioq=Neural+Tangent+Kernels+Motivate+Graph+Neural+Networks+with+Cross-Covariance+Graphs&hl=en&as_sdt=0,33", "gs_version_total": 4, "aff_unique_index": "0;0;0", "aff_unique_norm": "University of Pennsylvania", "aff_unique_dep": "", "aff_unique_url": "https://www.upenn.edu", "aff_unique_abbr": "UPenn", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "2h3m61LFWL", "title": "Value-Biased Maximum Likelihood Estimation for Model-based Reinforcement Learning in Discounted Linear MDPs", "track": "main", "status": "Reject", "tldr": "", "abstract": "We consider the infinite-horizon linear Markov Decision Processes (MDPs), where 
the transition probabilities of the dynamic model can be linearly parameterized with the help of a predefined low-dimensional feature mapping. While the existing regression-based approaches have been theoretically shown to achieve nearly-optimal regret, they are computationally rather inefficient due to the need for a large number of optimization runs in each time step, especially when the state and action spaces are large.\nTo address this issue, we propose to solve linear MDPs through the lens of Value-Biased Maximum Likelihood Estimation (VBMLE), which is a classic model-based exploration principle in the adaptive control literature for resolving the well-known closed-loop identification problem of Maximum Likelihood Estimation. We formally show that (i) VBMLE enjoys $\\widetilde{O}(d\\sqrt{T})$ regret, where $T$ is the time horizon and $d$ is the dimension of the model parameter, and (ii) VBMLE is computationally more efficient as it only requires solving one optimization problem in each time step. In our regret analysis, we offer a generic convergence result of MLE in linear MDPs through a novel supermartingale construct and uncover an interesting connection between linear MDPs and online learning, which could be of independent interest. Finally, the simulation results show that VBMLE significantly outperforms the benchmark method in terms of both empirical regret and computation time.", "keywords": "Reinforcement learning;model-based RL;regret analysis;linear MDPs", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/5c944c4277678c24783eb52fcb24426ed3a3196e.zip", "author": "Yu Heng Hung;Ping-Chun Hsieh;Akshay Mete;Panganamala Kumar", "authorids": "~Yu_Heng_Hung1;~Ping-Chun_Hsieh1;~Akshay_Mete1;~Panganamala_Kumar1", "gender": "M;M;M;M", "homepage": ";https://pinghsieh.github.io/;;https://cesg.tamu.edu/faculty/p-r-kumar/", "dblp": "276/1006.html;163/7352;228/0587;https://dblp.org/pers/k/Kumar:P=_R=.html", "google_scholar": "tiCRZiUAAAAJ;ix38JgoAAAAJ;evLF1akAAAAJ;qGUpTVwAAAAJ", "orcid": ";;;0000-0003-0389-5367", "linkedin": ";;;", "or_profile": "~Yu_Heng_Hung1;~Ping-Chun_Hsieh1;~Akshay_Mete1;~Panganamala_Kumar1", "aff": "National Yang-Ming Chiao Tung University;National Yang Ming Chiao Tung University;Texas A&M University - College Station;Texas A&M", "aff_domain": "nycu.edu.tw;nycu.edu.tw;tamu.edu;tamu.edu", "position": "PhD student;Associate Professor;PhD student;Full Professor", "bibtex": "@misc{\nhung2024valuebiased,\ntitle={Value-Biased Maximum Likelihood Estimation for Model-based Reinforcement Learning in Discounted Linear {MDP}s},\nauthor={Yu Heng Hung and Ping-Chun Hsieh and Akshay Mete and Panganamala Kumar},\nyear={2024},\nurl={https://openreview.net/forum?id=2h3m61LFWL}\n}", "github": "", "project": "", "reviewers": "p6f5;W2xc;WqoR;Jxj8", "site": "https://openreview.net/forum?id=2h3m61LFWL", "pdf_size": 408848, "rating": "3;3;5;6", "confidence": "4;5;4;3", "soundness": "3;3;3;3", "contribution": "2;3;2;3", "presentation": "1;3;3;3", "wc_summary": "63;72;47;69", "wc_strengths": "37;33;49;57", "wc_weaknesses": "441;481;340;172", "wc_questions": "60;3;53;179", "wc_review": "601;589;489;477", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "2005;1538;1470;1146", "reply_reviewers": "0;0;0;0", "reply_authors": "4;3;3;2", "rating_avg": [ 4.25, 1.299038105676658 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.5, 0.8660254037844386 ], "wc_summary_avg": [ 62.75, 
9.65336728815391 ], "wc_strengths_avg": [ 44.0, 9.539392014169456 ], "wc_weaknesses_avg": [ 358.5, 119.30737613408485 ], "wc_questions_avg": [ 73.75, 64.61955973232872 ], "wc_review_avg": [ 539.0, 56.32051136131489 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 1539.75, 306.74286870276217 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 3.0, 0.7071067811865476 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.816496580927726, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:lK9xfbtOcZUJ:scholar.google.com/&scioq=Value-Biased+Maximum+Likelihood+Estimation+for+Model-based+Reinforcement+Learning+in+Discounted+Linear+MDPs&hl=en&as_sdt=0,5", "gs_version_total": 3, "aff_unique_index": "0;1;2;2", "aff_unique_norm": "National Yang-Ming Chiao Tung University;National Yang Ming Chiao Tung University;Texas A&M University", "aff_unique_dep": ";;", "aff_unique_url": "https://www.nycu.edu.tw;https://www.nycu.edu.tw;https://www.tamu.edu", "aff_unique_abbr": "NYCU;NYCU;TAMU", "aff_campus_unique_index": "0;0;1", "aff_campus_unique": "Taiwan;College Station;", "aff_country_unique_index": "0;0;1;1", "aff_country_unique": "China;United States" }, { "id": "2iFBWoR7NH", "title": "Knowledge Manipulation in Language Models (Part B)", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Language models can store vast amounts of factual knowledge, but their ability to use this knowledge for logical reasoning remains questionable.\nThis paper explores a language model's ability to manipulate its stored knowledge during inference. We focus on four manipulation types: *retrieval* (e.g., \"What is person A's attribute X\"), *classification* (e.g., \"Is A's attribute X even or odd?\"), *comparison* (e.g., \"Is A greater than B in attribute X?\") and *inverse search* (e.g., \"Which person's attribute X equals T?\")\n\nWe observe that pre-trained language models like GPT2/3/4 excel in knowledge retrieval but struggle with simple classification or comparison tasks unless Chain of Thoughts (CoTs) are employed during both training and inference. They also perform poorly in inverse knowledge search, irrespective of the prompts. 
Our primary contribution is a synthetic dataset for a *controlled experiment* that confirms these inherent weaknesses: a language model cannot *efficiently* manipulate knowledge from pre-training data, even when such knowledge is perfectly stored and fully extractable in the models, and despite adequate instruct fine-tuning.", "keywords": "Interpretability;Transformers;Language Models;Linear Probing;Inner Working;Factual Knowledge", "primary_area": "visualization or interpretation of learned representations", "supplementary_material": "/attachment/9d7b6b037dba4956e53527b7c687c8574ee1164d.zip", "author": "Zeyuan Allen-Zhu;Yuanzhi Li", "authorids": "~Zeyuan_Allen-Zhu1;~Yuanzhi_Li1", "gender": ";M", "homepage": ";", "dblp": ";73/3628", "google_scholar": ";", "orcid": ";", "linkedin": ";", "or_profile": "~Zeyuan_Allen-Zhu1;~Yuanzhi_Li1", "aff": ";Carnegie Mellon University", "aff_domain": ";andrew.cmu.edu", "position": ";Assistant Professor", "bibtex": "@misc{\nallen-zhu2024knowledge,\ntitle={Knowledge Manipulation in Language Models (Part B)},\nauthor={Zeyuan Allen-Zhu and Yuanzhi Li},\nyear={2024},\nurl={https://openreview.net/forum?id=2iFBWoR7NH}\n}", "github": "", "project": "", "reviewers": "kTy8;otDf;BNdJ", "site": "https://openreview.net/forum?id=2iFBWoR7NH", "pdf_size": 696437, "rating": "3;6;8", "confidence": "5;4;4", "soundness": "1;3;4", "contribution": "1;3;3", "presentation": "3;3;4", "wc_summary": "76;123;122", "wc_strengths": "37;94;101", "wc_weaknesses": "132;166;43", "wc_questions": "103;77;1", "wc_review": "348;460;267", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 5.666666666666667, 2.0548046676563256 ], "confidence_avg": [ 4.333333333333333, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 1.247219128924647 ], "contribution_avg": [ 2.3333333333333335, 0.9428090415820634 ], "presentation_avg": [ 3.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 107.0, 21.924111536540465 ], "wc_strengths_avg": [ 77.33333333333333, 28.662790435607548 ], "wc_weaknesses_avg": [ 113.66666666666667, 51.86092513208336 ], "wc_questions_avg": [ 60.333333333333336, 43.27688631231329 ], "wc_review_avg": [ 358.3333333333333, 79.12999150483687 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 3, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.9176629354822472, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:4PC5CJdToYwJ:scholar.google.com/&scioq=Knowledge+Manipulation+in+Language+Models+(Part+B)&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0", "aff_unique_norm": "Carnegie Mellon University", "aff_unique_dep": "", "aff_unique_url": "https://www.cmu.edu", "aff_unique_abbr": "CMU", "aff_country_unique_index": "0", "aff_country_unique": "United States" }, { "title": "BroGNet: Momentum-Conserving Graph Neural Stochastic Differential Equation for Learning Brownian Dynamics", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19540", "id": "2iGiSHmeAN", "author_site": "Suresh Suresh, Jayadeva Jayadeva, Sayan Ranu, N. M. Anoop Krishnan", "tldr": "", "abstract": "Neural networks (NNs) that exploit strong inductive biases based on physical laws and symmetries have shown remarkable success in learning the dynamics of physical systems directly from their trajectory. 
However, these works focus only on the systems that follow deterministic dynamics, such as Newtonian or Hamiltonian. Here, we propose a framework, namely Brownian graph neural networks (BroGNet), combining stochastic differential equations (SDEs) and GNNs to learn Brownian dynamics directly from the trajectory. We modify the architecture of BroGNet to enforce linear momentum conservation of the system, which, in turn, provides superior performance on learning dynamics as revealed empirically. We demonstrate this approach on several systems, namely, linear spring, linear spring with binary particle types, and non-linear spring systems, all following Brownian dynamics at finite temperatures. We show that BroGNet significantly outperforms proposed baselines across all the benchmarked Brownian systems. In addition, we demonstrate zero-shot generalizability of BroGNet to simulate unseen system sizes that are two orders of magnitude larger and to different temperatures than those used during training. Finally, we show that BroGNet conserves the momentum of the system resulting in superior performance and data efficiency. Altogether, our study contributes to advancing the understanding of the intricate dynamics of Brownian motion and demonstrates the effectiveness of graph neural networks in modeling such complex systems.", "keywords": "Brownian dynamics;stochastic differential equation;graph neural network;scientific machine learning", "primary_area": "applications to physical sciences (physics, chemistry, biology, etc.)", "supplementary_material": "/attachment/3c5a269cc97726c258f8c59f70a719d96f7f1327.pdf", "author": "Suresh Bishnoi;Jayadeva Jayadeva;Sayan Ranu;N M Anoop Krishnan", "authorids": "~Suresh_Bishnoi1;~Jayadeva_Jayadeva1;~Sayan_Ranu2;~N_M_Anoop_Krishnan1", "gender": "M;M;M;M", "homepage": "https://web.iitd.ac.in/~srz208500/;;https://www.cse.iitd.ac.in/~sayan/index.html;", "dblp": "329/6194;58/4288;38/768;", "google_scholar": "Wy6q2QwAAAAJ;;K4w5qYUAAAAJ;https://scholar.google.co.in/citations?user=fGnjHcEAAAAJ", "orcid": ";;0000-0003-4147-9372;0000-0003-1500-4947", "linkedin": "sureshb1999/;;;", "or_profile": "~Suresh_Bishnoi1;~Jayadeva_Jayadeva1;~Sayan_Ranu2;~N_M_Anoop_Krishnan1", "aff": "Indian Institute of Technology Delhi;Indian Institute of Technology Delhi;Indian Institute of Technology Delhi;Indian Institute of Technology Delhi", "aff_domain": "iitd.ac.in;iitd.ac.in;iitd.ac.in;iitd.ac.in", "position": "PhD student;Full Professor;Associate Professor;Associate Professor", "bibtex": "@inproceedings{\nbishnoi2024brognet,\ntitle={Bro{GN}et: Momentum-Conserving Graph Neural Stochastic Differential Equation for Learning Brownian Dynamics},\nauthor={Suresh Bishnoi and Jayadeva Jayadeva and Sayan Ranu and N M Anoop Krishnan},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=2iGiSHmeAN}\n}", "github": "", "project": "", "reviewers": "Va4f;VaBU;KKvb;cdjq", "pdf_size": 1982791, "rating": "6;6;6;8", "confidence": "3;4;4;4", "soundness": "3;3;3;4", "contribution": "3;3;3;3", "presentation": "3;3;3;3", "wc_summary": "296;62;78;87", "wc_strengths": "12;51;19;213", "wc_weaknesses": "2;191;242;171", "wc_questions": "37;70;3;91", "wc_review": "347;374;342;562", "wc_reply_reviewers": "22;40;24;213", "wc_reply_authors": "938;737;1484;959", "reply_reviewers": "1;1;1;1", "reply_authors": "4;2;4;3", "rating_avg": [ 6.5, 0.8660254037844386 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 3.25, 
0.4330127018922193 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 130.75, 95.82634032456838 ], "wc_strengths_avg": [ 73.75, 81.72935519138763 ], "wc_weaknesses_avg": [ 151.5, 90.11242977525353 ], "wc_questions_avg": [ 50.25, 33.38693606786942 ], "wc_review_avg": [ 406.25, 90.74242392618791 ], "wc_reply_reviewers_avg": [ 74.75, 80.12295239193324 ], "wc_reply_authors_avg": [ 1029.5, 276.3462502007219 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 3.25, 0.82915619758885 ], "replies_avg": [ 24, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.3333333333333333, "gs_citation": 4, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10400832838272360997&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 2, "openreview": "https://openreview.net/forum?id=2iGiSHmeAN", "pdf": "https://openreview.net/pdf?id=2iGiSHmeAN", "email": "iitd.ac.in;iitd.ac.in;iitd.ac.in;iitd.ac.in", "author_num": 4, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "Indian Institute of Technology Delhi", "aff_unique_dep": "", "aff_unique_url": "https://www.iitd.ac.in", "aff_unique_abbr": "IIT Delhi", "aff_campus_unique_index": "0;0;0;0", "aff_campus_unique": "Delhi", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "India" }, { "title": "Deep SE(3)-Equivariant Geometric Reasoning for Precise Placement Tasks", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19539", "id": "2inBuwTyL2", "author_site": "Ben Eisner, Yi Yang, Todor Davchev, Mel Vecerik, Jonathan Scholz, David Held", "tldr": "", "abstract": "Many robot manipulation tasks can be framed as geometric reasoning tasks, where an agent must be able to precisely manipulate an object into a position that satisfies the task from a set of initial conditions. Often, task success is defined based on the relationship between two objects - for instance, hanging a mug on a rack. In such cases, the solution should be equivariant to the initial position of the objects as well as the agent, and invariant to the pose of the camera. This poses a challenge for learning systems which attempt to solve this task by learning directly from high-dimensional demonstrations: the agent must learn to be both equivariant as well as precise, which can be challenging without any inductive biases about the problem. In this work, we propose a method for precise relative pose prediction which is provably SE(3)-equivariant, can be learned from only a few demonstrations, and can generalize across variations in a class of objects. We accomplish this by factoring the problem into learning an SE(3) invariant task-specific representation of the scene and then interpreting this representation with novel geometric reasoning layers which are provably SE(3) equivariant. We demonstrate that our method can yield substantially more precise placement predictions in simulated placement tasks than previous methods trained with the same amount of data, and can accurately represent relative placement relationships data collected from real-world demonstrations. 
Supplementary information and videos can be found at https://sites.google.com/view/reldist-iclr-2023.", "keywords": "Learning from Demonstration;Manipulation;3D Learning;SE(3) Equivariance", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Ben Eisner;Yi Yang;Todor Davchev;Mel Vecerik;Jonathan Scholz;David Held", "authorids": "~Ben_Eisner1;~Yi_Yang10;~Todor_Davchev1;~Mel_Vecerik1;~Jonathan_Scholz2;~David_Held1", "gender": "M;M;;;M;M", "homepage": ";https://yangyi02.github.io/;https://tdavchev.github.io/;https://sites.google.com/corp/view/2020-s3k/home;https://sites.google.com/site/jonathanscholz/;http://davheld.github.io/", "dblp": ";33/4854-7;241/7187;;;22/11147", "google_scholar": "RWe-v0UAAAAJ;-BO7TXUAAAAJ;h_q7XhoAAAAJ;;bwORIKIAAAAJ;0QtU-NsAAAAJ", "orcid": ";;0000-0002-0584-5163;;;", "linkedin": ";;;;jonathan-scholz-689aa34/;", "or_profile": "~Ben_Eisner1;~Yi_Yang10;~Todor_Davchev1;~Mel_Vecerik1;~Jonathan_Scholz2;~David_Held1", "aff": "Carnegie Mellon University;Google DeepMind;Google DeepMind;Google DeepMind;Google DeepMind;Carnegie Mellon University", "aff_domain": "cmu.edu;deepmind.com;deepmind.com;deepmind.com;deepmind.com;cmu.edu", "position": "PhD student;Researcher;Researcher;Researcher;Researcher;Associate Professor", "bibtex": "@inproceedings{\neisner2024deep,\ntitle={Deep {SE}(3)-Equivariant Geometric Reasoning for Precise Placement Tasks},\nauthor={Ben Eisner and Yi Yang and Todor Davchev and Mel Vecerik and Jonathan Scholz and David Held},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=2inBuwTyL2}\n}", "github": "", "project": "", "reviewers": "Te9m;5kHb;5GvH", "pdf_size": 2076030, "rating": "6;6;6", "confidence": "4;4;3", "soundness": "2;2;3", "contribution": "2;2;3", "presentation": "3;2;3", "wc_summary": "129;50;65", "wc_strengths": "62;45;94", "wc_weaknesses": "102;98;165", "wc_questions": "117;11;56", "wc_review": "410;204;380", "wc_reply_reviewers": "66;147;0", "wc_reply_authors": "987;1125;886", "reply_reviewers": "2;2;0", "reply_authors": "3;3;3", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 81.33333333333333, 34.25719713513579 ], "wc_strengths_avg": [ 67.0, 20.314198646923455 ], "wc_weaknesses_avg": [ 121.66666666666667, 30.684777260973487 ], "wc_questions_avg": [ 61.333333333333336, 43.43833432452134 ], "wc_review_avg": [ 331.3333333333333, 90.86742479507653 ], "wc_reply_reviewers_avg": [ 71.0, 60.11655346075655 ], "wc_reply_authors_avg": [ 999.3333333333334, 97.96030942285871 ], "reply_reviewers_avg": [ 1.3333333333333333, 0.9428090415820634 ], "reply_authors_avg": [ 3.0, 0.0 ], "replies_avg": [ 21, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 14, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12691674680712641233&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=2inBuwTyL2", "pdf": "https://openreview.net/pdf?id=2inBuwTyL2", "email": "cmu.edu;deepmind.com;deepmind.com;deepmind.com;deepmind.com;cmu.edu", "author_num": 6, "aff_unique_index": "0;1;1;1;1;0", "aff_unique_norm": "Carnegie Mellon University;Google", "aff_unique_dep": ";Google 
DeepMind", "aff_unique_url": "https://www.cmu.edu;https://deepmind.com", "aff_unique_abbr": "CMU;DeepMind", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;1;1;1;0", "aff_country_unique": "United States;United Kingdom" }, { "id": "2int61IpaP", "title": "FutureDD: Planning in POMDP with Encoded Future Dynamics", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Partially observable Markov decision process (POMDP) is a powerful framework for modeling decision-making problems where agents do not have full access to environment states. In the realm of offline reinforcement learning (RL), agents need to extract policies on previously recorded decision-making datasets without directly interacting with environments. Due to the inherent partial observability of environments and the limited availability of offline data, agents must possess the capability to extract valuable insights from limited data, which can serve as crucial prior information for making informed decisions. Recent works have shown that deep generative models, particularly diffusion models, exhibit impressive performance in offline RL. However, most of these approaches mainly focus on fully observed environments while neglecting POMDPs, and heavily rely on history information for decision-making, disregarding the valuable prior information about the future that can be extracted from offline data. Having recognized this gap, we propose a novel framework $\\textit{FutureDD}$ to extract future prior. $\\textit{FutureDD}$ leverages an auxiliary prior model encoding future sub-trajectories to a latent variable, which serves as a compensation for directly modeling observations with a diffusion model. This enables $\\textit{FutureDD}$ to extract richer prior information from limited offline data for agents to predict potential future dynamics. 
The experimental results on a set of tasks demonstrate that in the context of POMDPs, $\\textit{FutureDD}$ provides a simple yet effective approach for agents to learn behaviours yielding higher returns.", "keywords": "Offline Reinforcement Learning;Partially Observable Markov Decision Process;Sequential Decision Making;Diffusion Models", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/52486c4a6445a8da7138ea1c0e021bee721cb3c7.zip", "author": "Yao Tang;Zhihui Xie;Tong Yu;Bokai Hu;Shuai Li", "authorids": "~Yao_Tang2;~Zhihui_Xie2;~Tong_Yu3;~Bokai_Hu2;~Shuai_Li3", "gender": "F;M;;M;F", "homepage": "https://yaotang23.github.io/;https://fffffarmer.github.io/;https://www.linkedin.com/in/tong-yu-42790744;;http://shuaili8.github.io", "dblp": ";31/3570-2;32/1593-1;;57/2281-10", "google_scholar": ";Jml8NvkAAAAJ;https://scholar.google.com/citations?hl=en;;https://scholar.google.com.hk/citations?user=kMZgQxcAAAAJ", "orcid": ";;0000-0002-5991-2050;;", "linkedin": ";;tong-yu-42790744;\u535a\u51ef-\u80e1-a26279292;", "or_profile": "~Yao_Tang2;~Zhihui_Xie2;~Tong_Yu3;~Bokai_Hu2;~Shuai_Li3", "aff": "Shanghai Jiaotong University;Shanghai Jiaotong University;Adobe Research;University of California, San Diego;John Hopcroft Center, Shanghai Jiao Tong University", "aff_domain": "cs.sjtu.edu.cn;sjtu.edu.cn;adobe.com;ucsd.edu;sjtu.edu.cn", "position": "Undergrad student;MS student;Senior Research Scientist;MS student;Assistant Professor", "bibtex": "@misc{\ntang2024futuredd,\ntitle={Future{DD}: Planning in {POMDP} with Encoded Future Dynamics},\nauthor={Yao Tang and Zhihui Xie and Tong Yu and Bokai Hu and Shuai Li},\nyear={2024},\nurl={https://openreview.net/forum?id=2int61IpaP}\n}", "github": "", "project": "", "reviewers": "e8st;BsjN;bCks;sLyp", "site": "https://openreview.net/forum?id=2int61IpaP", "pdf_size": 341452, "rating": "3;3;5;5", "confidence": "2;5;4;4", "soundness": "2;3;3;3", "contribution": "1;2;2;2", "presentation": "1;2;3;2", "wc_summary": "63;91;54;242", "wc_strengths": "17;45;28;25", "wc_weaknesses": "199;107;292;285", "wc_questions": "76;28;29;152", "wc_review": "355;271;403;704", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 3.75, 1.0897247358851685 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 2.0, 0.7071067811865476 ], "wc_summary_avg": [ 112.5, 76.00164471904539 ], "wc_strengths_avg": [ 28.75, 10.207227831296802 ], "wc_weaknesses_avg": [ 220.75, 75.19433156827714 ], "wc_questions_avg": [ 71.25, 50.49443038593464 ], "wc_review_avg": [ 433.25, 163.30091089764318 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.22941573387056177, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:1EXxHaTR3wMJ:scholar.google.com/&scioq=FutureDD:+Planning+in+POMDP+with+Encoded+Future+Dynamics&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;1;2;0", "aff_unique_norm": "Shanghai Jiao Tong University;Adobe;University of California, San Diego", "aff_unique_dep": ";Adobe Research;", "aff_unique_url": "https://www.sjtu.edu.cn;https://research.adobe.com;https://www.ucsd.edu", "aff_unique_abbr": "SJTU;Adobe;UCSD", "aff_campus_unique_index": "1;2", "aff_campus_unique": ";San 
Diego;Shanghai", "aff_country_unique_index": "0;0;1;1;0", "aff_country_unique": "China;United States" }, { "id": "2kvDzdC5rh", "title": "IntentGPT: Few-Shot Intent Discovery with Large Language Models", "track": "main", "status": "Reject", "tldr": "", "abstract": "In today's digitally driven world, dialogue systems play a pivotal role in enhancing user interactions, from customer service to virtual assistants. In these dialogues, it is important to identify user's goals automatically to resolve their needs promptly. This has necessitated the integration of models that perform Intent Detection. However, users' intents are diverse and dynamic, making it challenging to maintain a fixed set of predefined intents. As a result, a more practical approach is to develop a model capable of identifying new intents as they emerge. We address the challenge of Intent Discovery, an area that has drawn significant attention in recent research efforts. Existing methods need to train on a substantial amount of data for correctly identifying new intents, demanding significant human effort. To overcome this, we introduce IntentGPT, a novel method that efficiently prompts Large Language Models (LLMs) such as GPT-4 to effectively discover new intents with minimal labeled data. IntentGPT comprises an In-Context Prompt Generator, which generates informative prompts for In-Context Learning, an Intent Predictor for classifying and discovering user intents behind utterances, and a Semantic Few-Shot Sampler which leverages embedding similarities for selecting the closest examples from the labeled data. Our experiments show that IntentGPT outperforms previous methods that require extensive domain-specific data and fine-tuning, in popular benchmarks, including CLINC and BANKING.", "keywords": "intent discovery;intent detection;intent classification;open-set classification;in-contex learning;few-shot learning;large language models", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/4f79883c32a5f4b99a6256bbaa731c4512af88a0.zip", "author": "Juan A. Rodriguez;Nicholas Botzer;David Vazquez;Christopher Pal;Marco Pedersoli;Issam H. 
Laradji", "authorids": "~Juan_A._Rodriguez1;~Nicholas_Botzer1;~David_Vazquez1;~Christopher_Pal1;~Marco_Pedersoli1;~Issam_H._Laradji1", "gender": "M;M;;M;M;M", "homepage": ";http://www.david-vazquez.com;https://scholar.google.ca/citations?user=1ScWJOoAAAAJ&hl=en&oi=ao;http://profs.etsmtl.ca/mpedersoli/;https://issamlaradji.github.io/;https://github.com/joanrod/ocr-vqgan", "dblp": ";94/8653;45/1217;81/4503;142/0043;276/6112", "google_scholar": "5rS0yCoAAAAJ;1jHvtfsAAAAJ;https://scholar.google.ca/citations?user=1ScWJOoAAAAJ;aVfyPAoAAAAJ;https://scholar.google.ca/citations?user=8vRS7F0AAAAJ;https://scholar.google.es/citations?user=0selhb4AAAAJ", "orcid": ";0000-0002-2845-8158;;;;", "linkedin": ";https://www.linkedin.com/company/david-vazquez/;;;issam-laradji-67ba1a99/;", "or_profile": "~Nicholas_Botzer1;~David_Vazquez1;~Christopher_Pal1;~Marco_Pedersoli1;~Issam_H._Laradji1;~Juan_Rodriguez2", "aff": "University of Notre Dame;ServiceNow research;Polytechnique Montreal;\u00c9cole de technologie sup\u00e9rieure, Universit\u00e9 du Qu\u00e9bec;ServiceNow;\u00c9cole de technologie sup\u00e9rieure, Universit\u00e9 du Qu\u00e9bec", "aff_domain": "nd.edu;servicenow.com;polymtl.ca;etsmtl.ca;servicenow.com;etsmtl.ca", "position": "PhD student;Researcher;Full Professor;Associate Professor;Researcher;PhD student", "bibtex": "@misc{\nrodriguez2024intentgpt,\ntitle={Intent{GPT}: Few-Shot Intent Discovery with Large Language Models},\nauthor={Juan A. Rodriguez and Nicholas Botzer and David Vazquez and Christopher Pal and Marco Pedersoli and Issam H. Laradji},\nyear={2024},\nurl={https://openreview.net/forum?id=2kvDzdC5rh}\n}", "github": "", "project": "", "reviewers": "kRkh;NWU5;vjHF;GqJc;G7hj", "site": "https://openreview.net/forum?id=2kvDzdC5rh", "pdf_size": 580546, "rating": "3;3;5;5;6", "confidence": "4;4;5;4;3", "soundness": "2;2;2;4;3", "contribution": "2;1;2;2;3", "presentation": "3;4;2;3;2", "wc_summary": "20;51;42;64;126", "wc_strengths": "98;117;22;39;128", "wc_weaknesses": "111;776;43;309;226", "wc_questions": "2;29;17;57;77", "wc_review": "231;973;124;469;557", "wc_reply_reviewers": "0;0;0;0;0", "wc_reply_authors": "1431;465;791;1330;667", "reply_reviewers": "0;0;0;0;0", "reply_authors": "3;1;2;2;1", "rating_avg": [ 4.4, 1.2 ], "confidence_avg": [ 4.0, 0.6324555320336759 ], "soundness_avg": [ 2.6, 0.8 ], "contribution_avg": [ 2.0, 0.6324555320336759 ], "presentation_avg": [ 2.8, 0.7483314773547882 ], "wc_summary_avg": [ 60.6, 35.7077022503549 ], "wc_strengths_avg": [ 80.8, 42.51776099467139 ], "wc_weaknesses_avg": [ 293.0, 258.32460200298385 ], "wc_questions_avg": [ 36.4, 27.155846515989886 ], "wc_review_avg": [ 470.8, 295.774508705534 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 936.8, 378.28158823818006 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.8, 0.7483314773547883 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.2635231383473649, "gs_citation": 6, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12943960937829617865&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "aff_unique_index": "0;1;2;3;1;3", "aff_unique_norm": "University of Notre Dame;ServiceNow;Polytechnique Montreal;Universit\u00e9 du Qu\u00e9bec", "aff_unique_dep": ";research;;", "aff_unique_url": "https://www.nd.edu;https://www.servicenow.com;https://www.polymtl.ca;https://www.etsmtl.ca", "aff_unique_abbr": "Notre Dame;ServiceNow;PolyMTL;ETS", "aff_campus_unique_index": "1;2;2", "aff_campus_unique": ";Montreal;\u00c9cole de technologie 
sup\u00e9rieure", "aff_country_unique_index": "0;0;1;1;0;1", "aff_country_unique": "United States;Canada" }, { "id": "2l7g7zwC4z", "title": "Embedding File Structure for Tabular File Preparation", "track": "main", "status": "Reject", "tldr": "", "abstract": "We introduce the notion of file structure, the set of characters within a file's content that do not belong to data values.\nData preparation can be considered as a pipeline of heterogeneous steps with the common theme of wrangling the structure of a file to access its payload in a downstream task.\nWe claim that solving typical data preparation tasks benefits from an explicit representation of file structure.\nWe propose a novel approach for learning such a representation, which we call a structural embedding, using the raw file content as input.\nOur approach is based on a novel neural network architecture, composed of a transformer module and a convolutional module, trained in a self-supervised fashion on almost 1M public data files to learn structural embeddings.\nWe demonstrate the usefulness of structural embeddings in several steps of a data preparation pipeline: data loading, row classification, and column type annotation.\nFor these tasks, we show that our approach obtains performances comparable with state-of-the-art baselines on six real-world datasets, and, more importantly, we improve upon such baselines by combining them with the structural embeddings provided by our approach.", "keywords": "representation;tabular embedding;file structure;data preparation;table representation learning", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/4494d29648c5f2a4bcd456c387323fb43b49b440.zip", "author": "Gerardo Vitagliano;Mazhar Hameed;Alejandro Sierra M\u00fanera;Felix Naumann", "authorids": "~Gerardo_Vitagliano1;mazhar.hameed@hpi.de;~Alejandro_Sierra_M\u00fanera1;~Felix_Naumann1", "gender": "M;;;", "homepage": "https://vitaglianog.github.io/;;;", "dblp": "249/4023.html;;;n/FelixNaumann", "google_scholar": "zYBXv3sAAAAJ;;;", "orcid": "0000-0001-7782-2596;;;", "linkedin": "gerardo-vitagliano/;;;", "or_profile": "~Gerardo_Vitagliano1;mazhar.hameed@hpi.de;~Alejandro_Sierra_M\u00fanera1;~Felix_Naumann1", "aff": "Computer Science and Artificial Intelligence Laboratory, Electrical Engineering & Computer Science;;;Hasso Plattner Institute", "aff_domain": "csail.mit.edu;;;hpi.de", "position": "Postdoc;;;Full Professor", "bibtex": "@misc{\nvitagliano2024embedding,\ntitle={Embedding File Structure for Tabular File Preparation},\nauthor={Gerardo Vitagliano and Mazhar Hameed and Alejandro Sierra M{\\'u}nera and Felix Naumann},\nyear={2024},\nurl={https://openreview.net/forum?id=2l7g7zwC4z}\n}", "github": "", "project": "", "reviewers": "ffWZ;Wgj4;9VNy", "site": "https://openreview.net/forum?id=2l7g7zwC4z", "pdf_size": 2520129, "rating": "3;3;5", "confidence": "3;3;3", "soundness": "2;2;3", "contribution": "2;1;2", "presentation": "2;3;3", "wc_summary": "36;251;30", "wc_strengths": "35;52;29", "wc_weaknesses": "309;131;104", "wc_questions": "8;58;14", "wc_review": "388;492;177", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "476;645;278", "reply_reviewers": "0;0;0", "reply_authors": "1;1;1", "rating_avg": [ 3.6666666666666665, 0.9428090415820634 ], "confidence_avg": [ 3.0, 0.0 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 1.6666666666666667, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 
0.4714045207910317 ], "wc_summary_avg": [ 105.66666666666667, 102.7953738691041 ], "wc_strengths_avg": [ 38.666666666666664, 9.741092797468305 ], "wc_weaknesses_avg": [ 181.33333333333334, 90.94442747573316 ], "wc_questions_avg": [ 26.666666666666668, 22.29100466306732 ], "wc_review_avg": [ 352.3333333333333, 131.04791320564993 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 466.3333333333333, 149.98296199531762 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 8, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:mSuJ70-nehkJ:scholar.google.com/&scioq=Embedding+File+Structure+for+Tabular+File+Preparation&hl=en&as_sdt=0,23", "gs_version_total": 0, "aff_unique_index": "0;1", "aff_unique_norm": "Massachusetts Institute of Technology;Hasso Plattner Institute", "aff_unique_dep": "Computer Science and Artificial Intelligence Laboratory;", "aff_unique_url": "https://www.csail.mit.edu;https://www.hpi.de", "aff_unique_abbr": "CSAIL;HPI", "aff_campus_unique_index": "0", "aff_campus_unique": "Cambridge;", "aff_country_unique_index": "0;1", "aff_country_unique": "United States;Germany" }, { "title": "Instant3D: Fast Text-to-3D with Sparse-view Generation and Large Reconstruction Model", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19538", "id": "2lDQLiH1W4", "author_site": "Jiahao Li, Hao Tan, Kai Zhang, Zexiang Xu, Fujun Luan, Yinghao Xu, Yicong Hong, Kalyan Sunkavalli, Greg Shakhnarovich, Sai Bi", "tldr": "", "abstract": "Text-to-3D with diffusion models has achieved remarkable progress in recent years. However, existing methods either rely on score distillation-based optimization which suffer from slow inference, low diversity and Janus problems, or are feed-forward methods that generate low-quality results due to the scarcity of 3D training data. In this paper, we propose Instant3D, a novel method that generates high-quality and diverse 3D assets from text prompts in a feed-forward manner. We adopt a two-stage paradigm, which first generates a sparse set of four structured and consistent views from text in one shot with a fine-tuned 2D text-to-image diffusion model, and then directly regresses the NeRF from the generated images with a novel transformer-based sparse-view reconstructor. Through extensive experiments, we demonstrate that our method can generate diverse 3D assets of high visual quality within 20 seconds, which is two orders of magnitude faster than previous optimization-based methods that can take 1 to 10 hours. 
Our project webpage is: https://jiahao.ai/instant3d/.", "keywords": "text-to-3d;generative models;diffusion models;3D reconstruction;3D generation;sparse-view reconstruction", "primary_area": "generative models", "supplementary_material": "/attachment/d95b8bde0e07536f9902a6ca7875eea06e659153.zip", "author": "Jiahao Li;Hao Tan;Kai Zhang;Zexiang Xu;Fujun Luan;Yinghao Xu;Yicong Hong;Kalyan Sunkavalli;Greg Shakhnarovich;Sai Bi", "authorids": "~Jiahao_Li2;~Hao_Tan1;~Kai_Zhang7;~Zexiang_Xu1;~Fujun_Luan2;~Yinghao_Xu1;~Yicong_Hong1;~Kalyan_Sunkavalli1;~Greg_Shakhnarovich1;~Sai_Bi1", "gender": ";M;M;M;M;M;M;M;M;M", "homepage": "https://jiahao.ai;http://www.cs.unc.edu/~airsplay/;https://kai-46.github.io/website/;https://cseweb.ucsd.edu/~zex014/;https://luanfujun.com/;https://justimyhxu.github.io/;http://www.yiconghong.me/;http://www.kalyans.org/;https://sai-bi.github.io/;http://ttic.edu/gregory/", "dblp": ";94/877-2;55/957-45;154/0366;183/9337;232/2482;262/3437;42/5978;165/9898;17/1926.html", "google_scholar": "w9jtLkIAAAAJ;OV1Y3FUAAAAJ;6B7FPMoAAAAJ;_RRIYvEAAAAJ;NLxrmYQAAAAJ;https://scholar.google.com/citations?hl=en;AerHOzUAAAAJ;j7uL6VEAAAAJ;-q4nE1kAAAAJ;https://scholar.google.com.tw/citations?user=YLOz1kgAAAAJ", "orcid": ";;;;;;0000-0002-5068-1508;;;", "linkedin": "jiahaoli95;hao-tan-23677180/;;;luanfujun/;;yicong-hong;;;", "or_profile": "~Jiahao_Li2;~Hao_Tan1;~Kai_Zhang7;~Zexiang_Xu1;~Fujun_Luan2;~Yinghao_Xu1;~Yicong_Hong1;~Kalyan_Sunkavalli1;~Sai_Bi1;~Gregory_Shakhnarovich2", "aff": "Toyota Technological Institute at Chicago;Adobe Systems;Adobe Systems;Adobe Research;Adobe Systems;Stanford University;Adobe Systems;Adobe Research;Adobe Systems;University of Chicago", "aff_domain": "ttic.edu;adobe.com;adobe.com;adobe.com;adobe.com;stanford.edu;adobe.com;adobe.com;adobe.com;uchicago.edu", "position": "PhD student;Research Scientist;Researcher;Researcher;Researcher;Postdoc;Researcher;Principal Scientist;Researcher;Professor, part time", "bibtex": "@inproceedings{\nli2024instantd,\ntitle={Instant3D: Fast Text-to-3D with Sparse-view Generation and Large Reconstruction Model},\nauthor={Jiahao Li and Hao Tan and Kai Zhang and Zexiang Xu and Fujun Luan and Yinghao Xu and Yicong Hong and Kalyan Sunkavalli and Greg Shakhnarovich and Sai Bi},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=2lDQLiH1W4}\n}", "github": "", "project": "", "reviewers": "dCt6;wyA8;eZrX", "pdf_size": 44315184, "rating": "6;8;8", "confidence": "3;5;5", "soundness": "3;3;3", "contribution": "2;4;3", "presentation": "3;4;3", "wc_summary": "32;148;72", "wc_strengths": "25;150;235", "wc_weaknesses": "100;315;418", "wc_questions": "156;160;22", "wc_review": "313;773;747", "wc_reply_reviewers": "0;148;51", "wc_reply_authors": "737;907;1117", "reply_reviewers": "0;1;1", "reply_authors": "3;3;3", "rating_avg": [ 7.333333333333333, 0.9428090415820634 ], "confidence_avg": [ 4.333333333333333, 0.9428090415820634 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 3.0, 0.816496580927726 ], "presentation_avg": [ 3.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 84.0, 48.11098280711657 ], "wc_strengths_avg": [ 136.66666666666666, 86.24899355290407 ], "wc_weaknesses_avg": [ 277.6666666666667, 132.47976784735428 ], "wc_questions_avg": [ 112.66666666666667, 64.1318087136866 ], "wc_review_avg": [ 611.0, 210.98499156733084 ], "wc_reply_reviewers_avg": [ 66.33333333333333, 61.38584708401621 ], "wc_reply_authors_avg": [ 920.3333333333334, 
155.42057635833024 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 3.0, 0.0 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 10, 0 ], "corr_rating_confidence": 0.9999999999999998, "gs_citation": 250, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=8026239238112532104&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=2lDQLiH1W4", "pdf": "https://openreview.net/pdf?id=2lDQLiH1W4", "email": "ttic.edu;adobe.com;adobe.com;adobe.com;adobe.com;stanford.edu;adobe.com;adobe.com;adobe.com;uchicago.edu", "author_num": 10, "aff_unique_index": "0;1;1;1;1;2;1;1;1;3", "aff_unique_norm": "Toyota Technological Institute at Chicago;Adobe;Stanford University;University of Chicago", "aff_unique_dep": ";Adobe Systems Incorporated;;", "aff_unique_url": "https://www.tti-chicago.org;https://www.adobe.com;https://www.stanford.edu;https://www.uchicago.edu", "aff_unique_abbr": "TTI Chicago;Adobe;Stanford;UChicago", "aff_campus_unique_index": "0;2", "aff_campus_unique": "Chicago;;Stanford", "aff_country_unique_index": "0;0;0;0;0;0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "2mDzzLWRHr", "title": "Comfetch: Federated Learning of Large Networks on Constrained Clients via Sketching", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Federated learning (FL) is a popular paradigm for private and collaborative model training on the edge. In centralized FL, the parameters of a global architecture (such as a deep neural network) are maintained and distributed by a central server/controller to clients who transmit model updates (gradients) back to the server based on local optimization. While many efforts have focused on reducing the communication complexity of gradient transmission, the vast majority of compression-based algorithms assume that each participating client is able to download and train the current and full set of parameters, which may not be a practical assumption depending on the resource constraints of smaller clients such as mobile devices. In this work, we propose a simple yet effective novel algorithm Comfetch, which allows clients to train large networks using reduced representations of the global architecture via the count sketch, which reduces local computational and memory costs along with bi-directional communication complexity. We provide a nonconvex convergence guarantee and experimentally demonstrate that it is possible to learn large models, such as a deep convolutional network, through federated training on their sketched counterparts. 
The resulting global models exhibit competitive test accuracy over CIFAR10/100 classification when compared against un-compressed model training.", "keywords": "federated learning;compression;sketch", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/d2141f11f1f8ea4517950d066a9a07c786e6e54c.zip", "author": "Tahseen Rabbani;Brandon Yushan Feng;Marco Bornstein;Yifan Yang;Kyle Rui Sang;Arjun Rajkumar;Amitabh Varshney;Furong Huang", "authorids": "~Tahseen_Rabbani1;~Brandon_Yushan_Feng1;~Marco_Bornstein1;~Yifan_Yang5;~Kyle_Rui_Sang1;~Arjun_Rajkumar1;~Amitabh_Varshney1;~Furong_Huang1", "gender": "M;;M;M;M;M;M;F", "homepage": "https://www.cs.umd.edu/people/trabbani;https://brandonyfeng.github.io/;https://marcobornstein.github.io;https://yifanyang.dev/;;;http://www.cs.umd.edu/~varshney;https://furong-huang.com", "dblp": "280/2362;284/2193;332/0431;;;;;72/8513", "google_scholar": ";VCeYRsYAAAAJ;;Wn-GGXkAAAAJ;;qpMkWPEAAAAJ;b053OdAAAAAJ;13yyuCcAAAAJ", "orcid": ";0000-0001-7003-9128;;;;;0000-0002-9873-2212;", "linkedin": ";;;;kyle-sang/;arjun-rajkumar-1351a9145/;amitabh-varshney-4556961b/;", "or_profile": "~Tahseen_Rabbani1;~Brandon_Yushan_Feng1;~Marco_Bornstein1;~Yifan_Yang5;~Kyle_Rui_Sang1;~Arjun_Rajkumar1;~Amitabh_Varshney1;~Furong_Huang1", "aff": "University of Maryland, College Park;Massachusetts Institute of Technology;University of Maryland, College Park;University of Maryland, College Park;University of Maryland, College Park;Adobe Systems;University of Maryland, College Park;University of Maryland", "aff_domain": "umd.edu;mit.edu;umd.edu;umd.edu;umd.edu;adobe.com;umd.edu;cs.umd.edu", "position": "PhD student;Postdoc;PhD student;PhD student;MS student;Engineer;Full Professor;Assistant Professor", "bibtex": "@misc{\nrabbani2024comfetch,\ntitle={Comfetch: Federated Learning of Large Networks on Constrained Clients via Sketching},\nauthor={Tahseen Rabbani and Brandon Yushan Feng and Marco Bornstein and Yifan Yang and Kyle Rui Sang and Arjun Rajkumar and Amitabh Varshney and Furong Huang},\nyear={2024},\nurl={https://openreview.net/forum?id=2mDzzLWRHr}\n}", "github": "", "project": "", "reviewers": "qrJM;p5E1;W1rB;cTtw", "site": "https://openreview.net/forum?id=2mDzzLWRHr", "pdf_size": 770448, "rating": "3;3;5;6", "confidence": "4;3;4;4", "soundness": "2;2;2;4", "contribution": "2;2;2;3", "presentation": "3;3;3;4", "wc_summary": "92;66;65;68", "wc_strengths": "143;227;23;36", "wc_weaknesses": "557;2029;215;76", "wc_questions": "1;41;2;127", "wc_review": "793;2363;305;307", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.25, 1.299038105676658 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.8660254037844386 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 72.75, 11.166355717063647 ], "wc_strengths_avg": [ 107.25, 83.35578864122155 ], "wc_weaknesses_avg": [ 719.25, 776.1779354632545 ], "wc_questions_avg": [ 42.75, 51.24634133282102 ], "wc_review_avg": [ 942.0, 844.1617143652038 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": 0.5555555555555555, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12970504062840043210&as_sdt=5,47&sciodt=0,47&hl=en", 
"gs_version_total": 3, "aff_unique_index": "0;1;0;0;0;2;0;0", "aff_unique_norm": "University of Maryland;Massachusetts Institute of Technology;Adobe", "aff_unique_dep": ";;Adobe Systems Incorporated", "aff_unique_url": "https://www/umd.edu;https://web.mit.edu;https://www.adobe.com", "aff_unique_abbr": "UMD;MIT;Adobe", "aff_campus_unique_index": "0;0;0;0;0", "aff_campus_unique": "College Park;", "aff_country_unique_index": "0;0;0;0;0;0;0;0", "aff_country_unique": "United States" }, { "title": "Ferret: Refer and Ground Anything Anywhere at Any Granularity", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19537", "id": "2msbbX3ydD", "author_site": "Haoxuan You, Haotian Zhang, Zhe Gan, Xianzhi Du, Bowen Zhang, Zirui Wang, Liangliang Cao, Shih-Fu Chang, Yinfei Yang", "tldr": "", "abstract": "We introduce Ferret, a new Multimodal Large Language Model (MLLM) capable of understanding spatial referring of any shape or granularity within an image and accurately grounding open-vocabulary descriptions. To unify referring and grounding in the LLM paradigm, Ferret employs a novel and powerful hybrid region representation that integrates discrete coordinates and continuous features jointly to represent a region in the image. To extract the continuous features of versatile regions, we propose a spatial-aware visual sampler, adept at handling varying sparsity across different shapes. Consequently, Ferret can accept diverse region inputs, such as points, bounding boxes, and free-form shapes. To bolster the desired capability of Ferret, we curate GRIT, a comprehensive refer-and-ground instruction tuning dataset including 1.1M samples that contain rich hierarchical spatial knowledge, with an additional 130K hard negative data to promote model robustness. The resulting model not only achieves superior performance in classical referring and grounding tasks, but also greatly outperforms existing MLLMs in region-based and localization-demanded multimodal chatting. 
Our evaluations also reveal a significantly improved capability of describing image details and a remarkable alleviation in object hallucination.", "keywords": "Ferret;Multimodal Large Language Model;Referring;Grounding", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Haoxuan You;Haotian Zhang;Zhe Gan;Xianzhi Du;Bowen Zhang;Zirui Wang;Liangliang Cao;Shih-Fu Chang;Yinfei Yang", "authorids": "~Haoxuan_You1;~Haotian_Zhang3;~Zhe_Gan1;~Xianzhi_Du4;~Bowen_Zhang2;~Zirui_Wang1;~Liangliang_Cao1;~Shih-Fu_Chang3;~Yinfei_Yang1", "gender": "M;M;M;M;M;M;M;M;", "homepage": "https://hxyou.github.io/;https://haotian-zhang.github.io/;http://zhegan27.github.io/;;https://zbwglory.github.io;;http://llcao.net;http://www.ee.columbia.edu/~sfchang/;", "dblp": "210/2628;;41/7845;;85/7433-2;;95/6915;c/ShihFuChang;117/4082", "google_scholar": "BhysChMAAAAJ;1vz0kKUAAAAJ;E64XWyMAAAAJ;l1hP40AAAAAJ;nI3cKV8AAAAJ;GgD-B68AAAAJ;S-hBSfIAAAAJ;OMVTRscAAAAJ;kvDbu90AAAAJ", "orcid": ";0000-0001-6809-0426;;;;;;;", "linkedin": ";haotian-zhang-075508a6/;zhe-gan-a2229a78/;xianzhi-du-1b128934/;;;liangliangcao/;;", "or_profile": "~Haoxuan_You1;~Haotian_Zhang3;~Zhe_Gan1;~Xianzhi_Du4;~Bowen_Zhang2;~Zirui_Wang1;~Liangliang_Cao1;~Shih-Fu_Chang3;~Yinfei_Yang1", "aff": "Columbia University;Apple AI/ML;Apple;Apple;Apple;Apple AI/ML;Apple;Columbia University;Apple", "aff_domain": "columbia.edu;apple.com;apple.com;apple.com;apple.com;apple.com;apple.com;ee.columbia.edu;apple.com", "position": "PhD student;Researcher;Principal Researcher;Researcher;Research Scientist;Research Scientist;Principal Researcher;Full Professor;Researcher", "bibtex": "@inproceedings{\nyou2024ferret,\ntitle={Ferret: Refer and Ground Anything Anywhere at Any Granularity},\nauthor={Haoxuan You and Haotian Zhang and Zhe Gan and Xianzhi Du and Bowen Zhang and Zirui Wang and Liangliang Cao and Shih-Fu Chang and Yinfei Yang},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=2msbbX3ydD}\n}", "github": "", "project": "", "reviewers": "dfTo;6Qgf;7dkr", "pdf_size": 27418370, "rating": "6;6;8", "confidence": "4;4;4", "soundness": "3;2;3", "contribution": "3;3;3", "presentation": "3;3;3", "wc_summary": "67;109;178", "wc_strengths": "53;82;152", "wc_weaknesses": "46;62;141", "wc_questions": "11;145;96", "wc_review": "177;398;567", "wc_reply_reviewers": "0;0;171", "wc_reply_authors": "624;1622;1545", "reply_reviewers": "0;0;2", "reply_authors": "3;5;4", "rating_avg": [ 6.666666666666667, 0.9428090415820634 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 118.0, 45.760244754590204 ], "wc_strengths_avg": [ 95.66666666666667, 41.55585264302597 ], "wc_weaknesses_avg": [ 83.0, 41.52910625894406 ], "wc_questions_avg": [ 84.0, 55.35943159631127 ], "wc_review_avg": [ 380.6666666666667, 159.68789002996508 ], "wc_reply_reviewers_avg": [ 57.0, 80.61017305526642 ], "wc_reply_authors_avg": [ 1263.6666666666667, 453.4036710139088 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.9428090415820634 ], "reply_authors_avg": [ 4.0, 0.816496580927726 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 9, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 300, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=9686123011748005154&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, 
"openreview": "https://openreview.net/forum?id=2msbbX3ydD", "pdf": "https://openreview.net/pdf?id=2msbbX3ydD", "email": "columbia.edu;apple.com;apple.com;apple.com;apple.com;apple.com;apple.com;ee.columbia.edu;apple.com", "author_num": 9, "aff_unique_index": "0;1;1;1;1;1;1;0;1", "aff_unique_norm": "Columbia University;Apple", "aff_unique_dep": ";AI/ML", "aff_unique_url": "https://www.columbia.edu;https://www.apple.com", "aff_unique_abbr": "Columbia;Apple", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "2nD1SvxTZc", "title": "One-Versus-Others Attention: Scalable Multimodal Integration", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Multimodal learning models have become increasingly important as they surpass single-modality approaches on diverse tasks ranging from question-answering to autonomous driving. Despite the importance of multimodal learning, existing efforts focus on NLP applications, where the number of modalities is typically at most four (audio, video, text, images). However, data inputs in other domains, such as clinical medicine, may include X-rays, PET scans, MRIs, genetic screening, clinical notes, and more, creating a need for both efficient and accurate information fusion. Many state-of-the-art models rely on pairwise cross-attention or early fusion through self-attention, which do not scale well for applications with more than three modalities. The complexity per layer of computing attention in either paradigm is, at best, quadratic with the number of modalities, potentially requiring considerable computational resources. To address this, we propose a new domain-neutral attention mechanism, One-Versus-Others (OvO) attention, that scales linearly with the number of modalities, thus offering a significant reduction in computational complexity compared to existing multimodal attention methods. 
Using three diverse real-world datasets as well as an additional simulation experiment, we show that our method improves performance compared to popular fusion techniques while decreasing computation costs.", "keywords": "deep learning;multimodal learning;attention;clinical application", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/f30e7fce056b804efc434124d184a18ba9fa37c9.zip", "author": "Michal Golovanevsky;Eva Schiller;Akira A Nair;Ritambhara Singh;Carsten Eickhoff", "authorids": "~Michal_Golovanevsky1;~Eva_Schiller1;~Akira_A_Nair1;~Ritambhara_Singh1;~Carsten_Eickhoff1", "gender": "F;F;;F;M", "homepage": "https://michalg04.github.io/;;http://github.com/akira-nair;https://ritambharasingh.com/;https://health-nlp.org", "dblp": "322/7058;;;180/5813;42/8700", "google_scholar": ";;;V6lRMxoAAAAJ;QQi1_rAAAAAJ", "orcid": "0000-0002-2601-6604;;;0000-0002-7523-160X;0000-0001-9895-4061", "linkedin": ";eva-schiller-9614621b5/;akira-nair/;;", "or_profile": "~Michal_Golovanevsky1;~Eva_Schiller1;~Akira_A_Nair1;~Ritambhara_Singh1;~Carsten_Eickhoff1", "aff": "Brown University;Brown University;Brown University;Brown University;Eberhard-Karls-Universit\u00e4t T\u00fcbingen", "aff_domain": "brown.edu;brown.edu;brown.edu;brown.edu;uni-tuebingen.de", "position": "PhD student;Undergrad student;Undergrad student;Assistant Professor;Full Professor", "bibtex": "@misc{\ngolovanevsky2024oneversusothers,\ntitle={One-Versus-Others Attention: Scalable Multimodal Integration},\nauthor={Michal Golovanevsky and Eva Schiller and Akira A Nair and Ritambhara Singh and Carsten Eickhoff},\nyear={2024},\nurl={https://openreview.net/forum?id=2nD1SvxTZc}\n}", "github": "", "project": "", "reviewers": "YfMJ;UUiq;sMs5", "site": "https://openreview.net/forum?id=2nD1SvxTZc", "pdf_size": 2325215, "rating": "5;5;5", "confidence": "3;5;4", "soundness": "3;2;2", "contribution": "3;2;2", "presentation": "3;2;3", "wc_summary": "81;113;56", "wc_strengths": "50;73;46", "wc_weaknesses": "138;191;112", "wc_questions": "3;98;164", "wc_review": "272;475;378", "wc_reply_reviewers": "74;247;0", "wc_reply_authors": "302;738;721", "reply_reviewers": "1;1;0", "reply_authors": "1;1;1", "rating_avg": [ 5.0, 0.0 ], "confidence_avg": [ 4.0, 0.816496580927726 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 83.33333333333333, 23.32857094256359 ], "wc_strengths_avg": [ 56.333333333333336, 11.897712198383164 ], "wc_weaknesses_avg": [ 147.0, 32.873494895837695 ], "wc_questions_avg": [ 88.33333333333333, 66.08244009484585 ], "wc_review_avg": [ 375.0, 82.90154803540563 ], "wc_reply_reviewers_avg": [ 107.0, 103.50201286287464 ], "wc_reply_authors_avg": [ 587.0, 201.64490240684654 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 9, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10766012326229557819&as_sdt=20000005&sciodt=0,21&hl=en", "gs_version_total": 0, "aff_unique_index": "0;0;0;0;1", "aff_unique_norm": "Brown University;Eberhard Karls University of T\u00fcbingen", "aff_unique_dep": ";", "aff_unique_url": "https://www.brown.edu;https://www.uni-tuebingen.de/", "aff_unique_abbr": "Brown;Uni T\u00fcbingen", "aff_campus_unique_index": "1", "aff_campus_unique": 
";T\u00fcbingen", "aff_country_unique_index": "0;0;0;0;1", "aff_country_unique": "United States;Germany" }, { "id": "2nrn8LRpex", "title": "Z-score Normalized SAC Plus Behavioural Cloning for Offline Reinforcement Learning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Reinforcement learning (RL) defines the task that optimize a policy to maximize the cumulative reward function. Online learning collects data samples by interacting with the environment of task. Instead, Offline RL learns effective policies from a prior demonstrated dataset, which has the potential to transfer the successes between tasks. The main challenge encountered by offline RL is the inaccurate value estimates from out-of-distribution (OOD) actions, and applying vanilla off-policy algorithms to offline setting will cause severe overestimation bias for actions beyond the dataset distribution, because of the disability to correct value estimation errors via observations from the environment. To tackle this problem, the behavior regularization has been adopted in the literature to prevent the selected actions far away from the distribution of dataset so that the learned policy can be optimized within the support set of dataset. One simple method is combining RL with the behavioural cloning (BC) linearly.\nBy making a right balance of the relative weight between RL and BC, the pre-existing off-policy algorithms are able to work efficiently offline at the minimal cost of complexity. Overly large BC term will limit the agent\u2019s potential to explore better policy, and oversize RL term will cause more OOD actions, both of which are undesired.\nSimulated by TD3-BC, this paper aim to make a more efficient offline RL algorithm at the cost of minimal changes and light complexity. We find that the BC term can be added to the policy update of SAC algorithm to get extensively better performance with proper weight adjustment and normalization. 
The proposed SAC-BC algorithm is evaluated on the D4RL benchmark and proved to converge to much higher levels due to better exploration provided by tuned maximum entropy.", "keywords": "Reinforcement learning; offline; off-policy", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Huihui Zhang", "authorids": "~Huihui_Zhang1", "gender": "M", "homepage": "", "dblp": "https://dblp.uni-trier.de/pid/32/7555", "google_scholar": "", "orcid": "", "linkedin": "https://www.linkedin.com/feed/", "or_profile": "~Huihui_Zhang1", "aff": "", "aff_domain": "", "position": "", "bibtex": "@misc{\nzhang2024zscore,\ntitle={Z-score Normalized {SAC} Plus Behavioural Cloning for Offline Reinforcement Learning},\nauthor={Huihui Zhang},\nyear={2024},\nurl={https://openreview.net/forum?id=2nrn8LRpex}\n}", "github": "", "project": "", "reviewers": "jNsi;Q6ES;mezX;whc9", "site": "https://openreview.net/forum?id=2nrn8LRpex", "pdf_size": 2535726, "rating": "1;3;3;3", "confidence": "5;4;5;4", "soundness": "2;2;1;3", "contribution": "2;1;1;2", "presentation": "2;2;2;1", "wc_summary": "122;31;67;66", "wc_strengths": "41;22;33;34", "wc_weaknesses": "67;406;70;157", "wc_questions": "106;123;100;184", "wc_review": "336;582;270;441", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 2.5, 0.8660254037844386 ], "confidence_avg": [ 4.5, 0.5 ], "soundness_avg": [ 2.0, 0.7071067811865476 ], "contribution_avg": [ 1.5, 0.5 ], "presentation_avg": [ 1.75, 0.4330127018922193 ], "wc_summary_avg": [ 71.5, 32.56148031032987 ], "wc_strengths_avg": [ 32.5, 6.800735254367722 ], "wc_weaknesses_avg": [ 175.0, 138.17923143511834 ], "wc_questions_avg": [ 128.25, 33.27442711753277 ], "wc_review_avg": [ 407.25, 117.88845363308486 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 1, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:5-mUbTnQgyEJ:scholar.google.com/&scioq=Z-score+Normalized+SAC+Plus+Behavioural+Cloning+for+Offline+Reinforcement+Learning&hl=en&as_sdt=0,5", "gs_version_total": 0 }, { "title": "Light-MILPopt: Solving Large-scale Mixed Integer Linear Programs with Lightweight Optimizer and Small-scale Training Dataset", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19536", "id": "2oWRumm67L", "author_site": "Huigen Ye, Hua Xu, Hongyan Wang", "tldr": "", "abstract": "Machine Learning (ML)-based optimization approaches emerge as a promising technique for solving large-scale Mixed Integer Linear Programs (MILPs). However, existing ML-based frameworks suffer from high model computation complexity, weak problem reduction, and reliance on large-scale optimizers and large training datasets, resulting in performance bottlenecks for large-scale MILPs. This paper proposes Light-MILPopt, a lightweight large-scale optimization framework that only uses a lightweight optimizer and small training dataset to solve large-scale MILPs. 
Specifically, Light-MILPopt can be divided into four stages: Problem Formulation for problem division to reduce model computational costs, Model-based Initial Solution Prediction for predicting and constructing the initial solution using a small-scale training dataset, Problem Reduction for both variable and constraint reduction, and Data-driven Optimization for current solution improvement employing a lightweight optimizer. Experimental evaluations on four large-scale benchmark MILPs and a real-world case study demonstrate that Light-MILPopt, leveraging a lightweight optimizer and small training dataset, outperforms the state-of-the-art ML-based optimization framework and advanced large-scale solvers (e.g. Gurobi, SCIP). The results and further analyses substantiate the ML-based framework's feasibility and effectiveness in solving large-scale MILPs.", "keywords": "Large-scale MILP;Learning for Optimization;Lightweight Optimization Framework", "primary_area": "optimization", "supplementary_material": "", "author": "Huigen Ye;Hua Xu;Hongyan Wang", "authorids": "~Huigen_Ye1;~Hua_Xu1;~Hongyan_Wang1", "gender": ";M;F", "homepage": ";https://thu-xuhua.github.io/;https://www.researchgate.net/profile/Hongyan-Wang-25", "dblp": ";31/4114-3;", "google_scholar": ";;", "orcid": ";;", "linkedin": ";;", "or_profile": "~Huigen_Ye1;~Hua_Xu1;~Hongyan_Wang1", "aff": ";Tsinghua University;", "aff_domain": ";tsinghua.edu.cn;", "position": ";Associate Professor;", "bibtex": "@inproceedings{\nye2024lightmilpopt,\ntitle={Light-{MILP}opt: Solving Large-scale Mixed Integer Linear Programs with Lightweight Optimizer and Small-scale Training Dataset},\nauthor={Huigen Ye and Hua Xu and Hongyan Wang},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=2oWRumm67L}\n}", "github": "", "project": "", "reviewers": "RzQr;6e4z;LzLN;tDoY", "pdf_size": 579916, "rating": "3;5;6;6", "confidence": "4;4;3;4", "soundness": "2;3;3;3", "contribution": "2;2;3;3", "presentation": "2;1;4;3", "wc_summary": "214;55;41;121", "wc_strengths": "83;44;75;40", "wc_weaknesses": "118;46;187;7", "wc_questions": "527;322;3;90", "wc_review": "942;467;306;258", "wc_reply_reviewers": "372;243;30;0", "wc_reply_authors": "4458;3340;1787;1186", "reply_reviewers": "4;2;1;0", "reply_authors": "9;6;5;3", "rating_avg": [ 5.0, 1.224744871391589 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.5, 1.118033988749895 ], "wc_summary_avg": [ 107.75, 68.37899896898169 ], "wc_strengths_avg": [ 60.5, 18.76832437912346 ], "wc_weaknesses_avg": [ 89.5, 68.95106960736722 ], "wc_questions_avg": [ 235.5, 204.74435279147505 ], "wc_review_avg": [ 493.25, 270.4028245044789 ], "wc_reply_reviewers_avg": [ 161.25, 153.56330127996077 ], "wc_reply_authors_avg": [ 2692.75, 1287.0235769013714 ], "reply_reviewers_avg": [ 1.75, 1.479019945774904 ], "reply_authors_avg": [ 5.75, 2.165063509461097 ], "replies_avg": [ 37, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.4714045207910316, "gs_citation": 9, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=7354538115541094753&as_sdt=5,34&sciodt=0,34&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=2oWRumm67L", "pdf": "https://openreview.net/pdf?id=2oWRumm67L", "email": ";tsinghua.edu.cn;", "author_num": 3, "aff_unique_index": "0", "aff_unique_norm": "Tsinghua University", "aff_unique_dep": "", 
"aff_unique_url": "https://www.tsinghua.edu.cn", "aff_unique_abbr": "THU", "aff_country_unique_index": "0", "aff_country_unique": "China" }, { "id": "2ov9RiAkxE", "title": "Identifying and Mitigating Vulnerabilities in LLM-Integrated Applications", "track": "main", "status": "Reject", "tldr": "", "abstract": "Large language models (LLMs) are increasingly deployed as the service backend for LLM-integrated applications such as code completion and AI-powered search. Compared with the traditional usage of LLMs where users directly send queries to an LLM, LLM-integrated applications serve as middleware to refine users\u2019 queries with domain-specific knowledge to better inform LLMs and enhance the responses. Despite numerous opportunities and benefits, LLM-integrated applications also introduce new attack surfaces. Understanding, minimizing, and eliminating these emerging attack surfaces is a new area of research. In this work, we consider a setup where the user and LLM interact via an LLM-integrated application in the middle. We focus on the communication rounds that begin with user\u2019s queries and end with LLM-integrated application returning responses to the queries, powered by LLMs at the service backend. For this query-response protocol, we identify potential high-risk vulnerabilities that can originate from the malicious application developer or from an outsider threat initiator that is able to control the database access, manipulate and poison data that are high-risk for the user. Successful exploits of the identified vulnerabilities result in the users receiving responses tailored to the intent of a threat initiator (e.g., biased preferences for certain products). We assess such threats against LLM-integrated applications empowered by OpenAI GPT-3.5 and GPT-4. Our empirical results show that the threats can effectively bypass the restrictions and moderation policies of OpenAI, resulting in users receiving responses that contain bias, toxic content, privacy risk, and disinformation. To mitigate those threats, we identify and define four key properties, namely integrity, source identification, attack detectability, and utility preservation, that need to be satisfied by a safe LLM-integrated application. Based on these properties, we develop a lightweight, threat-agnostic defense that mitigates both insider and outsider threats. 
Our evaluations demonstrate the efficacy of our defense.", "keywords": "large language model;safety of LLM-integrated application;misuse mitigation;bias;privacy;toxicity;disinformation", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/b3d1abed570ec82c0180aefb79e01db1210250a2.pdf", "author": "Fengqing Jiang;Zhangchen Xu;Luyao Niu;Boxin Wang;Jinyuan Jia;Bo Li;Radha Poovendran", "authorids": "~Fengqing_Jiang1;~Zhangchen_Xu1;~Luyao_Niu1;~Boxin_Wang1;~Jinyuan_Jia2;~Bo_Li19;~Radha_Poovendran1", "gender": "M;M;M;;;F;Not Specified", "homepage": "https://fqjiang.work/;https://zhangchenxu.com;;https://wbx.life;https://jinyuan-jia.github.io/;http://boli.cs.illinois.edu/;https://people.ece.uw.edu/radha/index.html", "dblp": "294/4119;350/1187;181/8375;236/6319;24/5124-1.html;50/3402-26;29/5044", "google_scholar": "kTXY8P0AAAAJ;7KnVoNwAAAAJ;nSFafMoAAAAJ;YOf2ATIAAAAJ;iyg4ytkAAAAJ;K8vJkTcAAAAJ;EEoNZ7NbVzMC", "orcid": "0009-0002-9077-2399;0000-0002-6971-412X;0000-0001-8591-5522;;0000-0002-9785-7769;;", "linkedin": "fengqing-jiang-45b7311aa/;zhangchenxu/;;;;;", "or_profile": "~Fengqing_Jiang1;~Zhangchen_Xu1;~Luyao_Niu1;~Boxin_Wang1;~Jinyuan_Jia2;~Bo_Li19;~Radha_Poovendran1", "aff": "Amazon;University of Washington;University of Washington;NVIDIA;Pennsylvania State University;University of Illinois, Urbana Champaign;University of Washington, Seattle", "aff_domain": "amazon.com;uw.edu;uw.edu;nvidia.com;psu.edu;illinois.edu;uw.edu", "position": "Intern;PhD student;Postdoc;Senior Research Scientist;Assistant Professor;Assistant Professor;Full Professor", "bibtex": "@misc{\njiang2024identifying,\ntitle={Identifying and Mitigating Vulnerabilities in {LLM}-Integrated Applications},\nauthor={Fengqing Jiang and Zhangchen Xu and Luyao Niu and Boxin Wang and Jinyuan Jia and Bo Li and Radha Poovendran},\nyear={2024},\nurl={https://openreview.net/forum?id=2ov9RiAkxE}\n}", "github": "", "project": "", "reviewers": "uAhs;tqMB;o6oy;E69Y", "site": "https://openreview.net/forum?id=2ov9RiAkxE", "pdf_size": 763141, "rating": "3;3;6;6", "confidence": "3;5;3;3", "soundness": "2;2;3;3", "contribution": "2;1;3;3", "presentation": "2;1;3;3", "wc_summary": "42;37;98;71", "wc_strengths": "26;9;266;91", "wc_weaknesses": "285;130;127;71", "wc_questions": "34;5;72;65", "wc_review": "387;181;563;298", "wc_reply_reviewers": "0;78;0;0", "wc_reply_authors": "1503;1256;1245;1765", "reply_reviewers": "0;1;0;0", "reply_authors": "4;4;3;4", "rating_avg": [ 4.5, 1.5 ], "confidence_avg": [ 3.5, 0.8660254037844386 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.25, 0.82915619758885 ], "presentation_avg": [ 2.25, 0.82915619758885 ], "wc_summary_avg": [ 62.0, 24.50510150968569 ], "wc_strengths_avg": [ 98.0, 101.70791512955125 ], "wc_weaknesses_avg": [ 153.25, 79.61273453411835 ], "wc_questions_avg": [ 44.0, 26.67395733669828 ], "wc_review_avg": [ 357.25, 139.4567585310945 ], "wc_reply_reviewers_avg": [ 19.5, 33.77499074759311 ], "wc_reply_authors_avg": [ 1442.25, 212.98752897763757 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 3.75, 0.4330127018922193 ], "replies_avg": [ 23, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.5773502691896258, "gs_citation": 1867, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=3617304031662540087&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 8, "aff_unique_index": "0;1;1;2;3;4;1", "aff_unique_norm": "Amazon;University of Washington;NVIDIA;Pennsylvania State 
University;University of Illinois Urbana-Champaign", "aff_unique_dep": "Amazon.com, Inc.;;NVIDIA Corporation;;", "aff_unique_url": "https://www.amazon.com;https://www.washington.edu;https://www.nvidia.com;https://www.psu.edu;https://illinois.edu", "aff_unique_abbr": "Amazon;UW;NVIDIA;PSU;UIUC", "aff_campus_unique_index": "1;2", "aff_campus_unique": ";Urbana-Champaign;Seattle", "aff_country_unique_index": "0;0;0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "2pAdYVCbU9", "title": "Promoting Sparsity in Continuous-time Neural Networks to Learn Dependence Structures", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Continuous-time dynamics models, such as neural ordinary differential equations, enable accurate modeling of underlying dynamics in time-series data. However, the use of neural networks in parameterizing dynamics makes it challenging for humans to identify dependence structures, especially in the presence of delayed effects. In consequence, these models are not an attractive option when capturing dependence carries more importance than accurate predictions, e.g., tsunami forecasting. In this paper, we present a novel method for learning dependence structures in continuous-time dynamics models. Inspired by neural graphical modeling, we promote weight sparsity in the network's first layer during training. Once trained, we prune the sparse weights to identify dependence structures. In evaluation, we first test our method in scenarios where the exact dependence-structures of time-series are known. Our method captures the underlying dependence structure precisely even when there is a delayed effects. We further evaluate our method to a real-world tsunami forecasting, where the exact dependence structures are unknown. 
Even in this challenging case, our method effectively learns physically-consistent dependence structures with a high forecasting accuracy.", "keywords": "Neural graphical modeling;Neural delay differential equations;Tsunami forecasting;Structure discovery", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/e157c6277e80ead6fe3550c988d9c50e0daddd71.zip", "author": "Fan Wu;Woojin Cho;David Korotky;Sanghyun Hong;Donsub Rim;Noseong Park;Kookjin Lee", "authorids": "~Fan_Wu17;~Woojin_Cho1;korotkyd@oregonstate.edu;~Sanghyun_Hong1;~Donsub_Rim1;~Noseong_Park1;~Kookjin_Lee1", "gender": ";M;;M;M;;M", "homepage": ";https://woojin-cho.github.io/;;http://www.sanghyun-hong.com;https://dsrim.github.io;;https://scholar.google.com/citations?hl=en&user=KL89hVQAAAAJ&view_op=list_works", "dblp": ";;;135/8991;239/0132;;122/5103", "google_scholar": ";cqIj5tQAAAAJ;;https://scholar.google.com/citations?hl=en;;;https://scholar.google.com/citations?hl=en", "orcid": ";;;;0000-0002-6721-2070;;", "linkedin": "fanwu8/;woojin-cho-02b905264/;;;;;", "or_profile": "~Fan_Wu17;~Woojin_Cho1;korotkyd@oregonstate.edu;~Sanghyun_Hong1;~Donsub_Rim1;~Noseong_Park1;~Kookjin_Lee1", "aff": "Arizona State University;Yonsei University;;Oregon State University;Washington University, Saint Louis;;Arizona State University", "aff_domain": "asu.edu;yonsei.ac.kr;;oregonstate.edu;wustl.edu;;asu.edu", "position": "PhD student;MS student;;Assistant Professor;Assistant Professor;;Assistant Professor", "bibtex": "@misc{\nwu2024promoting,\ntitle={Promoting Sparsity in Continuous-time Neural Networks to Learn Dependence Structures},\nauthor={Fan Wu and Woojin Cho and David Korotky and Sanghyun Hong and Donsub Rim and Noseong Park and Kookjin Lee},\nyear={2024},\nurl={https://openreview.net/forum?id=2pAdYVCbU9}\n}", "github": "", "project": "", "reviewers": "EHcX;eu4v;3bqx;tEwg", "site": "https://openreview.net/forum?id=2pAdYVCbU9", "pdf_size": 1578700, "rating": "3;3;3;5", "confidence": "3;4;4;3", "soundness": "2;2;2;2", "contribution": "1;2;2;2", "presentation": "3;2;2;2", "wc_summary": "31;89;202;35", "wc_strengths": "39;44;52;43", "wc_weaknesses": "132;239;146;109", "wc_questions": "76;174;19;33", "wc_review": "278;546;419;220", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 3.5, 0.8660254037844386 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 89.25, 69.00860453595624 ], "wc_strengths_avg": [ 44.5, 4.716990566028302 ], "wc_weaknesses_avg": [ 156.5, 49.429242357131066 ], "wc_questions_avg": [ 75.5, 60.62384019509157 ], "wc_review_avg": [ 365.75, 126.75641009432225 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:nOSuYLPMKAkJ:scholar.google.com/&scioq=Promoting+Sparsity+in+Continuous-time+Neural+Networks+to+Learn+Dependence+Structures&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1;2;3;0", "aff_unique_norm": "Arizona State University;Yonsei University;Oregon State University;Washington University in St.
Louis", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.asu.edu;https://www.yonsei.ac.kr;https://oregonstate.edu;https://wustl.edu", "aff_unique_abbr": "ASU;Yonsei;OSU;WUSTL", "aff_campus_unique_index": "1", "aff_campus_unique": ";Saint Louis", "aff_country_unique_index": "0;1;0;0;0", "aff_country_unique": "United States;South Korea" }, { "id": "2psWOW7JKO", "title": "Learned Visual Features to Textual Explanations", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Interpreting the learned features of vision models has posed a longstanding challenge in the field of machine learning. To address this issue, we propose a novel method that leverages the capabilities of large language models (LLMs) to interpret the *learned features* of pre-trained image classifiers.\nOur method, called TExplain, tackles this task by training a neural network to establish a connection between the feature space of image classifiers and LLMs. Then, during inference, our approach generates a vast number of sentences to explain the features learned by the classifier for a given image. These sentences are then used to extract the most frequent words, providing a comprehensive understanding of the learned features and patterns within the classifier.\nOur method, for the first time, utilizes these frequent words corresponding to a visual representation to provide insights into the decision-making process of the independently trained classifier, enabling the detection of spurious correlations, biases, and a deeper comprehension of its behavior. To validate the effectiveness of our approach, we conduct experiments on diverse datasets, including ImageNet-9L and Waterbirds. The results demonstrate the potential of our method to enhance the interpretability and robustness of image classifiers.", "keywords": "explainability;reliability", "primary_area": "visualization or interpretation of learned representations", "supplementary_material": "/attachment/2338da666416b52d0e4a4e8e02397a15b1eba398.zip", "author": "Saeid Asgari;Aliasghar Khani;Amir Hosein Khasahmadi;Ali Saheb Pasand;Aditya Sanghi;Karl D.D. Willis;Ali Mahdavi Amiri", "authorids": "~Saeid_Asgari1;~Aliasghar_Khani1;~Amir_Hosein_Khasahmadi1;~Ali_Saheb_Pasand1;~Aditya_Sanghi1;~Karl_D.D._Willis1;~Ali_Mahdavi_Amiri1", "gender": ";M;M;M;M;;", "homepage": "https://asgsaeid.github.io/;http://aliasgharkhani.github.io/;;https://github.com/sanghiad;https://www.sfu.ca/~amahdavi;;", "dblp": "201/4374.html;;238/1089;;33/10499.html;259/1508;82/121", "google_scholar": "SuePM1sAAAAJ;yr7Y5EcAAAAJ;xjTZIisAAAAJ;q0-11e25FxIC;https://scholar.google.ca/citations?user=M9eTADwAAAAJ;cFpYRhkAAAAJ;yMoEQSMAAAAJ", "orcid": ";;;;;;", "linkedin": ";aliasghar-khani-08157b16b/;;;;amir-khas/;", "or_profile": "~Saeid_Asgari1;~Aliasghar_Khani1;~Ali_Saheb_Pasand1;~Aditya_Sanghi1;~Ali_Mahdavi_Amiri1;~Amir_Hosein_Khasahmadi2;~Karl_Willis1", "aff": "Autodesk;Computing Science, Simon Fraser University;McGill University;Autodesk;Simon Fraser University;Toronto University;Autodesk", "aff_domain": "autodesk.com;cs.sfu.ca;cs.mcgill.ca;autodesk.com;sfu.ca;utoronto.ca;autodesk.com", "position": "Research Scientist;MS student;PhD student;Researcher;Assistant Professor;MS student;Senior Research Manager", "bibtex": "@misc{\nasgari2024learned,\ntitle={Learned Visual Features to Textual Explanations},\nauthor={Saeid Asgari and Aliasghar Khani and Amir Hosein Khasahmadi and Ali Saheb Pasand and Aditya Sanghi and Karl D.D. 
Willis and Ali Mahdavi Amiri},\nyear={2024},\nurl={https://openreview.net/forum?id=2psWOW7JKO}\n}", "github": "", "project": "", "reviewers": "cWhL;zmpz;gvhW;UPwp", "site": "https://openreview.net/forum?id=2psWOW7JKO", "pdf_size": 2080279, "rating": "3;5;5;5", "confidence": "4;3;4;5", "soundness": "1;2;2;3", "contribution": "2;2;2;3", "presentation": "1;3;3;4", "wc_summary": "91;112;61;169", "wc_strengths": "64;92;80;93", "wc_weaknesses": "961;201;259;441", "wc_questions": "149;128;8;114", "wc_review": "1265;533;408;817", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.5, 0.8660254037844386 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.0, 0.7071067811865476 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.75, 1.0897247358851685 ], "wc_summary_avg": [ 108.25, 39.480216564755565 ], "wc_strengths_avg": [ 82.25, 11.712706775122479 ], "wc_weaknesses_avg": [ 465.5, 299.46744397346436 ], "wc_questions_avg": [ 99.75, 54.41679428264771 ], "wc_review_avg": [ 755.75, 329.25474559981666 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=7463041457304754602&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 0, "aff_unique_index": "0;1;2;0;1;3;0", "aff_unique_norm": "Autodesk;Simon Fraser University;McGill University;University of Toronto", "aff_unique_dep": ";Computing Science;;", "aff_unique_url": "https://www.autodesk.com;https://www.sfu.ca;https://www.mcgill.ca;https://www.utoronto.ca", "aff_unique_abbr": "Autodesk;SFU;McGill;U of T", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;1;0;1;1;0", "aff_country_unique": "United States;Canada" }, { "title": "SparseFormer: Sparse Visual Recognition via Limited Latent Tokens", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19535", "id": "2pvECsmld3", "author_site": "Ziteng Gao, Zhan Tong, Limin Wang, Mike Zheng Shou", "tldr": "", "abstract": "Human visual recognition is a sparse process, where only a few salient visual cues are attended to rather than every detail being traversed uniformly. However, most current vision networks follow a dense paradigm, processing every single visual unit (such as pixels or patches) in a uniform manner. In this paper, we challenge this dense convention and present a new vision transformer, coined SparseFormer, to explicitly imitate human's sparse visual recognition in an end-to-end manner. SparseFormer learns to represent images using a highly limited number of tokens (e.g., down to $9$) in the latent space with sparse feature sampling procedure instead of processing dense units in the original image space. Therefore, SparseFormer circumvents most of dense operations on the image space and has much lower computational costs. Experiments on the ImageNet-1K classification show that SparseFormer delivers performance on par with canonical or well-established models while offering more favorable accuracy-throughput tradeoff. Moreover, the design of our network can be easily extended to the video classification task with promising performance with lower compute. 
We hope our work can provide an alternative way for visual modeling and inspire further research on sparse vision architectures. Code and weights are available at https://github.com/showlab/sparseformer.", "keywords": "sparse visual recognition;vision transformer;computer vision;representation learning", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Ziteng Gao;Zhan Tong;Limin Wang;Mike Zheng Shou", "authorids": "~Ziteng_Gao1;~Zhan_Tong1;~Limin_Wang1;~Mike_Zheng_Shou1", "gender": "M;M;M;", "homepage": "https://sebgao.github.io/;https://github.com/yztongzhan;https://wanglimin.github.io;http://www.columbia.edu/~zs2262/", "dblp": "247/1231;236/0753;68/6610-2;284/0807", "google_scholar": "fbSH2CgAAAAJ;6FsgWBMAAAAJ;HEuN8PcAAAAJ;h1-3lSoAAAAJ", "orcid": ";0000-0002-3169-0599;;", "linkedin": ";;;", "or_profile": "~Ziteng_Gao1;~Zhan_Tong1;~Limin_Wang2;~Zheng_Shou1", "aff": "National University of Singapore;Ant Research;Nanjing University;National University of Singapore", "aff_domain": "nus.edu;antgroup.com;nju.edu.cn;nus.edu.sg", "position": "PhD student;Researcher;Full Professor;Assistant Professor", "bibtex": "@inproceedings{\ngao2024sparseformer,\ntitle={SparseFormer: Sparse Visual Recognition via Limited Latent Tokens},\nauthor={Ziteng Gao and Zhan Tong and Limin Wang and Mike Zheng Shou},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=2pvECsmld3}\n}", "github": "", "project": "", "reviewers": "fS4e;H2So;fz8s;SBDj", "pdf_size": 11614788, "rating": "5;6;6;8", "confidence": "4;5;4;3", "soundness": "3;3;3;3", "contribution": "2;2;2;3", "presentation": "3;3;3;3", "wc_summary": "96;43;28;51", "wc_strengths": "114;38;42;27", "wc_weaknesses": "270;56;109;1", "wc_questions": "9;65;27;1", "wc_review": "489;202;206;80", "wc_reply_reviewers": "193;0;0;0", "wc_reply_authors": "1215;867;302;16", "reply_reviewers": "1;0;0;0", "reply_authors": "3;2;1;1", "rating_avg": [ 6.25, 1.0897247358851685 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 54.5, 25.342651794948374 ], "wc_strengths_avg": [ 55.25, 34.361133566865924 ], "wc_weaknesses_avg": [ 109.0, 100.49129315517837 ], "wc_questions_avg": [ 25.5, 24.672859582950654 ], "wc_review_avg": [ 244.25, 150.1072533224161 ], "wc_reply_reviewers_avg": [ 48.25, 83.57145146519834 ], "wc_reply_authors_avg": [ 600.0, 468.8747167421165 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.75, 0.82915619758885 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.6488856845230502, "gs_citation": 11, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10689237670896548255&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=2pvECsmld3", "pdf": "https://openreview.net/pdf?id=2pvECsmld3", "email": "nus.edu;antgroup.com;nju.edu.cn;nus.edu.sg", "author_num": 4, "aff_unique_index": "0;1;2;0", "aff_unique_norm": "National University of Singapore;Ant Research;Nanjing University", "aff_unique_dep": ";;", "aff_unique_url": "https://www.nus.edu.sg;https://www.antgroup.com;https://www.nju.edu.cn", "aff_unique_abbr": "NUS;Ant Research;Nanjing U", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;1;0", "aff_country_unique": 
"Singapore;China" }, { "id": "2qLSkTuqrb", "title": "Translating cognitive models into neural and statistical descriptions of real-world multi-agent foraging behavior", "track": "main", "status": "Reject", "tldr": "", "abstract": "Foraging is a multi-agent social behavior that has been studied from many perspectives, including cognitive science, neuroscience, and statistics. We start from a specific type of cognitive description -- agents with internal preferences expressed as value functions -- and implement it as a biologically plausible neural network. We also present an equivalent statistical model where statistical predictors correspond to components of the value function. We use the neural network to simulate foraging agents in various environmental conditions and use the statistical model to discover which features in the environment best predict the agent's behavior. Our intended primary application is the study of multi-species groups of birds foraging in real-world environments. To test the viability of the statistical approach, we simulate bird agents with different preferences, and use Bayesian inference to recover what each type of agent values. In the multi-agent context, we investigate how communication of information about reward location affects group foraging behavior. We also test our modeling technique on a previously published locust foraging dataset (Gunzel et al., 2023). After evaluating the effectiveness of our method on both synthetic and previously published data, we analyze new multi-agent foraging bird data we captured through high-resolution video recordings. Our method distinguishes between proximity preferences of ducks and sparrows within foraging groups. This analysis framework provides a principled, interpretable, and parametric approach for reasoning about how birds' preferences relate to their decisions about where to move in a complex multi-agent environment.", "keywords": "multi-agent systems;animal behavior;reinforcement learning;probabilistic methods;decision making", "primary_area": "applications to neuroscience & cognitive science", "supplementary_material": "", "author": "Marjorie Xie;Rafal Urbaniak;Emily L Mackevicius", "authorids": "~Marjorie_Xie1;~Rafal_Urbaniak1;~Emily_L_Mackevicius1", "gender": "F;M;", "homepage": ";https://independent.academia.edu/Rafa%C5%82Urbaniak2;", "dblp": ";46/6491;", "google_scholar": ";LOtWV_0AAAAJ;G5eTd40AAAAJ", "orcid": ";0000-0002-6321-2866;", "linkedin": "marjoriexie/;;", "or_profile": "~Marjorie_Xie1;~Rafal_Urbaniak1;~Emily_L_Mackevicius1", "aff": "Arizona State University;University of Gdansk;Columbia University", "aff_domain": "asu.edu;univ.gda.pl;columbia.edu", "position": "Postdoc;Associate Professor;Postdoc", "bibtex": "@misc{\nxie2024translating,\ntitle={Translating cognitive models into neural and statistical descriptions of real-world multi-agent foraging behavior},\nauthor={Marjorie Xie and Rafal Urbaniak and Emily L Mackevicius},\nyear={2024},\nurl={https://openreview.net/forum?id=2qLSkTuqrb}\n}", "github": "", "project": "", "reviewers": "g6r7;3d6u;vuLZ;Vrpj", "site": "https://openreview.net/forum?id=2qLSkTuqrb", "pdf_size": 4732147, "rating": "3;5;5;6", "confidence": "3;2;2;5", "soundness": "2;3;2;3", "contribution": "2;3;2;3", "presentation": "2;1;1;4", "wc_summary": "27;125;75;87", "wc_strengths": "44;47;59;223", "wc_weaknesses": "313;167;288;412", "wc_questions": "155;425;114;89", "wc_review": "539;764;536;811", "wc_reply_reviewers": "512;85;401;149", "wc_reply_authors": "780;230;388;329", 
"reply_reviewers": "2;1;1;1", "reply_authors": "2;1;1;1", "rating_avg": [ 4.75, 1.0897247358851685 ], "confidence_avg": [ 3.0, 1.224744871391589 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.0, 1.224744871391589 ], "wc_summary_avg": [ 78.5, 34.99642838919423 ], "wc_strengths_avg": [ 93.25, 75.12115214771403 ], "wc_weaknesses_avg": [ 295.0, 87.24391096231301 ], "wc_questions_avg": [ 195.75, 134.4384152688509 ], "wc_review_avg": [ 662.5, 126.10412364391578 ], "wc_reply_reviewers_avg": [ 286.75, 175.69060162683718 ], "wc_reply_authors_avg": [ 431.75, 208.83770612607293 ], "reply_reviewers_avg": [ 1.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.3746343246326776, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:7oABOmIY7DkJ:scholar.google.com/&scioq=Translating+cognitive+models+into+neural+and+statistical+descriptions+of+real-world+multi-agent+foraging+behavior&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1;2", "aff_unique_norm": "Arizona State University;University of Gdansk;Columbia University", "aff_unique_dep": ";;", "aff_unique_url": "https://www.asu.edu;https://www.ug.edu.pl;https://www.columbia.edu", "aff_unique_abbr": "ASU;UoG;Columbia", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;0", "aff_country_unique": "United States;Poland" }, { "id": "2rqC5FZiAH", "title": "LOTUS: Evasive and Resilient Backdoor Attacks through Sub-Partitioning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Backdoor attack poses a significant security threat to Deep Learning applications. Existing attacks are often not resilient to established backdoor detection and mitigation approaches. This susceptibility primarily stems from the fact that these attacks typically possess an unbounded or under-bounded attack scope. In other words, the trigger can cause misclassification for any input. This unbounded nature implies that the backdoored model overly emphasizes on spurious features of the trigger (e.g., only the color of a square patch), on which trigger inversion techniques can effortlessly generate effective triggers. In addition, the unbounded attack effects can be easily mitigated by backdoor removal methods.\nIn this paper, we propose a novel backdoor attack LOTUS that is evasive and resilient by restricting the attack scope. Specifically, it leverages a secret function to separate samples in the victim class into a set of partitions and applies unique triggers to different partitions. 
Furthermore, LOTUS incorporates an effective trigger focusing mechanism, ensuring only the trigger corresponding to the partition can induce the backdoor behavior.\nExtensive experimental results show that LOTUS can achieve high attack success rate across 4 datasets and 7 model structures, and effectively evading 13 backdoor detection and mitigation techniques.", "keywords": "Backdoor attack", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "Siyuan Cheng;Guanhong Tao;Yingqi Liu;Guangyu Shen;Shengwei An;Shiwei Feng;Xiangzhe Xu;Kaiyuan Zhang;Shiqing Ma;Xiangyu Zhang", "authorids": "~Siyuan_Cheng1;~Guanhong_Tao1;~Yingqi_Liu1;~Guangyu_Shen1;~Shengwei_An1;~Shiwei_Feng1;~Xiangzhe_Xu1;~Kaiyuan_Zhang1;~Shiqing_Ma2;~Xiangyu_Zhang3", "gender": "M;;M;M;;M;;M;;M", "homepage": "https://www.cs.purdue.edu/homes/cheng535/;;https://www.cs.purdue.edu/homes/liu1751/;;https://www.cs.purdue.edu/homes/an93/;https://www.cs.purdue.edu/homes/feng292/;https://sites.google.com/view/alex-xu/;https://kaiyuanzhang.com/;https://people.cs.umass.edu/~shiqingma/;https://www.cs.purdue.edu/homes/xyzhang", "dblp": "263/7049;;92/10048;216/6403;168/9413;138/9141-2;276/3462;147/6644-2;172/8745;", "google_scholar": "GcL9AFMAAAAJ;;gOPVK2UAAAAJ;YiMTVwgAAAAJ;qcmmzeEAAAAJ;https://scholar.google.com/citations?hl=en;;https://scholar.google.com/citations?hl=en;X_mDnjkAAAAJ;PXbu1wIAAAAJ", "orcid": ";;;;;0000-0001-6959-4327;;0000-0001-6023-363X;0000-0003-1551-8948;", "linkedin": "sycheng98/;;;;;swfeng98/;;kaiyuan-zhang/;shiqing-ma-6590b086;", "or_profile": "~Siyuan_Cheng1;~Guanhong_Tao1;~Yingqi_Liu1;~Guangyu_Shen1;~Shengwei_An1;~Shiwei_Feng1;~Xiangzhe_Xu1;~Kaiyuan_Zhang1;~Shiqing_Ma2;~Xiangyu_Zhang3", "aff": "Sony AI;;Microsoft;Purdue University;Purdue University;Purdue University;Purdue University;Purdue University;University of Massachusetts at Amherst;Purdue University", "aff_domain": "sony.com;;microsoft.com;purdue.edu;purdue.edu;cs.purdue.edu;purdue.edu;cs.purdue.edu;umass.edu;cs.purdue.edu", "position": "Intern;;Researcher;PhD student;PhD student;PhD student;PhD student;PhD student;Assistant Professor;Full Professor", "bibtex": "@misc{\ncheng2024lotus,\ntitle={{LOTUS}: Evasive and Resilient Backdoor Attacks through Sub-Partitioning},\nauthor={Siyuan Cheng and Guanhong Tao and Yingqi Liu and Guangyu Shen and Shengwei An and Shiwei Feng and Xiangzhe Xu and Kaiyuan Zhang and Shiqing Ma and Xiangyu Zhang},\nyear={2024},\nurl={https://openreview.net/forum?id=2rqC5FZiAH}\n}", "github": "", "project": "", "reviewers": "Mwh5;rKsD;1k7k", "site": "https://openreview.net/forum?id=2rqC5FZiAH", "pdf_size": 3226786, "rating": "3;6;6", "confidence": "4;3;3", "soundness": "2;2;3", "contribution": "2;2;3", "presentation": "1;3;3", "wc_summary": "73;129;81", "wc_strengths": "57;247;57", "wc_weaknesses": "405;133;23", "wc_questions": "6;63;204", "wc_review": "541;572;365", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 5.0, 1.4142135623730951 ], "confidence_avg": [ 3.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.3333333333333335, 0.9428090415820634 ], "wc_summary_avg": [ 94.33333333333333, 24.729649321321876 ], "wc_strengths_avg": [ 120.33333333333333, 89.56685895029602 ], "wc_weaknesses_avg": [ 187.0, 160.55736254269584 ], "wc_questions_avg": [ 91.0, 
83.22259308625273 ], "wc_review_avg": [ 492.6666666666667, 91.15676363032836 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 3, 0 ], "authors#_avg": [ 10, 0 ], "corr_rating_confidence": -1.0, "gs_citation": 5, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=17091094092122633244&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 9, "aff_unique_index": "0;1;2;2;2;2;2;3;2", "aff_unique_norm": "Sony;Microsoft;Purdue University;University of Massachusetts Amherst", "aff_unique_dep": "Sony AI;Microsoft Corporation;;", "aff_unique_url": "https://www.sony.com;https://www.microsoft.com;https://www.purdue.edu;https://www.umass.edu", "aff_unique_abbr": "Sony AI;Microsoft;Purdue;UMass Amherst", "aff_campus_unique_index": "1", "aff_campus_unique": ";Amherst", "aff_country_unique_index": "0;1;1;1;1;1;1;1;1", "aff_country_unique": "Japan;United States" }, { "id": "2sCcTMWPc2", "title": "TimelyGPT: Recurrent Convolutional Transformer for Long Time-series Representation", "track": "main", "status": "Reject", "tldr": "", "abstract": "Pre-trained models (PTMs) have gained prominence in Natural Language Processing and Computer Vision domains. When it comes to time-series PTMs, their development has been limited. Previous research on time-series transformers has mainly been devoted to small-scale tasks, yet these models have not consistently outperformed traditional models. Additionally, the performance of these transformers on large-scale data remains unexplored. These findings raise doubts about Transformer's capabilities to scale up and capture temporal dependencies. In this study, we re-examine time-series transformers and identify the shortcomings of prior studies. Drawing from these insights, we then introduce a pioneering architecture called Timely Generative Pre-trained Transformer (TimelyGPT). This architecture integrates recurrent attention and temporal convolution modules to effectively capture global-local temporal dependencies in long sequences. The relative position embedding with time decay can effectively deal with trend and periodic patterns from time-series. Our experiments show that TimelyGPT excels in modeling continuously monitored biosignal as well as irregularly-sampled time-series data commonly observed in longitudinal electronic health records. 
This breakthrough suggests a priority shift in time-series deep learning research, moving from small-scale modeling from scratch to large-scale pre-training.", "keywords": "GPT;Recurrent Neural Network;Position Embedding;Time-series representation", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/4fb3df9a8f2fcc826d97acf84bded029dccf72ab.zip", "author": "Ziyang Song;Qincheng Lu;Hao Xu;Yue Li", "authorids": "~Ziyang_Song4;~Qincheng_Lu1;~Hao_Xu17;~Yue_Li15", "gender": "M;;F;M", "homepage": ";https://github.com/wzzlcss;;https://www.cs.mcgill.ca/~yueli/", "dblp": ";;;", "google_scholar": "fptMer8AAAAJ;;;yJgWSl0AAAAJ", "orcid": ";;;0000-0003-3844-4865", "linkedin": ";;hao-xu-41ba83187;yuelicb/", "or_profile": "~Ziyang_Song4;~Qincheng_Lu1;~Hao_Xu17;~Yue_Li15", "aff": "McGill University;McGill University;McGill University, McGill University;McGill University", "aff_domain": "mail.mcgill.ca;mcgill.ca;mail.mcgill.ca;cs.mcgill.ca", "position": "PhD student;PhD student;Undergrad student;Assistant Professor", "bibtex": "@misc{\nsong2024timelygpt,\ntitle={Timely{GPT}: Recurrent Convolutional Transformer for Long Time-series Representation},\nauthor={Ziyang Song and Qincheng Lu and Hao Xu and Yue Li},\nyear={2024},\nurl={https://openreview.net/forum?id=2sCcTMWPc2}\n}", "github": "", "project": "", "reviewers": "JDYd;ZDVD;5JkM;BKAB", "site": "https://openreview.net/forum?id=2sCcTMWPc2", "pdf_size": 1894723, "rating": "5;5;6;6", "confidence": "4;4;5;3", "soundness": "3;2;3;3", "contribution": "3;2;2;2", "presentation": "2;1;3;3", "wc_summary": "116;55;68;41", "wc_strengths": "117;35;71;77", "wc_weaknesses": "134;390;110;148", "wc_questions": "65;4;40;5", "wc_review": "432;484;289;271", "wc_reply_reviewers": "29;412;67;0", "wc_reply_authors": "1309;2947;1335;767", "reply_reviewers": "1;1;1;0", "reply_authors": "4;6;3;2", "rating_avg": [ 5.5, 0.5 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.25, 0.82915619758885 ], "wc_summary_avg": [ 70.0, 28.222331583340168 ], "wc_strengths_avg": [ 75.0, 29.086079144497972 ], "wc_weaknesses_avg": [ 195.5, 113.11388066899659 ], "wc_questions_avg": [ 28.5, 25.578311124857326 ], "wc_review_avg": [ 369.0, 91.1015916436151 ], "wc_reply_reviewers_avg": [ 127.0, 166.2513157842668 ], "wc_reply_authors_avg": [ 1589.5, 815.8987375894144 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 3.75, 1.479019945774904 ], "replies_avg": [ 24, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:VfnyZlrcICUJ:scholar.google.com/&scioq=TimelyGPT:+Recurrent+Convolutional+Transformer+for+Long+Time-series+Representation&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "McGill University", "aff_unique_dep": "", "aff_unique_url": "https://www.mcgill.ca", "aff_unique_abbr": "McGill", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "Canada" }, { "title": "Enabling Lanuguage Models to Implicitly Learn Self-Improvement", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19534", "id": "2tVHNRZuCs", "author_site": "Ziqi Wang, Le Hou, Tianjian Lu, Yuexin Wu, Yunxuan Li, Hongkun Yu, Heng Ji", "tldr": "", "abstract": "Large Language 
Models (LLMs) have demonstrated remarkable capabilities in open-ended text generation tasks. However, the inherent open-ended nature of these tasks implies that there is always room for improvement in the quality of model responses. To address this challenge, various approaches have been proposed to enhance the performance of LLMs. There has been a growing focus on enabling LLMs to self-improve their response quality, thereby reducing the reliance on extensive human annotation efforts for collecting diverse and high-quality training data. Recently, prompting-based methods have been widely explored among self-improvement methods owing to their effectiveness, efficiency, and convenience. However, those methods usually require explicitly and thoroughly written rubrics as inputs to LLMs. It is expensive and challenging to manually derive and provide all necessary rubrics with a real-world complex goal for improvement (e.g., being more helpful and less harmful). To this end, we propose an imPlicit self-ImprovemenT (PIT) framework that implicitly learns the improvement goal from human preference data. PIT only requires preference data that are used to train reward models with no extra human effort. Specifically, we reformulate the training objective of reinforcement learning from human feedback (RLHF) -- instead of maximizing response quality for a given input, we maximize the quality gap of the response conditioned on a reference response. In this way, PIT is implicitly trained with the improvement goal of better aligning with human preferences. Experiments on two real-world datasets and one synthetic dataset show that our method significantly outperforms prompting-based methods.", "keywords": "large language models; self-improvement; alignment", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Ziqi Wang;Le Hou;Tianjian Lu;Yuexin Wu;Yunxuan Li;Hongkun Yu;Heng Ji", "authorids": "~Ziqi_Wang2;~Le_Hou1;~Tianjian_Lu1;~Yuexin_Wu1;~Yunxuan_Li2;~Hongkun_Yu2;~Heng_Ji3", "gender": ";M;M;M;M;M;F", "homepage": "https://www.wzq016.github.io;http://vision.cs.stonybrook.edu/~lehhou/home/index.html;;https://crickwu.github.io;;;http://blender.cs.illinois.edu/hengji.html", "dblp": "38/8097-3;161/9892;;09/1661;;;", "google_scholar": "xYRZiZkAAAAJ;kQ0HeQIAAAAJ;eWEj9g0AAAAJ;sd0nprMAAAAJ;Nun8Dy0AAAAJ;;z7GCqT4AAAAJ", "orcid": ";0000-0001-7323-5300;;;;;", "linkedin": ";;;;;;", "or_profile": "~Ziqi_Wang2;~Le_Hou1;~Tianjian_Lu1;~Yuexin_Wu1;~Yunxuan_Li2;~Hongkun_Yu2;~Heng_Ji3", "aff": "Meta Facebook;Google Research;Google;Google;Google;;University of Illinois, Urbana-Champaign", "aff_domain": "meta.com;google.com;google.com;google.com;google.com;;uiuc.edu", "position": "Intern;Software Engineer;Engineer;Software Engineer;Researcher;;Full Professor", "bibtex": "@inproceedings{\nwang2024enabling,\ntitle={Enabling Lanuguage Models to Implicitly Learn Self-Improvement},\nauthor={Ziqi Wang and Le Hou and Tianjian Lu and Yuexin Wu and Yunxuan Li and Hongkun Yu and Heng Ji},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=2tVHNRZuCs}\n}", "github": "", "project": "", "reviewers": "LeAH;tfvt;c4bA;xn4T", "pdf_size": 599775, "rating": "6;6;6;6", "confidence": "3;3;3;3", "soundness": "3;3;3;4", "contribution": "3;3;3;3", "presentation": "2;4;3;3", "wc_summary": "51;154;41;69", "wc_strengths": "105;133;54;92", "wc_weaknesses": "95;177;55;45",
"wc_questions": "1;245;1;82", "wc_review": "252;709;151;288", "wc_reply_reviewers": "20;0;0;0", "wc_reply_authors": "496;1549;318;724", "reply_reviewers": "1;0;0;0", "reply_authors": "3;5;2;2", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 3.0, 0.0 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 78.75, 44.589096200752934 ], "wc_strengths_avg": [ 96.0, 28.416544476765644 ], "wc_weaknesses_avg": [ 93.0, 51.980765673468106 ], "wc_questions_avg": [ 82.25, 99.6126874449234 ], "wc_review_avg": [ 350.0, 213.266265499258 ], "wc_reply_reviewers_avg": [ 5.0, 8.660254037844387 ], "wc_reply_authors_avg": [ 771.75, 471.25490713625464 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 3.0, 1.224744871391589 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11160867810813975791&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=2tVHNRZuCs", "pdf": "https://openreview.net/pdf?id=2tVHNRZuCs", "email": "meta.com;google.com;google.com;google.com;google.com;;uiuc.edu", "author_num": 7, "aff_unique_index": "0;1;1;1;1;2", "aff_unique_norm": "Meta;Google;University of Illinois", "aff_unique_dep": "Meta Platforms, Inc.;Google Research;", "aff_unique_url": "https://meta.com;https://research.google;https://illinois.edu", "aff_unique_abbr": "Meta;Google Research;UIUC", "aff_campus_unique_index": "1;1;1;1;2", "aff_campus_unique": ";Mountain View;Urbana-Champaign", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "2uHTuvDkLZ", "title": "Physics-aware Causal Graph Network for Spatiotemporal Modeling", "track": "main", "status": "Reject", "tldr": "", "abstract": "Interpretable physics equations are widely recognized as valuable inductive biases for constructing robust spatiotemporal models. To harness these valuable pieces of knowledge, existing approaches often presuppose access to the exact underlying equations. However, such an assumption usually doesn't hold, especially in the context of real-world observations. Conversely, causality systematically captures the fundamental causal relations across space and time that are intrinsically present in physics dynamics. Nevertheless, causality is often ignored as a means of integrating prior physics knowledge. In this work, we propose a novel approach that effectively captures and leverages causality to integrate physics equations into spatiotemporal models, without assuming access to precise physics principles. \nSpecifically, we introduce a physics-aware spatiotemporal causal graph network (P-stCGN). Causal relationships are analytically derived from prior physics knowledge and serve as physics-aware causality labels. A causal module is introduced to learn causal weights from spatially close and temporally past observations to current observations via semi-supervised learning. Given the learned causal structure, a forecasting module is introduced to perform predictions guided by the cause-effect relations. Extensive experiments on time series data show that our semi-supervised causal learning approach is robust with noisy and limited data. 
Furthermore, our evaluations on real-world graph signals demonstrate superior forecasting performance, achieved by utilizing prior physics knowledge from a causal perspective.", "keywords": "physics-informed deep learning; causal learning; spatiotemporal learning", "primary_area": "neurosymbolic & hybrid AI systems (physics-informed, logic & formal reasoning, etc.)", "supplementary_material": "/attachment/5873a933b20dc180f679318946973106e5a5d0fa.pdf", "author": "Sungyong Seo;Zijun Cui;Sam Griesemer;Joshua Hikida;Yan Liu", "authorids": "~Sungyong_Seo1;~Zijun_Cui1;~Sam_Griesemer1;joshua.hikida@gmail.com;~Yan_Liu1", "gender": "M;;M;;F", "homepage": "https://sungyongs.github.io/;https://zijunjkl.github.io/;https://samgriesemer.com;;http://www-bcf.usc.edu/~liu32/", "dblp": "178/3209;266/4675;317/5153;;150/4295", "google_scholar": "spYH0tEAAAAJ;https://scholar.google.com/citations?hl=en;fBZ3_FsAAAAJ;;UUKLPMYAAAAJ", "orcid": "0009-0001-0285-5868;0000-0002-4362-197X;0009-0009-0192-9405;;0000-0002-7055-9518", "linkedin": ";;;;", "or_profile": "~Sungyong_Seo1;~Zijun_Cui1;~Sam_Griesemer1;joshua.hikida@gmail.com;~Yan_Liu1", "aff": "Google;University of Southern California;University of Southern California;;University of Southern California", "aff_domain": "google.com;usc.edu;usc.edu;;usc.edu", "position": "Researcher;Postdoc;PhD student;;Professor", "bibtex": "@misc{\nseo2024physicsaware,\ntitle={Physics-aware Causal Graph Network for Spatiotemporal Modeling},\nauthor={Sungyong Seo and Zijun Cui and Sam Griesemer and Joshua Hikida and Yan Liu},\nyear={2024},\nurl={https://openreview.net/forum?id=2uHTuvDkLZ}\n}", "github": "", "project": "", "reviewers": "cRbd;pHbu;EyEy;B5jF", "site": "https://openreview.net/forum?id=2uHTuvDkLZ", "pdf_size": 1130397, "rating": "3;3;5;6", "confidence": "4;5;4;4", "soundness": "3;2;3;3", "contribution": "3;2;2;3", "presentation": "2;3;3;2", "wc_summary": "76;43;141;82", "wc_strengths": "42;33;33;23", "wc_weaknesses": "171;382;134;61", "wc_questions": "69;8;2;3", "wc_review": "358;466;310;169", "wc_reply_reviewers": "0;18;0;0", "wc_reply_authors": "197;208;157;212", "reply_reviewers": "0;1;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 4.25, 1.299038105676658 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 85.5, 35.316426772820606 ], "wc_strengths_avg": [ 32.75, 6.722164829874376 ], "wc_weaknesses_avg": [ 187.0, 119.3377559701874 ], "wc_questions_avg": [ 20.5, 28.09359357576029 ], "wc_review_avg": [ 325.75, 106.68733523713112 ], "wc_reply_reviewers_avg": [ 4.5, 7.794228634059948 ], "wc_reply_authors_avg": [ 193.5, 21.777281740382566 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.5555555555555555, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11034681177519116032&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 0, "aff_unique_index": "0;1;1;1", "aff_unique_norm": "Google;University of Southern California", "aff_unique_dep": "Google;", "aff_unique_url": "https://www.google.com;https://www.usc.edu", "aff_unique_abbr": "Google;USC", "aff_campus_unique_index": "0;1;1;1", "aff_campus_unique": "Mountain View;Los Angeles", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "id": "2uwvigLUr8", "title": "From Deterministic to Probabilistic World: 
Balancing Enhanced Doubly Robust Learning for Debiased Recommendation", "track": "main", "status": "Reject", "tldr": "", "abstract": "In recommender systems, selection bias arises from the users' selective interactions with items, which poses a widely-recognized challenge for unbiased evaluation and learning for recommendation models. Recently, doubly robust and its variants have been widely studied to achieve debiased learning of prediction models, which enables unbiasedness when either imputed errors or learned propensities are accurate. However, we find that previous studies achieve unbiasedness using the doubly robust learning approaches are all based on deterministic error imputation model and deterministic propensity model, and these approaches fail to be unbiased when using probabilistic models to impute errors and learn propensities. To tackle this problem, in this paper, we first derive the bias of doubly robust learning methods and provide alternative unbiasedness conditions for probabilistic models. Then we propose a novel balancing enhanced doubly robust joint learning approach, which improves the accuracy of the imputed errors and leads to unbiased learning under probabilistic error imputations and learned propensities. We further derive the generalization error bound when using the probabilistic models, and show that it can be effectively controlled by the proposed learning approach. We conduct extensive experiments on three real-world datasets, including a large-scale industrial dataset, to demonstrate the effectiveness of the proposed method.", "keywords": "Recommender system;Selection bias;Doubly robust;Probabilistic model", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/25d5730a6cbaad6e33116f077c573080bb783609.zip", "author": "Haoxuan Li;Chunyuan Zheng;Yanghao Xiao;Min Zhang;Xu Chen;Xiao-Hua Zhou", "authorids": "~Haoxuan_Li6;~Chunyuan_Zheng1;~Yanghao_Xiao1;~Min_Zhang17;~Xu_Chen13;~Xiao-Hua_Zhou1", "gender": "M;M;;;M;", "homepage": "https://haoxuanli-pku.github.io/;;;;https://gsai.ruc.edu.cn/chenxu;", "dblp": "145/4965-1.html;;322/6462;;83/6331-17;", "google_scholar": "gtDqiucAAAAJ;https://scholar.google.com/citations?hl=en;hzfFzKUAAAAJ;;loPoqy0AAAAJ;YJNYC40AAAAJ", "orcid": "0000-0003-3620-3769;0000-0002-0306-7310;0000-0001-9929-4448;;0000-0003-0144-1775;", "linkedin": ";;;;;", "or_profile": "~Haoxuan_Li6;~Chunyuan_Zheng1;~Yanghao_Xiao1;~Min_Zhang17;~Xu_Chen13;~Xiao-Hua_Zhou1", "aff": "Peking University;Peking University;University of Chinese Academy of Sciences;;Renmin University of China;", "aff_domain": "pku.edu.cn;stu.pku.edu.cn;ucas.ac.cn;;ruc.edu.cn;", "position": "PhD student;PhD student;PhD student;;Associate Professor;", "bibtex": "@misc{\nli2024from,\ntitle={From Deterministic to Probabilistic World: Balancing Enhanced Doubly Robust Learning for Debiased Recommendation},\nauthor={Haoxuan Li and Chunyuan Zheng and Yanghao Xiao and Min Zhang and Xu Chen and Xiao-Hua Zhou},\nyear={2024},\nurl={https://openreview.net/forum?id=2uwvigLUr8}\n}", "github": "", "project": "", "reviewers": "oqbo;XsAT;gTTa", "site": "https://openreview.net/forum?id=2uwvigLUr8", "pdf_size": 397216, "rating": "3;6;8", "confidence": "4;2;4", "soundness": "2;3;3", "contribution": "2;3;3", "presentation": "2;3;3", "wc_summary": "62;112;98", "wc_strengths": "50;12;38", "wc_weaknesses": "283;1;182", "wc_questions": "2;1;3", "wc_review": "397;126;321", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": 
"0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 5.666666666666667, 2.0548046676563256 ], "confidence_avg": [ 3.3333333333333335, 0.9428090415820634 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 90.66666666666667, 21.06075866524175 ], "wc_strengths_avg": [ 33.333333333333336, 15.860503004493758 ], "wc_weaknesses_avg": [ 155.33333333333334, 116.65999980951293 ], "wc_questions_avg": [ 2.0, 0.816496580927726 ], "wc_review_avg": [ 281.3333333333333, 114.13539717760169 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.11470786693528094, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:qAn4xqe8nxsJ:scholar.google.com/&scioq=From+Deterministic+to+Probabilistic+World:+Balancing+Enhanced+Doubly+Robust+Learning+for+Debiased+Recommendation&hl=en&as_sdt=0,44", "gs_version_total": 0, "aff_unique_index": "0;0;1;2", "aff_unique_norm": "Peking University;University of Chinese Academy of Sciences;Renmin University of China", "aff_unique_dep": ";;", "aff_unique_url": "http://www.pku.edu.cn;http://www.ucas.ac.cn;http://www.ruc.edu.cn", "aff_unique_abbr": "Peking U;UCAS;RUC", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "China" }, { "id": "2vARyD50w1", "title": "A Two-Branch Neural Network Architecture for Model Protection within Trusted Execution Environments", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Deep Neural Networks (DNNs) become increasingly prevalent in mobile applications on edge devices. As the model architecture and weights represent valuable intellectual property for model providers, it's necessary to protect them during inference. Previous works attempted to secure on-device machine learning by leveraging Trusted Execution Environments (TEEs). However, the constrained memory within TEEs prevents the direct model placement, and significant latency overhead is raised when partitioning the model and executing by a sequence in TEE. In our research, we propose a novel framework to restructure conventional CNN models into a unique two-branch architecture that is compatible with TEE deployments. Specifically, the framework generates a model that consists of a branch placed in a normal execution environment and a lightweight counterpart within the TEE. By facilitating unidirectional communication between the two branches, the confidentiality of the model can be protected. To figure out the best architecture for the newly generated network, we introduce a progressive pruning method to gradually identify and remove the redundant channel for the two branches at the same time while maintaining a high inference accuracy for the benign user. Our comprehensive experiments, involving a variety of DNNs and datasets, attest to the effectiveness of our framework. 
It offers robust security assurances while ensuring efficient computational latency.", "keywords": "Trusted Execution Environment;Security", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "Ziyu Liu;Yukui Luo;Xiaolin Xu", "authorids": "~Ziyu_Liu4;~Yukui_Luo1;~Xiaolin_Xu3", "gender": ";M;", "homepage": "https://orcid.org/0000-0003-1844-1114;;", "dblp": ";221/0729;", "google_scholar": ";sOWfQKEAAAAJ;", "orcid": ";0000-0002-5852-4195;", "linkedin": ";;", "or_profile": "~Ziyu_Liu4;~Yukui_Luo1;~Xiaolin_Xu3", "aff": "State University of New York at Binghamton;United States;", "aff_domain": "binghamton.edu;umassd.edu;", "position": "PhD student;Assistant Professor;", "bibtex": "@misc{\nliu2024a,\ntitle={A Two-Branch Neural Network Architecture for Model Protection within Trusted Execution Environments},\nauthor={Ziyu Liu and Yukui Luo and Xiaolin Xu},\nyear={2024},\nurl={https://openreview.net/forum?id=2vARyD50w1}\n}", "github": "", "project": "", "reviewers": "", "site": "https://openreview.net/forum?id=2vARyD50w1", "pdf_size": 0, "rating": "", "confidence": "", "soundness": "", "contribution": "", "presentation": "", "wc_summary": "", "wc_strengths": "", "wc_weaknesses": "", "wc_questions": "", "wc_review": "", "wc_reply_reviewers": "", "wc_reply_authors": "", "reply_reviewers": "", "reply_authors": "", "rating_avg": [ 0, 0 ], "confidence_avg": [ 0, 0 ], "soundness_avg": [ 0, 0 ], "contribution_avg": [ 0, 0 ], "presentation_avg": [ 0, 0 ], "wc_summary_avg": [ 0, 0 ], "wc_strengths_avg": [ 0, 0 ], "wc_weaknesses_avg": [ 0, 0 ], "wc_questions_avg": [ 0, 0 ], "wc_review_avg": [ 0, 0 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 0, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:Ys9klcchjwUJ:scholar.google.com/&scioq=A+Two-Branch+Neural+Network+Architecture+for+Model+Protection+within+Trusted+Execution+Environments&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;1", "aff_unique_norm": "State University of New York at Binghamton;United States", "aff_unique_dep": ";", "aff_unique_url": "https://www.binghamton.edu;https://www.usa.gov", "aff_unique_abbr": "SUNY Binghamton;US", "aff_campus_unique_index": "0", "aff_campus_unique": "Binghamton;", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "id": "2vAhX71UCL", "title": "Dreamix: Video Diffusion Models are General Video Editors", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Text-driven image and video diffusion models have recently achieved unprecedented generation realism. While diffusion models have been successfully applied for image editing, none can edit motion in video. We present the first diffusion-based method that is able to perform text-based motion and appearance editing of general, real-world videos. Our approach uses a video diffusion model to combine, at inference time, the low-resolution spatio-temporal information from the original video with new, high resolution information that it synthesized to align with the guiding text prompt. As maintaining high-fidelity to the original video requires retaining some of its high-resolution information, we add a preliminary stage of finetuning the model on the original video, significantly boosting fidelity. 
We propose to improve motion editability by using a mixed objective that jointly finetunes with full temporal attention and with temporal attention masking. We extend our method for animating images, bringing them to life by adding motion to existing or new objects, and camera movements. Extensive experiments showcase our method's remarkable ability to edit motion in videos.", "keywords": "Video Diffusion;Video Motion Editing", "primary_area": "generative models", "supplementary_material": "/attachment/42a86714507cbe50b9d004fa457d752f84311cdf.zip", "author": "Eyal Molad;Eliahu Horwitz;Dani Valevski;Alex Rav-Acha;Yossi Matias;Yael Pritch;Yaniv Leviathan;Yedid Hoshen", "authorids": "~Eyal_Molad1;~Eliahu_Horwitz1;~Dani_Valevski1;~Alex_Rav-Acha1;~Yossi_Matias2;~Yael_Pritch1;~Yaniv_Leviathan1;~Yedid_Hoshen3", "gender": "M;M;M;M;M;F;;M", "homepage": "https://www.facebook.com/eyal.molad.5;https://horwitz.ai;;https://www.linkedin.com/in/alexravacha/?originalSubdomain=il;https://research.google/people/YossiMatias/;https://research.google/people/106214/;https://yanivle.github.io/;https://www.cs.huji.ac.il/~ydidh/", "dblp": "22/1540;268/8318;331/5332;;m/YossiMatias;15/1134;331/5369;136/0280", "google_scholar": ";NyLx5nIAAAAJ;ECKZ08wAAAAJ;NIRv_L8AAAAJ;https://scholar.google.com/citations?hl=en;https://scholar.google.com/citations?hl=en;O9fbn38AAAAJ;https://scholar.google.co.il/citations?user=6y1-qS4AAAAJ", "orcid": ";;;;;;0009-0000-4080-4845;", "linkedin": ";eliahu-horwitz/;dani-valevski-a3b5936/?originalSubdomain=il;alexravacha/?originalSubdomain=il;yossimatias/;;yaniv-leviathan/;", "or_profile": "~Eyal_Molad1;~Eliahu_Horwitz1;~Dani_Valevski1;~Alex_Rav-Acha1;~Yossi_Matias2;~Yael_Pritch1;~Yaniv_Leviathan1;~Yedid_Hoshen3", "aff": "Google;Hebrew University of Jerusalem;Google;Google;Tel Aviv University;Google Research;Google;Google", "aff_domain": "google.com;huji.ac.il;google.com;google.com;tau.ac.il;google.com;google.com;google.com", "position": "Researcher;PhD student;Researcher;Researcher;Faculty;Researcher;Researcher;Researcher", "bibtex": "@misc{\nmolad2024dreamix,\ntitle={Dreamix: Video Diffusion Models are General Video Editors},\nauthor={Eyal Molad and Eliahu Horwitz and Dani Valevski and Alex Rav-Acha and Yossi Matias and Yael Pritch and Yaniv Leviathan and Yedid Hoshen},\nyear={2024},\nurl={https://openreview.net/forum?id=2vAhX71UCL}\n}", "github": "", "project": "", "reviewers": "UUNx;cmbb;E6Fh;JbPW", "site": "https://openreview.net/forum?id=2vAhX71UCL", "pdf_size": 24795060, "rating": "3;5;5;8", "confidence": "5;3;4;5", "soundness": "2;3;3;3", "contribution": "2;3;2;3", "presentation": "2;3;3;3", "wc_summary": "41;94;51;59", "wc_strengths": "25;41;36;50", "wc_weaknesses": "306;135;152;91", "wc_questions": "2;3;4;129", "wc_review": "374;273;243;329", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "321;293;223;187", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 5.25, 1.7853571071357126 ], "confidence_avg": [ 4.25, 0.82915619758885 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 61.25, 19.954636052807377 ], "wc_strengths_avg": [ 38.0, 9.027735042633894 ], "wc_weaknesses_avg": [ 171.0, 81.0586207630009 ], "wc_questions_avg": [ 34.5, 54.56418239101544 ], "wc_review_avg": [ 304.75, 50.509281325316834 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 256.0, 53.48831648126533 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], 
"replies_avg": [ 9, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": 0.1266600992762247, "gs_citation": 189, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=4680453094018320926&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "aff_unique_index": "0;1;0;0;2;0;0;0", "aff_unique_norm": "Google;Hebrew University of Jerusalem;Tel Aviv University", "aff_unique_dep": "Google;;", "aff_unique_url": "https://www.google.com;https://www.huji.ac.il;https://www.tau.ac.il", "aff_unique_abbr": "Google;HUJI;TAU", "aff_campus_unique_index": "0;1;0;0;0;0;0", "aff_campus_unique": "Mountain View;Jerusalem;", "aff_country_unique_index": "0;1;0;0;1;0;0;0", "aff_country_unique": "United States;Israel" }, { "id": "2wFXD2upSQ", "title": "A Demon at Work: Leveraging Neuron Death for Efficient Neural Network Pruning", "track": "main", "status": "Reject", "tldr": "", "abstract": "When training deep neural networks, the phenomenon of \"dying neurons\" \u2014units that become inactive and output zero throughout training\u2014has traditionally been viewed as undesirable, linked with optimization challenges, and contributing to plasticity loss, particularly in continual learning scenarios. In this paper, we reassess this phenomenon through the lens of network sparsity and pruning. By systematically exploring the influence of various hyperparameter configurations on the occurrence of dying neurons, we unveil their potential to facilitate simple yet effective structured pruning algorithms. We introduce \"Demon's Pruning\" (DemP), a method that controls the proliferation of dead neurons, dynamically sparsifying neural networks as training progresses. Remarkably, our approach, characterized by its simplicity and broad applicability, outperforms existing structured pruning techniques, while achieving results comparable to prevalent unstructured pruning methods. 
These findings pave the way for leveraging dying neurons as a valuable resource for efficient model compression and optimization.", "keywords": "Pruning;Sparsity;Deep Learning;Regularization;Model Compression", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/607e518fa6d13a801a426ee1054563b8b7ecd961.pdf", "author": "Simon Dufort-Labb\u00e9;Pierluca D'Oro;Evgenii Nikishin;Razvan Pascanu;Pierre-Luc Bacon;Aristide Baratin", "authorids": "~Simon_Dufort-Labb\u00e91;~Pierluca_D'Oro1;~Evgenii_Nikishin1;~Razvan_Pascanu1;~Pierre-Luc_Bacon1;~Aristide_Baratin1", "gender": "M;M;M;M;;", "homepage": "https://github.com/SimonDufLab/;https://proceduralia.github.io;http://evgenii-nikishin.github.io/;https://razp.info;;", "dblp": "314/6338.html;248/8326;294/4770;65/8368.html;;", "google_scholar": ";https://scholar.google.it/citations?user=AuVp7pkAAAAJ;ez9FSEAAAAAJ;https://scholar.google.ca/citations?user=eSPY8LwAAAAJ;;", "orcid": ";;;;;", "linkedin": "simon-dufort-labb%C3%A9-8593421b5/;;;;;", "or_profile": "~Simon_Dufort-Labb\u00e91;~Pierluca_D'Oro1;~Evgenii_Nikishin1;~Razvan_Pascanu1;~Pierre-Luc_Bacon1;~Aristide_Baratin1", "aff": "Universit\u00e9 de Montr\u00e9al;Universit\u00e9 de Montr\u00e9al;University of Montreal;Google DeepMind;;", "aff_domain": "umontreal.ca;umontreal.ca;umontreal.ca;google.com;;", "position": "PhD student;PhD student;PhD student;Research Scientist;;", "bibtex": "@misc{\ndufort-labb{\\'e}2024a,\ntitle={A Demon at Work: Leveraging Neuron Death for Efficient Neural Network Pruning},\nauthor={Simon Dufort-Labb{\\'e} and Pierluca D'Oro and Evgenii Nikishin and Razvan Pascanu and Pierre-Luc Bacon and Aristide Baratin},\nyear={2024},\nurl={https://openreview.net/forum?id=2wFXD2upSQ}\n}", "github": "", "project": "", "reviewers": "tiWA;i9Pr;k7gu;YsTs", "site": "https://openreview.net/forum?id=2wFXD2upSQ", "pdf_size": 1159785, "rating": "5;5;6;6", "confidence": "2;4;3;3", "soundness": "3;4;2;3", "contribution": "2;2;2;2", "presentation": "2;3;2;3", "wc_summary": "44;56;84;63", "wc_strengths": "45;34;48;116", "wc_weaknesses": "288;76;196;44", "wc_questions": "3;132;86;600", "wc_review": "380;298;414;823", "wc_reply_reviewers": "107;0;0;166", "wc_reply_authors": "509;663;601;896", "reply_reviewers": "1;0;0;1", "reply_authors": "2;1;1;2", "rating_avg": [ 5.5, 0.5 ], "confidence_avg": [ 3.0, 0.7071067811865476 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 61.75, 14.53229162933362 ], "wc_strengths_avg": [ 60.75, 32.32162588732194 ], "wc_weaknesses_avg": [ 151.0, 97.29850975220535 ], "wc_questions_avg": [ 205.25, 232.55039776358157 ], "wc_review_avg": [ 478.75, 203.17649347303936 ], "wc_reply_reviewers_avg": [ 68.25, 71.36657130617948 ], "wc_reply_authors_avg": [ 667.25, 142.9831720867879 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:lqILG4iqw1oJ:scholar.google.com/&scioq=A+Demon+at+Work:+Leveraging+Neuron+Death+for+Efficient+Neural+Network+Pruning&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;1;2", "aff_unique_norm": "Universit\u00e9 de Montr\u00e9al;University of Montreal;Google", "aff_unique_dep": ";;Google DeepMind", "aff_unique_url": 
"https://www.umontreal.ca;https://wwwumontreal.ca;https://deepmind.com", "aff_unique_abbr": "UdeM;UM;DeepMind", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;1", "aff_country_unique": "Canada;United Kingdom" }, { "id": "2wwPG1wpsu", "title": "LST-Bench:A Benchmark for long sequence time-series forecasting Task", "track": "main", "status": "Reject", "tldr": "", "abstract": "This paper introduces LST-Bench, a comprehensive benchmark designed for evaluating long sequence time-series forecasting(LSTF) models. This benchmark has been developed in response to recent advancements in deep learning methods in the field of LSTF tasks. LST-Bench includes Transformer-based, MLP-based, CNN-based, and RNN-based models, evaluating the performance of 11 major forecasting models on a set of commonly used 7 datasets and 7 new datasets that we have introduced. We conduct a thorough analysis of the experimental results, including the overall prediction performance of models and their generalization across different prediction lengths and datasets. Notably, we found that regardless of the model architecture, the phenomenon referred to as \"Degeneracy\" occurs when the model's predictions consistently maintain a low Mean Squared Error value but are characterized by repetitive and simplistic pattern generation, thus losing the meaningfulness of the predictions. Also, the model's optimal performance is very close to its performance after training for just one epoch. These two phenomenons emphasize the need for further investigation. Our LST-Bench will serve as a valuable resource for advancing research in the field of time series forecasting.", "keywords": "Time Series;Deep Learning;Neural Networks;Data Mining", "primary_area": "datasets and benchmarks", "supplementary_material": "", "author": "lanhao li;Haoyi Zhou;Bodan Chen;Siyang Xiao;Jianxin Li", "authorids": "~lanhao_li1;~Haoyi_Zhou1;~Bodan_Chen1;~Siyang_Xiao1;~Jianxin_Li3", "gender": ";M;M;;M", "homepage": "https://scholar.google.com/citations?user=WpeTvLgAAAAJ&hl=zh-CN&oi=ao;https://www.zhouhaoyi.com/;https://github.com/guolalala;;http://myjianxin.github.io", "dblp": ";162/1287;;;l/JianxinLi-2.html", "google_scholar": "WpeTvLgAAAAJ;mbrFlN0AAAAJ;;;EY2lqD0AAAAJ", "orcid": ";0000-0002-2393-3634;;;0000-0001-5152-0055", "linkedin": ";haoyi-zhou-54a7a69a/;;;", "or_profile": "~lanhao_li1;~Haoyi_Zhou1;~Bodan_Chen1;~Siyang_Xiao1;~Jianxin_Li3", "aff": "Beihang University;Beihang University;Beihang University;;Beihang University ", "aff_domain": "buaa.edu.cn;buaa.edu.cn;buaa.edu.cn;;buaa.edu.cn", "position": "PhD student;Assistant Professor;MS student;;Full Professor", "bibtex": "@misc{\nli2024lstbencha,\ntitle={{LST}-Bench:A Benchmark for long sequence time-series forecasting Task},\nauthor={lanhao li and Haoyi Zhou and Bodan Chen and Siyang Xiao and Jianxin Li},\nyear={2024},\nurl={https://openreview.net/forum?id=2wwPG1wpsu}\n}", "github": "", "project": "", "reviewers": "1Wsy;inoa;PPjW;t1kK", "site": "https://openreview.net/forum?id=2wwPG1wpsu", "pdf_size": 1829584, "rating": "1;3;3;3", "confidence": "5;4;4;4", "soundness": "1;2;2;2", "contribution": "1;1;2;2", "presentation": "2;1;3;2", "wc_summary": "149;89;112;88", "wc_strengths": "27;57;46;50", "wc_weaknesses": "74;202;159;47", "wc_questions": "1;26;20;2", "wc_review": "251;374;337;187", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 2.5, 0.8660254037844386 ], 
"confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 1.75, 0.4330127018922193 ], "contribution_avg": [ 1.5, 0.5 ], "presentation_avg": [ 2.0, 0.7071067811865476 ], "wc_summary_avg": [ 109.5, 24.743686063317245 ], "wc_strengths_avg": [ 45.0, 11.113055385446435 ], "wc_weaknesses_avg": [ 120.5, 62.62786919575023 ], "wc_questions_avg": [ 12.25, 10.96300597464035 ], "wc_review_avg": [ 287.25, 73.08342835417616 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 6, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -1.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:0o-2uYpzHrcJ:scholar.google.com/&scioq=LST-Bench:A+Benchmark+for+long+sequence+time-series+forecasting+Task&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "Beihang University", "aff_unique_dep": "", "aff_unique_url": "http://www.buaa.edu.cn/", "aff_unique_abbr": "BUAA", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "China" }, { "id": "2xYO9oxh0y", "title": "DiffSDS: A geometric sequence diffusion model for protein backbone inpainting", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Can a pure transformer learn protein structure under geometric constraints? Recent research has simplified protein structures as sequences of folding angles, making transformers suitable for unconstrained protein backbone generation. Unfortunately, such simplification is unsuitable for the constrained protein inpainting problem: we reveal theoretically that applying geometric constraints to the angle space would result in gradient vanishing or exploding, called \\textbf{GradCurse}. As a remedy, we suggest adding a hidden \\textbf{a}tomic \\textbf{d}irection \\textbf{s}pace (\\textbf{ADS}) layer upon the transformer encoder, converting invariant backbone angles into equivariant direction vectors. Geometric constraints could be efficiently imposed on the direction space while avoiding GradCurse. Meanwhile, a Direct2Seq decoder with mathematical guarantees is also introduced to reconstruct the folding angles. We apply the \\textbf{dual-space} model as the denoising neural network during the conditional diffusion process, resulting in a constrained generative model--\\textbf{DiffSDS}. Extensive experiments show that the proposed DiffSDS outperforms the sequence diffusion baseline, and even achieves competitive results with coordinate diffusion models, filling the gap between sequence and coordinate diffusion models.", "keywords": "Conditional sequence diffusion", "primary_area": "neurosymbolic & hybrid AI systems (physics-informed, logic & formal reasoning, etc.)", "supplementary_material": "/attachment/a228d5f7fa06f769004034b3ad444e586cb60cd4.pdf", "author": "Zhangyang Gao;Cheng Tan;Lirong Wu;Yufei Huang;Bozhen Hu;Stan Z. 
Li", "authorids": "~Zhangyang_Gao1;~Cheng_Tan1;~Lirong_Wu1;~Yufei_Huang4;~Bozhen_Hu1;~Stan_Z._Li2", "gender": "M;M;;M;M;M", "homepage": ";https://chengtan9907.github.io/;;https://2021.igem.org/Team:ZJU-China;;https://en.westlake.edu.cn/academics/School_of_Engineering/About/Our_People/Faculty/201912/t20191206_2497.shtml", "dblp": "275/3266;70/1533-12.html;15/10330;68/1946-2;279/8665;l/StanZLi", "google_scholar": "4SclT-QAAAAJ;6kTV6aMAAAAJ;Tk7TrCoAAAAJ;qmTjdwIAAAAJ;https://scholar.google.com/citations?hl=zh-CN;https://scholar.google.com/citations?hl=zh-CN", "orcid": "0000-0003-1026-6083;;;0009-0007-8184-4529;0000-0002-3428-0114;", "linkedin": ";;;;;stan-z-li-%E6%9D%8E%E5%AD%90%E9%9D%92-55753224/", "or_profile": "~Zhangyang_Gao1;~Cheng_Tan1;~Lirong_Wu1;~Yufei_Huang4;~Bozhen_Hu1;~Stan_Z._Li1", "aff": "Westlake University, China;Zhejiang University & Westlake University;Westlake University;Zhejiang University;Westlake University;Westlake University", "aff_domain": "westlake.edu.cn;westlake.edu.cn;westlake.edu.cn;zju.edu.cn;westlake.edu.cn;westlake.edu.cn", "position": "PhD student;PhD student;PhD student;PhD student;PhD student;Chair Professor", "bibtex": "@misc{\ngao2024diffsds,\ntitle={Diff{SDS}: A geometric sequence diffusion model for protein backbone inpainting},\nauthor={Zhangyang Gao and Cheng Tan and Lirong Wu and Yufei Huang and Bozhen Hu and Stan Z. Li},\nyear={2024},\nurl={https://openreview.net/forum?id=2xYO9oxh0y}\n}", "github": "", "project": "", "reviewers": "qjdQ;9CLX;YgsM", "site": "https://openreview.net/forum?id=2xYO9oxh0y", "pdf_size": 1497240, "rating": "3;3;5", "confidence": "5;3;4", "soundness": "2;3;3", "contribution": "1;2;2", "presentation": "2;3;3", "wc_summary": "38;95;117", "wc_strengths": "49;54;91", "wc_weaknesses": "222;231;156", "wc_questions": "43;86;128", "wc_review": "352;466;492", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 3.6666666666666665, 0.9428090415820634 ], "confidence_avg": [ 4.0, 0.816496580927726 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 1.6666666666666667, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 83.33333333333333, 33.289971796657056 ], "wc_strengths_avg": [ 64.66666666666667, 18.732028424302822 ], "wc_weaknesses_avg": [ 203.0, 33.436506994600975 ], "wc_questions_avg": [ 85.66666666666667, 34.70190516703978 ], "wc_review_avg": [ 436.6666666666667, 60.80204674917522 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 3, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:B3EO7Rd_TzcJ:scholar.google.com/&scioq=DiffSDS:+A+geometric+sequence+diffusion+model+for+protein+backbone+inpainting&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1;0;1;0;0", "aff_unique_norm": "Westlake University;Zhejiang University", "aff_unique_dep": ";", "aff_unique_url": "https://www.westlake.edu.cn;http://www.zju.edu.cn", "aff_unique_abbr": "WU;ZJU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "China" }, { "id": "2y8XnaIiB8", "title": "Vision-Language Dataset Distillation", "track": "main", "status": "Reject", "tldr": "", "abstract": "Dataset distillation methods offer the promise of reducing a 
large-scale dataset down to a significantly smaller set of (potentially synthetic) training examples, which preserve sufficient information for training a new model from scratch. So far, dataset distillation methods have been developed for image classification. However, with the rise in capabilities of vision-language models, and especially given the scale of datasets necessary to train these models, the time is ripe to expand dataset distillation methods beyond image classification. In this work, we take the first steps towards this goal by expanding on the idea of trajectory matching to create a distillation method for vision-language datasets. The key challenge is that vision-language datasets do not have a set of discrete classes. To overcome this, our proposed vision-and-language dataset distillation method jointly distills the images and their corresponding language descriptions in a contrastive formulation. Since there are no existing baselines, we compare our approach to three coreset selection methods (strategic subsampling of the training dataset), which we adapt to the vision-language setting. We demonstrate significant improvements on the challenging Flickr30K and COCO retrieval benchmarks: for example, on Flickr30K the best coreset selection method which selects 1000 image-text pairs for training is able to achieve only 5.6% image-to-text retrieval accuracy (i.e., recall@1); in contrast, our dataset distillation approach almost doubles that to 9.9% with just 100 (an order of magnitude fewer) training pairs.", "keywords": "dataset distillation;dataset condensation;multimodal machine learning;vision-language", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/f2a2ff64d9271fb236fe1b9ce83a3dfb91a5799e.zip", "author": "Xindi Wu;Byron Zhang;Zhiwei Deng;Olga Russakovsky", "authorids": "~Xindi_Wu1;~Byron_Zhang1;~Zhiwei_Deng3;~Olga_Russakovsky1", "gender": "F;M;M;F", "homepage": "https://xindiwu.github.io/;;http://www.zhiweideng.com;http://cs.princeton.edu/~olgarus", "dblp": "235/0784;;160/3578;52/6883", "google_scholar": "hvnUnrUAAAAJ;;tWBPUHwAAAAJ;TB5OwW8AAAAJ", "orcid": ";;;0000-0001-5272-3241", "linkedin": ";byron-zhang/;;", "or_profile": "~Xindi_Wu1;~Byron_Zhang1;~Zhiwei_Deng3;~Olga_Russakovsky1", "aff": "Princeton University;;Google Deepmind;Princeton University", "aff_domain": "cs.princeton.edu;;google.com;princeton.edu", "position": "PhD student;;Research Scientist;Associate Professor", "bibtex": "@misc{\nwu2024visionlanguage,\ntitle={Vision-Language Dataset Distillation},\nauthor={Xindi Wu and Byron Zhang and Zhiwei Deng and Olga Russakovsky},\nyear={2024},\nurl={https://openreview.net/forum?id=2y8XnaIiB8}\n}", "github": "", "project": "", "reviewers": "Evkk;MV4s;tXui;i1Lj", "site": "https://openreview.net/forum?id=2y8XnaIiB8", "pdf_size": 30037120, "rating": "5;5;6;6", "confidence": "5;5;2;4", "soundness": "2;3;4;3", "contribution": "3;3;2;3", "presentation": "3;3;4;4", "wc_summary": "42;40;89;135", "wc_strengths": "20;21;48;120", "wc_weaknesses": "165;56;50;207", "wc_questions": "2;203;46;1", "wc_review": "229;320;233;463", "wc_reply_reviewers": "61;0;0;0", "wc_reply_authors": "1579;1073;336;484", "reply_reviewers": "1;0;0;0", "reply_authors": "3;2;1;1", "rating_avg": [ 5.5, 0.5 ], "confidence_avg": [ 4.0, 1.224744871391589 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.5, 0.5 ], "wc_summary_avg": [ 76.5, 
39.05444917035702 ], "wc_strengths_avg": [ 52.25, 40.69628361410904 ], "wc_weaknesses_avg": [ 119.5, 68.17074152449862 ], "wc_questions_avg": [ 63.0, 82.84624312544292 ], "wc_review_avg": [ 311.25, 94.85877661028525 ], "wc_reply_reviewers_avg": [ 15.25, 26.413774815425377 ], "wc_reply_authors_avg": [ 868.0, 494.47598526116514 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.75, 0.82915619758885 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.8164965809277259, "gs_citation": 9, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=1032649700553466713&as_sdt=5,47&sciodt=0,47&hl=en", "gs_version_total": 4, "aff_unique_index": "0;1;0", "aff_unique_norm": "Princeton University;DeepMind", "aff_unique_dep": ";DeepMind", "aff_unique_url": "https://www.princeton.edu;https://deepmind.com", "aff_unique_abbr": "Princeton;DeepMind", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;0", "aff_country_unique": "United States;United Kingdom" }, { "id": "2yBuTFvXRh", "title": "AMPNet: Attention as Message Passing for Graph Neural Networks", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Graph Neural Networks (GNNs) have emerged as a powerful representation learning framework for graph-structured data. A key limitation of conventional GNNs is their representation of each node with a singular feature vector, potentially overlooking intricate details about individual node features. Here, we propose an Attention-based Message-Passing layer for GNNs (AMPNet) that encodes individual features per node and models feature-level interactions through cross-node attention during message-passing steps. We demonstrate the abilities of AMPNet through extensive benchmarking on real-world biological systems such as fMRI brain activity recordings and spatial genomic data, improving over existing baselines by 20% on fMRI signal reconstruction, and further improving another 8% with positional embedding added. Finally, we validate the ability of AMPNet to uncover meaningful feature-level interactions through case studies on biological systems. 
We anticipate that our architecture will be highly applicable to graph-structured data where node entities encompass rich feature-level information.", "keywords": "Graph Neural Networks;Attention;Message Passing", "primary_area": "learning on graphs and other geometries & topologies", "supplementary_material": "/attachment/46313d1906028a6dcce6a833a5d1dda8c857e325.pdf", "author": "Syed A Rizvi;Nhi Nguyen;Haoran Lyu;Benjamin W Christensen;Josue Ortega Caro;Emanuele Zappala;Maryam Bagherian;Antonio Henrique de Oliveira Fonseca;Christopher Lee Averill;Chadi Abdallah;Zhitao Ying;Maria Brbic;Rahul Madhav Dhodapkar;David van Dijk", "authorids": "~Syed_A_Rizvi1;~Nhi_Nguyen1;~Haoran_Lyu1;~Benjamin_W_Christensen1;~Josue_Ortega_Caro1;~Emanuele_Zappala1;~Maryam_Bagherian1;~Antonio_Henrique_de_Oliveira_Fonseca1;christopher.averill@bcm.edu;~Chadi_Abdallah1;~Zhitao_Ying1;~Maria_Brbic1;~Rahul_Madhav_Dhodapkar1;~David_van_Dijk1", "gender": "M;F;;M;;M;F;M;;M;M;F;M;M", "homepage": "https://syedarizvi.com/;https://www.linkedin.com/in/nhi-nguyen-a427401a9/;;;;https://eazappala.com/;;https://ahof1704.github.io/;;;https://www.cs.yale.edu/homes/ying-rex;https://brbiclab.epfl.ch/;;http://www.vandijklab.org", "dblp": ";;;;;;;;;;209/4936;130/3233;;136/9930", "google_scholar": "2rhnnZ4AAAAJ;;;;;J4OOzEwAAAAJ;;;;HJsH1PEAAAAJ;6fqNXooAAAAJ;ltxmeroAAAAJ;ivfFMbEAAAAJ;fjjZr6UAAAAJ", "orcid": "0000-0002-7932-9524;;;;;;;;;0000-0001-5783-6181;;0000-0002-1120-1778;0000-0002-2014-7515;", "linkedin": "syed-a-rizvi-01/;nhi-nguyen-a427401a9/;;benjwc/;;;maryam-bagherian-93a358ba/;;;;rex-ying-92770148/;;;", "or_profile": "~Syed_A_Rizvi1;~Nhi_Nguyen1;~Haoran_Lyu1;~Benjamin_W_Christensen1;~Josue_Ortega_Caro1;~Emanuele_Zappala1;~Maryam_Bagherian1;~Antonio_Henrique_de_Oliveira_Fonseca1;christopher.averill@bcm.edu;~Chadi_Abdallah1;~Zhitao_Ying1;~Maria_Brbic1;~Rahul_Madhav_Dhodapkar1;~David_van_Dijk1", "aff": "Yale University;New York University;;ETHZ - ETH Zurich;;Idaho State University;Yale University;Yale University;;Baylor College of Medicine;Yale University;EPFL - EPF Lausanne;;Yale University", "aff_domain": "yale.edu;nyu.edu;;ethz.ch;;isu.edu;yale.edu;yale.edu;;bcm.edu;yale.edu;epfl.ch;;yale.edu", "position": "PhD student;PhD student;;MS student;;Assistant Professor;Postdoc;PhD student;;Associate Professor;Assistant Professor;Assistant Professor;;Assistant Professor", "bibtex": "@misc{\nrizvi2024ampnet,\ntitle={{AMPN}et: Attention as Message Passing for Graph Neural Networks},\nauthor={Syed A Rizvi and Nhi Nguyen and Haoran Lyu and Benjamin W Christensen and Josue Ortega Caro and Emanuele Zappala and Maryam Bagherian and Antonio Henrique de Oliveira Fonseca and Christopher Lee Averill and Chadi Abdallah and Zhitao Ying and Maria Brbic and Rahul Madhav Dhodapkar and David van Dijk},\nyear={2024},\nurl={https://openreview.net/forum?id=2yBuTFvXRh}\n}", "github": "", "project": "", "reviewers": "Kcsy;vyBv;QxkE;Jr5A", "site": "https://openreview.net/forum?id=2yBuTFvXRh", "pdf_size": 3026514, "rating": "3;3;3;5", "confidence": "5;4;4;4", "soundness": "2;2;2;2", "contribution": "1;1;2;3", "presentation": "2;3;2;3", "wc_summary": "51;102;106;45", "wc_strengths": "35;25;102;57", "wc_weaknesses": "93;8;138;215", "wc_questions": "73;27;69;3", "wc_review": "252;162;415;320", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 3.5, 0.8660254037844386 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 1.75, 
0.82915619758885 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 76.0, 28.115831839019098 ], "wc_strengths_avg": [ 54.75, 29.634228520412 ], "wc_weaknesses_avg": [ 113.5, 74.92162571647788 ], "wc_questions_avg": [ 43.0, 29.29163703175362 ], "wc_review_avg": [ 287.25, 92.6320004102254 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 14, 0 ], "corr_rating_confidence": -0.3333333333333333, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=7069628564186932802&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 0, "aff_unique_index": "0;1;2;3;0;0;4;0;5;0", "aff_unique_norm": "Yale University;New York University;ETH Zurich;Idaho State University;Baylor College of Medicine;EPFL", "aff_unique_dep": ";;;;;", "aff_unique_url": "https://www.yale.edu;https://www.nyu.edu;https://www.ethz.ch;https://www.isu.edu;https://www.bcm.edu;https://www.epfl.ch", "aff_unique_abbr": "Yale;NYU;ETHZ;ISU;BCM;EPFL", "aff_campus_unique_index": "1", "aff_campus_unique": ";Lausanne", "aff_country_unique_index": "0;0;1;0;0;0;0;0;1;0", "aff_country_unique": "United States;Switzerland" }, { "id": "2zoi9YI21Y", "title": "Towards a Self-Made Model: Zero-Shot Self-Supervised Purification for Adversarial Attacks", "track": "main", "status": "Reject", "tldr": "", "abstract": "Adversarial purification is an adversarial defense method without robustness training for the classifier and regardless of the form of attacks, aiming to remove the adversarial perturbations on the attacked images. Such methods can defend against various unseen threats without modifying the classifier in contrast to empirical defenses. However, previous purification methods require careful training of a strong generative model or incorporating additional knowledge when training a classifier to be comparable to adversarial training. Retraining promising generative models or classifiers on large-scale datasets (e.g., ImageNet) is extremely challenging and computation-consuming. In this work, following the natural image manifold hypothesis, we propose a zero-shot self-supervised method for adversarial purification named \\textit{ZeroPur}: For an adversarial example that lies beyond the natural image manifold, its corrupted embedding vector is first restored so that it is moved close to the natural image manifold. The embedding is then fine-tuned on finer intermediate-level discrepancies to project it back within the manifold. The whole purification process is done from coarse to fine, which does not rely on any generative model and does not require retraining the classifier to incorporate additional knowledge. Extensive experiments on three datasets including CIFAR-10, CIFAR-100, and ImageNet with various classifier architectures including ResNet and WideResNet, demonstrate that our method achieves state-of-the-art robust performance. 
Code released.", "keywords": "adversarial attacks;adversarial defense;adversarial purification", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Xiuli Bi;Zonglin Yang;Bo Liu;Bin Xiao;Weisheng Li;Chi-Man Pun;Pietro Lio", "authorids": "~Xiuli_Bi1;~Zonglin_Yang2;~Bo_Liu23;~Bin_Xiao4;~Weisheng_Li2;~Chi-Man_Pun1;~Pietro_Lio1", "gender": "F;M;M;M;M;;M", "homepage": ";https://github.com/ZhivkoYang;;;http://cs.cqupt.edu.cn;https://cmpun.github.io/;https://www.cst.cam.ac.uk/people/pl219", "dblp": "92/860.html;;;43/5134-2;;p/ChiManPun;l/PietroLio.html", "google_scholar": "https://scholar.google.com/citations?hl=zh-TW;;fXlz210AAAAJ;https://scholar.google.com/citations?hl=zh-TW;;JTkP_EAAAAAJ;https://scholar.google.co.uk/citations?user=3YrWf7EAAAAJ", "orcid": "0000-0003-3134-217X;;0000-0002-3164-6299;0000-0001-8469-5302;;0000-0003-1788-3746;0000-0002-0540-5053", "linkedin": ";;;;;;", "or_profile": "~Xiuli_Bi1;~Zonglin_Yang2;~Bo_Liu23;~Bin_Xiao4;~Weisheng_Li2;~Chi-Man_Pun1;~Pietro_Lio1", "aff": "Chongqing University of Post and Telecommunications;Chongqing University of Post and Telecommunications;Chongqing University of Post and Telecommunications;Chongqing University of Posts and Tel.;Chongqing Post and Communications University;University of Macau;University of Cambridge", "aff_domain": "cqupt.edu.cn;cqupt.edu.cn;cqupt.edu.cn;edu.cn;cqupt.edu.cn;um.edu.mo;cam.ac.uk", "position": "Full Professor;MS student;Associate Professor;Full Professor;Full Professor;Full Professor;Full Professor", "bibtex": "@misc{\nbi2024towards,\ntitle={Towards a Self-Made Model: Zero-Shot Self-Supervised Purification for Adversarial Attacks},\nauthor={Xiuli Bi and Zonglin Yang and Bo Liu and Bin Xiao and Weisheng Li and Chi-Man Pun and Pietro Lio},\nyear={2024},\nurl={https://openreview.net/forum?id=2zoi9YI21Y}\n}", "github": "", "project": "", "reviewers": "tryU;1obD;GavC", "site": "https://openreview.net/forum?id=2zoi9YI21Y", "pdf_size": 3359310, "rating": "3;3;5", "confidence": "4;2;4", "soundness": "2;1;2", "contribution": "2;2;2", "presentation": "3;1;2", "wc_summary": "84;75;108", "wc_strengths": "44;26;76", "wc_weaknesses": "208;443;392", "wc_questions": "27;16;250", "wc_review": "363;560;826", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 3.6666666666666665, 0.9428090415820634 ], "confidence_avg": [ 3.3333333333333335, 0.9428090415820634 ], "soundness_avg": [ 1.6666666666666667, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.0, 0.816496580927726 ], "wc_summary_avg": [ 89.0, 13.92838827718412 ], "wc_strengths_avg": [ 48.666666666666664, 20.677416559027762 ], "wc_weaknesses_avg": [ 347.6666666666667, 100.93011883916955 ], "wc_questions_avg": [ 97.66666666666667, 107.80950277637349 ], "wc_review_avg": [ 583.0, 189.71733359571198 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": 0.5000000000000001, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:dPw7dxhVcs8J:scholar.google.com/&scioq=Towards+a+Self-Made+Model:+Zero-Shot+Self-Supervised+Purification+for+Adversarial+Attacks&hl=en&as_sdt=0,34", "gs_version_total": 0, "aff_unique_index": "0;0;0;1;2;3;4", "aff_unique_norm": "Chongqing University of Post and 
Telecommunications;Chongqing University of Posts and Telecommunications;Chongqing Post and Communications University;University of Macau;University of Cambridge", "aff_unique_dep": ";;;;", "aff_unique_url": "http://www.cqupt.edu.cn;http://www.cqupt.edu.cn/;http://www.cqupt.edu.cn;https://www.um.edu.mo;https://www.cam.ac.uk", "aff_unique_abbr": "CQUPT;CQUPT;CQUPT;UM;Cambridge", "aff_campus_unique_index": "1;2", "aff_campus_unique": ";Macau SAR;Cambridge", "aff_country_unique_index": "0;0;0;0;0;0;1", "aff_country_unique": "China;United Kingdom" }, { "id": "30L0rr9W8A", "title": "LatentCBF: A Control Barrier Function in Latent Space for Safe Control", "track": "main", "status": "Reject", "tldr": "", "abstract": "Safe control is crucial for safety-critical autonomous systems that are deployed in dynamic and uncertain environments. Quadratic-programming-control-barrier-function (QP-CBF) is becoming a popular tool for safe controller synthesis. Traditional QP-CBF relies on explicit knowledge of the system dynamics and access to all states, which are not always available in practice. We propose LatentCBF (LCBF), a control barrier function defined in the latent space, which only needs an agent's observations, not full states. The transformation from observations to latent space is established by a Lipschitz network-based AutoEncoder. In addition, the system dynamics and control barrier functions are all learned in the latent space. We demonstrate the efficiency, safety, and robustness of LCBFs in simulation for quadrotors and cars.", "keywords": "Representation Learning;Reinforcement Learning;Optimal Control;End-to-End Learning;Convex Optimization;Control Barrier Function;Autonomous Driving;CARLA;Robotics", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Somnath Sendhil Kumar;Qin Lin;John Dolan", "authorids": "~Somnath_Sendhil_Kumar1;~Qin_Lin1;~John_Dolan1", "gender": "M;M;M", "homepage": "https://hex-plex.github.io;;https://www.ri.cmu.edu/ri-faculty/john-m-dolan/", "dblp": ";;52/532.html", "google_scholar": ";https://scholar.google.nl/citations?user=-HX_b_0AAAAJ;xLk_w7kAAAAJ", "orcid": ";;", "linkedin": ";;", "or_profile": "~Somnath_Sendhil_Kumar1;~Qin_Lin1;~John_Dolan1", "aff": "Microsoft Research;Cleveland State University;School of Computer Science, Carnegie Mellon University", "aff_domain": "research.microsoft.com;csuohio.edu;cs.cmu.edu", "position": "Researcher;Assistant Professor;Full Professor", "bibtex": "@misc{\nkumar2024latentcbf,\ntitle={Latent{CBF}: A Control Barrier Function in Latent Space for Safe Control},\nauthor={Somnath Sendhil Kumar and Qin Lin and John Dolan},\nyear={2024},\nurl={https://openreview.net/forum?id=30L0rr9W8A}\n}", "github": "", "project": "", "reviewers": "ciJn;5PWg;ERPL;pAha", "site": "https://openreview.net/forum?id=30L0rr9W8A", "pdf_size": 2311052, "rating": "3;3;5;5", "confidence": "4;4;4;4", "soundness": "2;2;2;3", "contribution": "2;2;2;2", "presentation": "3;1;3;4", "wc_summary": "97;110;37;193", "wc_strengths": "29;62;23;62", "wc_weaknesses": "76;277;166;217", "wc_questions": "245;174;74;153", "wc_review": "447;623;300;625", "wc_reply_reviewers": "52;250;139;266", "wc_reply_authors": "863;1159;593;1176", "reply_reviewers": "1;2;2;2", "reply_authors": "2;3;2;2", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.75, 1.0897247358851685 ], "wc_summary_avg": [ 109.25, 55.64339583454626 ], "wc_strengths_avg": [ 
44.0, 18.12456896039186 ], "wc_weaknesses_avg": [ 184.0, 73.69871097922947 ], "wc_questions_avg": [ 161.5, 60.94464701678073 ], "wc_review_avg": [ 498.75, 135.60673840189506 ], "wc_reply_reviewers_avg": [ 176.75, 87.06140074682925 ], "wc_reply_authors_avg": [ 947.75, 239.6636966668085 ], "reply_reviewers_avg": [ 1.75, 0.4330127018922193 ], "reply_authors_avg": [ 2.25, 0.4330127018922193 ], "replies_avg": [ 23, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=2612126896855845512&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 2, "aff_unique_index": "0;1;2", "aff_unique_norm": "Microsoft;Cleveland State University;Carnegie Mellon University", "aff_unique_dep": "Microsoft Research;;School of Computer Science", "aff_unique_url": "https://www.microsoft.com/en-us/research;https://www.csuohio.edu;https://www.cmu.edu", "aff_unique_abbr": "MSR;CSU;CMU", "aff_campus_unique_index": "1", "aff_campus_unique": ";Pittsburgh", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "title": "Separating common from salient patterns with Contrastive Representation Learning", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19533", "id": "30N3bNAiw3", "author_site": "Robin Louiset, Edouard Duchesnay, Grigis Antoine, Pietro Gori", "tldr": "", "abstract": "Contrastive Analysis is a sub-field of Representation Learning that aims at separating 1) salient factors of variation - that only exist in the target dataset (i.e., diseased subjects) in contrast with 2) common factors of variation between target and background (i.e., healthy subjects) datasets. Despite their relevance, current models based on Variational Auto-Encoders have shown poor performance in learning semantically-expressive representations. On the other hand, Contrastive Representation Learning has shown tremendous performance leaps in various applications (classification, clustering, etc.). In this work, we propose to leverage the ability of Contrastive Learning to learn semantically expressive representations when performing Contrastive Analysis. Namely, we reformulate Contrastive Analysis under the lens of the InfoMax Principle and identify two Mutual Information terms to maximize and one to minimize. We decompose the two first terms into an Alignment and a Uniformity term, as commonly done in Contrastive Learning. Then, we motivate a novel Mutual Information minimization strategy to prevent information leakage between common and salient distributions. 
We validate our method on datasets designed to assess the pattern separation capability in Contrastive Analysis, including MNIST superimposed on CIFAR10, CelebA accessories, dSprites item superimposed on a digit grid, and three medical datasets.", "keywords": "Contrastive Learning;Mutual Information;Contrastive Analysis;Disentanglement", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Robin Louiset;Edouard Duchesnay;Antoine Grigis;Pietro Gori", "authorids": "~Robin_Louiset1;~Edouard_Duchesnay1;~Antoine_Grigis1;~Pietro_Gori1", "gender": "M;M;;", "homepage": ";https://duchesnay.github.io/;https://perso.telecom-paristech.fr/pgori/index.html;", "dblp": ";;134/9724;", "google_scholar": "yKGCUNQAAAAJ;https://scholar.google.fr/citations?user=mG6V3q4AAAAJ;https://scholar.google.fr/citations?user=id9wCjsAAAAJ;https://scholar.google.fr/citations?user=nDapWF8AAAAJ", "orcid": ";0000-0002-4073-3490;;", "linkedin": ";edouard-duchesnay-27b47b8;;", "or_profile": "~Robin_Louiset1;~Edouard_Duchesnay1;~Pietro_Gori1;~Grigis_Antoine1", "aff": "CEA;CEA;Telecom Paris;CEA", "aff_domain": "cea.fr;cea.fr;telecom-paris.fr;cea.fr", "position": "PhD student;Full Professor;Associate Professor;Researcher", "bibtex": "@inproceedings{\nlouiset2024separating,\ntitle={Separating common from salient patterns with Contrastive Representation Learning},\nauthor={Robin Louiset and Edouard Duchesnay and Antoine Grigis and Pietro Gori},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=30N3bNAiw3}\n}", "github": "", "project": "", "reviewers": "F95G;4LjD;etAa;fALd;Btev", "pdf_size": 4134629, "rating": "5;8;8;8;8", "confidence": "2;3;4;3;3", "soundness": "3;3;3;4;3", "contribution": "2;3;2;4;3", "presentation": "2;3;3;3;3", "wc_summary": "219;87;55;110;94", "wc_strengths": "135;23;147;163;98", "wc_weaknesses": "175;40;560;115;138", "wc_questions": "103;14;28;60;38", "wc_review": "632;164;790;448;368", "wc_reply_reviewers": "0;0;107;0;0", "wc_reply_authors": "1255;233;2590;903;1549", "reply_reviewers": "0;0;1;0;0", "reply_authors": "7;2;9;4;4", "rating_avg": [ 7.4, 1.2 ], "confidence_avg": [ 3.0, 0.6324555320336759 ], "soundness_avg": [ 3.2, 0.39999999999999997 ], "contribution_avg": [ 2.8, 0.7483314773547882 ], "presentation_avg": [ 2.8, 0.39999999999999997 ], "wc_summary_avg": [ 113.0, 55.939252765835185 ], "wc_strengths_avg": [ 113.2, 49.929550368494205 ], "wc_weaknesses_avg": [ 205.6, 182.61281444630328 ], "wc_questions_avg": [ 48.6, 31.058654188486656 ], "wc_review_avg": [ 480.4, 215.69756605024546 ], "wc_reply_reviewers_avg": [ 21.4, 42.8 ], "wc_reply_authors_avg": [ 1306.0, 777.6945415778614 ], "reply_reviewers_avg": [ 0.2, 0.4000000000000001 ], "reply_authors_avg": [ 5.2, 2.4819347291981715 ], "replies_avg": [ 35, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.7905694150420948, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=8882038361941535553&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 11, "openreview": "https://openreview.net/forum?id=30N3bNAiw3", "pdf": "https://openreview.net/pdf?id=30N3bNAiw3", "email": "cea.fr;cea.fr;telecom-paris.fr;cea.fr", "author_num": 4, "aff_unique_index": "0;0;1;0", "aff_unique_norm": "Commissariat \u00e0 l'\u00c9nergie Atomique et aux \u00c9nergies Alternatives;Telecom Paris", "aff_unique_dep": ";", "aff_unique_url": "https://www.cea.fr;https://www.telecom-paris.fr", 
"aff_unique_abbr": "CEA;Telecom Paris", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "France" }, { "title": "Matrix Manifold Neural Networks++", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19532", "id": "30aSE3FB3L", "author_site": "Xuan Son Nguyen, Yang, Aymeric Histace", "tldr": "", "abstract": "Deep neural networks (DNNs) on Riemannian manifolds have garnered increasing interest in various applied areas. For instance, DNNs on spherical and hyperbolic manifolds have been designed to solve a wide range of computer vision and nature language processing tasks. One of the key factors that contribute to the success of these networks is that spherical and hyperbolic manifolds have the rich algebraic structures of gyrogroups and gyrovector spaces. This enables principled and effective generalizations of the most successful DNNs to these manifolds. Recently, some works have shown that many concepts in the theory of gyrogroups and gyrovector spaces can also be generalized to matrix manifolds such as Symmetric Positive Definite (SPD) and Grassmann manifolds. As a result, some building blocks for SPD and Grassmann neural networks, e.g., isometric models and multinomial logistic regression (MLR) can be derived in a way that is fully analogous to their spherical and hyperbolic counterparts. Building upon these works, in this paper, we design fully-connected (FC) and convolutional layers for SPD neural networks. We also develop MLR on Symmetric Positive Semi-definite (SPSD) manifolds, and propose a method for performing backpropagation with the Grassmann logarithmic map in the projector perspective. We demonstrate the effectiveness of the proposed approach in the human action recognition and node classification tasks.", "keywords": "manifold learning;representation learning;gyrovector spaces;deep learning", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Xuan Son Nguyen;Shuo Yang;Aymeric Histace", "authorids": "~Xuan_Son_Nguyen2;~Shuo_Yang17;~Aymeric_Histace1", "gender": "M;M;M", "homepage": "https://nguyenxuanson10.github.io/;https://syangunique1111.github.io;https://aymeric.histace.free.fr", "dblp": "69/9959;;72/6341", "google_scholar": ";;https://scholar.google.fr/citations?user=y0MU8CAAAAAJ", "orcid": ";0009-0009-5849-1889;", "linkedin": ";shuo-yang-a51b97181/;", "or_profile": "~Xuan_Son_Nguyen2;~Shuo_Yang17;~Aymeric_Histace1", "aff": "Ecole Nationale Sup\u00e9rieure de l'Electronique et de ses Applications;Ecole Nationale Sup\u00e9rieure de l'Electronique et de ses Applications;ETIS", "aff_domain": "ensea.fr;ensea.fr;ensea.fr", "position": "Associate Professor;PhD student;Full Professor", "bibtex": "@inproceedings{\nnguyen2024matrix,\ntitle={Matrix Manifold Neural Networks++},\nauthor={Xuan Son Nguyen and Shuo Yang and Aymeric Histace},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=30aSE3FB3L}\n}", "github": "", "project": "", "reviewers": "2o5X;iDyb;pWPq", "pdf_size": 430741, "rating": "3;6;8", "confidence": "5;4;4", "soundness": "2;3;4", "contribution": "2;2;4", "presentation": "2;3;2", "wc_summary": "51;118;22", "wc_strengths": "30;88;64", "wc_weaknesses": "66;233;106", "wc_questions": "259;77;73", "wc_review": "406;516;265", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "1308;793;322", 
"reply_reviewers": "0;0;0", "reply_authors": "2;1;1", "rating_avg": [ 5.666666666666667, 2.0548046676563256 ], "confidence_avg": [ 4.333333333333333, 0.4714045207910317 ], "soundness_avg": [ 3.0, 0.816496580927726 ], "contribution_avg": [ 2.6666666666666665, 0.9428090415820634 ], "presentation_avg": [ 2.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 63.666666666666664, 40.202266381663385 ], "wc_strengths_avg": [ 60.666666666666664, 23.79542439676633 ], "wc_weaknesses_avg": [ 135.0, 71.19456908126256 ], "wc_questions_avg": [ 136.33333333333334, 86.75380235022683 ], "wc_review_avg": [ 395.6666666666667, 102.73049963645438 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 807.6666666666666, 402.6663907283823 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.3333333333333333, 0.4714045207910317 ], "replies_avg": [ 10, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.9176629354822472, "gs_citation": 7, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=3398805311670412901&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=30aSE3FB3L", "pdf": "https://openreview.net/pdf?id=30aSE3FB3L", "email": "ensea.fr;ensea.fr;ensea.fr", "author_num": 3, "aff_unique_index": "0;0;1", "aff_unique_norm": "Ecole Nationale Sup\u00e9rieure de l'Electronique et de ses Applications;ETIS", "aff_unique_dep": ";", "aff_unique_url": "https://www.enssea.fr;", "aff_unique_abbr": "ENSEA;", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "France;" }, { "title": "Repelling Random Walks", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19531", "id": "31IOmrnoP4", "author_site": "Isaac Reid, Eli Berger, Krzysztof Choromanski, Adrian Weller", "tldr": "", "abstract": "We present a novel quasi-Monte Carlo mechanism to improve graph-based sampling, coined repelling random walks. By inducing correlations between the trajectories of an interacting ensemble such that their marginal transition probabilities are unmodified, we are able to explore the graph more efficiently, improving the concentration of statistical estimators whilst leaving them unbiased. The mechanism has a trivial drop-in implementation. We showcase the effectiveness of repelling random walks in a range of settings including estimation of graph kernels, the PageRank vector and graphlet concentrations. We provide detailed experimental evaluation and robust theoretical guarantees. 
To our knowledge, repelling random walks constitute the first rigorously studied quasi-Monte Carlo scheme correlating the directions of walkers on a graph, inviting new research in this exciting nascent domain.", "keywords": "Graphs;random walkers;quasi-Monte Carlo;kernel;PageRank;graphlets;scalable;mixing", "primary_area": "learning on graphs and other geometries & topologies", "supplementary_material": "", "author": "Isaac Reid;Eli Berger;Krzysztof Marcin Choromanski;Adrian Weller", "authorids": "~Isaac_Reid3;~Eli_Berger1;~Krzysztof_Marcin_Choromanski1;~Adrian_Weller1", "gender": "M;M;;M", "homepage": "https://isaac-reid.github.io;http://math.haifa.ac.il/berger/;;http://mlg.eng.cam.ac.uk/adrian/", "dblp": "287/4898;;78/11411;73/8324", "google_scholar": "3JPyAi0AAAAJ;;;https://scholar.google.co.uk/citations?user=Ek4hM10AAAAJ", "orcid": "0000-0002-1664-1975;;;", "linkedin": ";;;", "or_profile": "~Isaac_Reid3;~Eli_Berger1;~Krzysztof_Marcin_Choromanski1;~Adrian_Weller1", "aff": "University of Cambridge;University of Haifa;Google Brain Robotics & Columbia University;University of Cambridge", "aff_domain": "cam.ac.uk;haifa.ac.il;columbia.edu;cam.ac.uk", "position": "PhD student;Associate Professor;research scientist & adjunct assistant professor;Principal Researcher", "bibtex": "@inproceedings{\nreid2024repelling,\ntitle={Repelling Random Walks},\nauthor={Isaac Reid and Eli Berger and Krzysztof Marcin Choromanski and Adrian Weller},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=31IOmrnoP4}\n}", "github": "", "project": "", "reviewers": "vsCv;KSvf;1jyG", "pdf_size": 620477, "rating": "6;6;6", "confidence": "3;4;4", "soundness": "3;2;3", "contribution": "3;2;2", "presentation": "3;2;3", "wc_summary": "55;67;43", "wc_strengths": "29;46;24", "wc_weaknesses": "13;257;56", "wc_questions": "279;63;47", "wc_review": "376;433;170", "wc_reply_reviewers": "40;484;0", "wc_reply_authors": "571;2075;434", "reply_reviewers": "1;3;0", "reply_authors": "1;5;2", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 55.0, 9.797958971132712 ], "wc_strengths_avg": [ 33.0, 9.41629792788369 ], "wc_weaknesses_avg": [ 108.66666666666667, 106.34639418219855 ], "wc_questions_avg": [ 129.66666666666666, 105.79645026601266 ], "wc_review_avg": [ 326.3333333333333, 112.96705517785065 ], "wc_reply_reviewers_avg": [ 174.66666666666666, 219.3404254172546 ], "wc_reply_authors_avg": [ 1026.6666666666667, 743.3905807552013 ], "reply_reviewers_avg": [ 1.3333333333333333, 1.247219128924647 ], "reply_authors_avg": [ 2.6666666666666665, 1.699673171197595 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 5, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=8497924878712380616&as_sdt=5,47&sciodt=0,47&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=31IOmrnoP4", "pdf": "https://openreview.net/pdf?id=31IOmrnoP4", "email": "cam.ac.uk;haifa.ac.il;columbia.edu;cam.ac.uk", "author_num": 4, "aff_unique_index": "0;1;2;0", "aff_unique_norm": "University of Cambridge;University of Haifa;Google", "aff_unique_dep": ";;Google Brain Robotics", "aff_unique_url": "https://www.cam.ac.uk;https://www.haifa.ac.il;https://ai.google", 
"aff_unique_abbr": "Cambridge;UoH;Google", "aff_campus_unique_index": "0;2;0", "aff_campus_unique": "Cambridge;;Mountain View", "aff_country_unique_index": "0;1;2;0", "aff_country_unique": "United Kingdom;Israel;United States" }, { "id": "324zEJCo3a", "title": "Local Vs. Global Interpretability: A Computational Perspective", "track": "main", "status": "Reject", "tldr": "", "abstract": "The local and global interpretability of various ML models has been studied extensively in recent years. Yet despite significant progress in the field, many of the known results are either informal or lack sufficient mathematical rigor. In this work, we propose a framework based on computational complexity theory to systematically evaluate the local and global interpretability of different ML models. In essence, our framework examines various forms of explanations that can be computed either locally or globally and assesses the computational complexity involved in generating them. We begin by rigorously studying global explanations, and establish: (1) a duality relationship between local and global forms of explanations; and (2) the inherent uniqueness associated with certain global forms of explanations. We then proceed to evaluate the computational complexity associated with these forms of explanations, with a particular emphasis on three model types usually positioned at the extremes of the interpretability spectrum: (1) linear models; (2) decision trees; and (3) neural networks.\nOur findings reveal that, assuming standard complexity assumptions such as P!=NP, computing global explanations is computationally more difficult for linear models than for their local counterparts. Surprisingly, this phenomenon is not universally applicable to decision trees and neural networks: in certain scenarios, computing a global explanation is actually more tractable than computing a local one. We consider these results as compelling evidence of the importance of analyzing ML explainability from a computational complexity perspective, as the means of gaining a deeper understanding of the inherent interpretability of diverse ML models.", "keywords": "interpretability;explainable AI", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Shahaf Bassan;Guy Amir;Guy Katz", "authorids": "~Shahaf_Bassan1;~Guy_Amir1;~Guy_Katz1", "gender": ";M;M", "homepage": ";https://guyam2.github.io/;http://www.katz-lab.com", "dblp": ";277/9596;23/10321", "google_scholar": ";CSJEObYAAAAJ;https://scholar.google.com.tw/citations?user=3nYG5BMAAAAJ", "orcid": ";;", "linkedin": ";https://linkedin.com/in/guy-amir-a335a3ba;", "or_profile": "~Shahaf_Bassan1;~Guy_Amir1;~Guy_Katz1", "aff": ";Cornell University;Hebrew University of Jerusalem", "aff_domain": ";cornell.edu;huji.ac.il", "position": ";Postdoc;Associate Professor", "bibtex": "@misc{\nbassan2024local,\ntitle={Local Vs. 
Global Interpretability: A Computational Perspective},\nauthor={Shahaf Bassan and Guy Amir and Guy Katz},\nyear={2024},\nurl={https://openreview.net/forum?id=324zEJCo3a}\n}", "github": "", "project": "", "reviewers": "D69M;aaJG;RGYJ;qXuS", "site": "https://openreview.net/forum?id=324zEJCo3a", "pdf_size": 424863, "rating": "6;6;6;6", "confidence": "5;1;1;3", "soundness": "3;3;3;3", "contribution": "2;3;3;3", "presentation": "3;4;3;2", "wc_summary": "97;38;87;103", "wc_strengths": "60;42;21;111", "wc_weaknesses": "125;112;41;192", "wc_questions": "150;6;1;85", "wc_review": "432;198;150;491", "wc_reply_reviewers": "44;0;0;0", "wc_reply_authors": "790;533;293;478", "reply_reviewers": "1;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 2.5, 1.6583123951777 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 81.25, 25.616157010761782 ], "wc_strengths_avg": [ 58.5, 33.30540496676178 ], "wc_weaknesses_avg": [ 117.5, 53.59337645642417 ], "wc_questions_avg": [ 60.5, 61.48373768729419 ], "wc_review_avg": [ 317.75, 146.24358960310022 ], "wc_reply_reviewers_avg": [ 11.0, 19.05255888325765 ], "wc_reply_authors_avg": [ 523.5, 177.7027011612373 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:Io_M2wWVXycJ:scholar.google.com/&scioq=Local+Vs.+Global+Interpretability:+A+Computational+Perspective&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1", "aff_unique_norm": "Cornell University;Hebrew University of Jerusalem", "aff_unique_dep": ";", "aff_unique_url": "https://www.cornell.edu;https://www.huji.ac.il", "aff_unique_abbr": "Cornell;HUJI", "aff_campus_unique_index": "1", "aff_campus_unique": ";Jerusalem", "aff_country_unique_index": "0;1", "aff_country_unique": "United States;Israel" }, { "title": "DDMI: Domain-agnostic Latent Diffusion Models for Synthesizing High-Quality Implicit Neural Representations", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19530", "id": "327tbF3S65", "author_site": "Dogyun Park, Sihyeon Kim, Sojin Lee, Hyunwoo Kim", "tldr": "", "abstract": "Recent studies have introduced a new class of generative models for synthesizing implicit neural representations (INRs) that capture arbitrary continuous signals in various domains. These models opened the door for domain-agnostic generative models, but they often fail to achieve high-quality generation. We observed that the existing methods generate the weights of neural networks to parameterize INRs and evaluate the network with fixed positional embeddings (PEs). Arguably, this architecture limits the expressive power of generative models and results in low-quality INR generation. To address this limitation, we propose Domain-agnostic Latent Diffusion Model for INRs (DDMI) that generates adaptive positional embeddings instead of neural networks' weights. Specifically, we develop a Discrete-to-continuous space Variational AutoEncoder (D2C-VAE) that seamlessly connects discrete data and continuous signal functions in the shared latent space. Additionally, we introduce a novel conditioning mechanism for evaluating INRs with the hierarchically decomposed PEs to further enhance expressive power. 
Extensive experiments across four modalities, \\eg, 2D images, 3D shapes, Neural Radiance Fields, and videos, with seven benchmark datasets, demonstrate the versatility of DDMI and its superior performance compared to the existing INR generative models. Code is available at \\href{https://github.com/mlvlab/DDMI}{https://github.com/mlvlab/DDMI}.", "keywords": "Implicit neural representation;generative model;domain agnostic;diffusion model", "primary_area": "generative models", "supplementary_material": "", "author": "Dogyun Park;Sihyeon Kim;Sojin Lee;Hyunwoo J. Kim", "authorids": "~Dogyun_Park2;~Sihyeon_Kim1;~Sojin_Lee1;~Hyunwoo_J._Kim3", "gender": "M;F;F;M", "homepage": "https://dogyunpark.github.io/;;;https://hyunwoojkim.com/publications", "dblp": "323/9575;304/2362;342/6155;150/4259", "google_scholar": "Cgc-2roAAAAJ;;roblxQYAAAAJ;https://scholar.google.co.kr/citations?user=LfBoJt8AAAAJ", "orcid": ";;0000-0001-9198-8437;0000-0002-2181-9264", "linkedin": "dogyunpark/;sihyeon-kim-a91aaa212/;sojin-lee-4b5138262/;", "or_profile": "~Dogyun_Park2;~Sihyeon_Kim1;~Sojin_Lee1;~Hyunwoo_Kim1", "aff": "Korea University;Korea University;Korea University;Korea University", "aff_domain": "korea.ac.kr;korea.ac.kr;korea.ac.kr;korea.ac.kr", "position": "PhD student;PhD student;PhD student;Associate Professor", "bibtex": "@inproceedings{\npark2024ddmi,\ntitle={{DDMI}: Domain-agnostic Latent Diffusion Models for Synthesizing High-Quality Implicit Neural Representations},\nauthor={Dogyun Park and Sihyeon Kim and Sojin Lee and Hyunwoo J. Kim},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=327tbF3S65}\n}", "github": "", "project": "", "reviewers": "9btm;KC2J;qBmp;6uL5", "pdf_size": 29003266, "rating": "6;6;6;6", "confidence": "5;4;3;4", "soundness": "4;3;2;3", "contribution": "3;3;3;2", "presentation": "3;3;3;3", "wc_summary": "82;83;77;171", "wc_strengths": "28;78;56;127", "wc_weaknesses": "243;119;117;291", "wc_questions": "90;188;5;9", "wc_review": "443;468;255;598", "wc_reply_reviewers": "71;237;0;0", "wc_reply_authors": "518;567;605;616", "reply_reviewers": "1;1;0;0", "reply_authors": "2;2;2;2", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 103.25, 39.18146883413127 ], "wc_strengths_avg": [ 72.25, 36.237929024711114 ], "wc_weaknesses_avg": [ 192.5, 76.41171376170017 ], "wc_questions_avg": [ 73.0, 74.55534856735632 ], "wc_review_avg": [ 441.0, 122.45203142455416 ], "wc_reply_reviewers_avg": [ 77.0, 96.81683737862954 ], "wc_reply_authors_avg": [ 576.5, 38.356876828021335 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 2.0, 0.0 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 7, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=2438860377824535516&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=327tbF3S65", "pdf": "https://openreview.net/pdf?id=327tbF3S65", "email": "korea.ac.kr;korea.ac.kr;korea.ac.kr;korea.ac.kr", "author_num": 4, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "Korea University", "aff_unique_dep": "", "aff_unique_url": "https://www.korea.ac.kr", "aff_unique_abbr": "KU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "South Korea" 
}, { "id": "32camXjW25", "title": "Covariance-corrected Whitening Alleviates Network Degeneration on Imbalanced Classification", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Class imbalance is a critical issue in image classification that significantly affects the performance of deep recognition models. In this work, We first identify a network degeneration dilemma that hinders the model learning by introducing a high linear dependence among the features inputted into the classifier. To overcome this challenge, we propose a novel framework called Whitening-Net to mitigate the degenerate solutions, in which ZCA whitening is integrated before the linear classifier to normalize and decorrelate the batch samples. However, in scenarios with extreme class imbalance, the batch covariance statistic exhibits significant fluctuations, impeding the convergence of the whitening operation. Therefore, we propose two covariance-corrected modules, the Group-based Relatively Balanced Batch Sampler (GRBS) and the Batch Embedded Training (BET), to get more accurate and stable batch covariance, thereby reinforcing the capability of whitening. Our modules can be trained end-to-end without incurring substantial computational costs. Comprehensive empirical evaluations conducted on benchmark datasets, including CIFAR-LT-10/100, ImageNet-LT, and iNaturalist-LT, validate the effectiveness of our proposed approaches.", "keywords": "imbalanced classification;neural network;ZCA whitening;sampling", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/075d985c0fd34c578a57df71c77e9023457c74c8.pdf", "author": "Zhiwei Zhang;Hongsheng Li", "authorids": "~Zhiwei_Zhang3;~Hongsheng_Li3", "gender": ";M", "homepage": ";http://www.ee.cuhk.edu.hk/~hsli", "dblp": ";27/7402-1", "google_scholar": ";BN2Ze-QAAAAJ", "orcid": ";", "linkedin": ";", "or_profile": "~Zhiwei_Zhang3;~Hongsheng_Li3", "aff": ";The Chinese University of Hong Kong", "aff_domain": ";cuhk.edu.hk", "position": ";Associate Professor", "bibtex": "@misc{\nanonymous2024covariancecorrected,\ntitle={Covariance-corrected Whitening Alleviates Network Degeneration on Imbalanced Classification},\nauthor={Anonymous},\nyear={2024},\nurl={https://openreview.net/forum?id=32camXjW25}\n}", "github": "", "project": "", "reviewers": "xPQZ;bhjW;piR7;iY3M", "site": "https://openreview.net/forum?id=32camXjW25", "pdf_size": 2226529, "rating": "5;5;6;6", "confidence": "4;2;4;4", "soundness": "2;2;3;3", "contribution": "2;2;3;3", "presentation": "2;2;3;3", "wc_summary": "92;79;91;47", "wc_strengths": "40;7;142;50", "wc_weaknesses": "517;106;228;74", "wc_questions": "14;3;6;52", "wc_review": "663;195;467;223", "wc_reply_reviewers": "19;0;121;127", "wc_reply_authors": "1268;406;1199;440", "reply_reviewers": "1;0;1;2", "reply_authors": "4;2;3;3", "rating_avg": [ 5.5, 0.5 ], "confidence_avg": [ 3.5, 0.8660254037844386 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 77.25, 18.198557635153396 ], "wc_strengths_avg": [ 59.75, 50.08180807438965 ], "wc_weaknesses_avg": [ 231.25, 174.69884802138793 ], "wc_questions_avg": [ 18.75, 19.613452016409553 ], "wc_review_avg": [ 387.0, 191.2694434560837 ], "wc_reply_reviewers_avg": [ 66.75, 57.68177788522126 ], "wc_reply_authors_avg": [ 828.25, 406.1615288281252 ], "reply_reviewers_avg": [ 1.0, 0.7071067811865476 ], "reply_authors_avg": [ 3.0, 0.7071067811865476 ], "replies_avg": [ 
25, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.5773502691896257, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:hBAExJM8MmoJ:scholar.google.com/&scioq=Covariance-corrected+Whitening+Alleviates+Network+Degeneration+on+Imbalanced+Classification&hl=en&as_sdt=0,5", "gs_version_total": 3, "aff_unique_index": "0", "aff_unique_norm": "Chinese University of Hong Kong", "aff_unique_dep": "", "aff_unique_url": "https://www.cuhk.edu.hk", "aff_unique_abbr": "CUHK", "aff_campus_unique_index": "0", "aff_campus_unique": "Hong Kong SAR", "aff_country_unique_index": "0", "aff_country_unique": "China" }, { "id": "331CmSWDjz", "title": "Unsupervised Feature Learning with Emergent Data-Driven Prototypicality", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Given an image set without any labels, our goal is to train a model that maps each image to a point in a feature space such that, not only proximity indicates visual similarity, but where it is located directly encodes how prototypical the image is according to the dataset.\n\nOur key insight is to perform unsupervised feature learning in hyperbolic instead of Euclidean space, where the distance between points still reflects image similarity, and yet we gain additional capacity for representing prototypicality with the location of the point: The closer it is to the origin, the more prototypical it is. The latter property is simply emergent from optimizing the usual metric learning objective: The image similar to many training instances is best placed at the center of corresponding points in Euclidean space, but closer to the origin in hyperbolic space.\n\nWe propose an unsupervised feature learning algorithm in **H**yperbolic space with sphere p**ACK**ing. **HACK** first generates uniformly packed particles in the Poincare ball of hyperbolic space and then assigns each image uniquely to each particle. Images after congealing are regarded more typical of the dataset it belongs to. With our feature mapper simply trained to spread out training instances in hyperbolic space, we observe that images move closer to the origin with congealing, validating our idea of unsupervised prototypicality discovery. We demonstrate that our data-driven prototypicality provides an easy and superior unsupervised instance selection to reduce sample complexity, increase model generalization with atypical instances and robustness with typical ones.", "keywords": "Representation Learning;Hyperbolic Space;Prototypicality;Unsupervised Learning", "primary_area": "visualization or interpretation of learned representations", "supplementary_material": "", "author": "Yunhui Guo;Youren Zhang;Yubei Chen;Stella X. 
Yu", "authorids": "~Yunhui_Guo2;~Youren_Zhang1;~Yubei_Chen1;~Stella_X._Yu2", "gender": "M;M;M;F", "homepage": "https://yunhuiguo.github.io/;;https://redwood.berkeley.edu/people/yubei-chen/;http://www.eecs.umich.edu/~stellayu", "dblp": "165/3105;;30/10064;58/5089", "google_scholar": "BxIXuZYAAAAJ;;WeyLqFUAAAAJ;https://scholar.google.com/citations?hl=en", "orcid": ";;;", "linkedin": ";youren-zhang-92a447251/;yubei-chen-05998a39/;", "or_profile": "~Yunhui_Guo2;~Youren_Zhang1;~Yubei_Chen1;~Stella_Yu2", "aff": "University of Texas at Dallas;University of Michigan - Ann Arbor;University of California, Davis;University of California, Berkeley", "aff_domain": "utdallas.edu;umich.edu;ucdavis.edu;berkeley.edu", "position": "Assistant Professor;MS student;Assistant Professor;Adjunct Professor", "bibtex": "@misc{\nguo2024unsupervised,\ntitle={Unsupervised Feature Learning with Emergent Data-Driven Prototypicality},\nauthor={Yunhui Guo and Youren Zhang and Yubei Chen and Stella X. Yu},\nyear={2024},\nurl={https://openreview.net/forum?id=331CmSWDjz}\n}", "github": "", "project": "", "reviewers": "9yFS;qJ86;PGEd", "site": "https://openreview.net/forum?id=331CmSWDjz", "pdf_size": 50621215, "rating": "3;5;5", "confidence": "4;2;4", "soundness": "2;3;2", "contribution": "3;3;2", "presentation": "2;3;2", "wc_summary": "107;138;61", "wc_strengths": "95;18;24", "wc_weaknesses": "203;70;160", "wc_questions": "178;79;4", "wc_review": "583;305;249", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 4.333333333333333, 0.9428090415820634 ], "confidence_avg": [ 3.3333333333333335, 0.9428090415820634 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 102.0, 31.63331577098213 ], "wc_strengths_avg": [ 45.666666666666664, 34.96982826507572 ], "wc_weaknesses_avg": [ 144.33333333333334, 55.41560149352246 ], "wc_questions_avg": [ 87.0, 71.26008700527947 ], "wc_review_avg": [ 379.0, 146.05021967346255 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 3, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.5, "gs_citation": 4, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=1732935440179672701&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 8, "aff_unique_index": "0;1;2;3", "aff_unique_norm": "University of Texas at Dallas;University of Michigan;University of California, Davis;University of California, Berkeley", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.utdallas.edu;https://www.umich.edu;https://www.ucdavis.edu;https://www.berkeley.edu", "aff_unique_abbr": "UT Dallas;UM;UC Davis;UC Berkeley", "aff_campus_unique_index": "0;1;2;3", "aff_campus_unique": "Dallas;Ann Arbor;Davis;Berkeley", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "id": "33UGifHHfg", "title": "Multi-Task Learning with Hypernetworks and Task Metadata", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Multi-task learning architectures aim to model a set of related tasks simultaneously by sharing parameters across networks to exploit shared knowledge and improve performance. 
Designing multi-task architectures is challenging due to the trade-off between parameter efficiency and the ability to flexibly model task differences at all network layers. We propose a novel multi-task learning architecture called Multi-Task Hypernetworks, which circumvents this trade-off, generating flexible task networks with a minimal number of parameters per task. Our approach uses a hypernetwork to generate different network weights for each task from task-specific embeddings and enable abstract knowledge transfer between tasks. Our approach stands out from existing multi-task learning architectures by providing the added capability to effectively leverage task-level metadata to explicitly learn task relationships and task functions. We show empirically that Multi-Task Hypernetworks outperform many state-of-the-art multi-task learning architectures on small tabular data problems, and leverage metadata more effectively than existing methods.", "keywords": "multi-task learning;hypernetworks;metadata", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/594e6fbc22c188b064c28331c7230e85299882c9.zip", "author": "Olivier Graffeuille;Yun Sing Koh;J\u00f6rg Wicker;Moritz K Lehmann", "authorids": "~Olivier_Graffeuille1;~Yun_Sing_Koh2;~J\u00f6rg_Wicker1;~Moritz_K_Lehmann1", "gender": "M;;;", "homepage": ";https://profiles.auckland.ac.nz/y-koh;https://wicker.nz;https://www.moritzlehmann.org", "dblp": ";23/1879.html;56/3110;", "google_scholar": "TvP8GX0AAAAJ;0L38IrAAAAAJ;https://scholar.google.co.nz/citations?user=_Q11KBoAAAAJ;", "orcid": ";0000-0001-7256-4049;0000-0003-0533-3368;0000-0001-7346-3901", "linkedin": "olivier-graffeuille-b2672a122/;yun-sing-koh-a7ba358/;j%C3%B6rg-wicker-bb197417/;moritzlehmann/", "or_profile": "~Olivier_Graffeuille1;~Yun_Sing_Koh2;~J\u00f6rg_Wicker1;~Moritz_K_Lehmann1", "aff": "University of Auckland;University of Auckland;University of Auckland;University of Waikato", "aff_domain": "auckland.ac.nz;auckland.ac.nz;auckland.ac.nz;waikato.ac.nz", "position": "PhD student;Full Professor;Associate Professor;Adjunct Research Fellow", "bibtex": "@misc{\ngraffeuille2024multitask,\ntitle={Multi-Task Learning with Hypernetworks and Task Metadata},\nauthor={Olivier Graffeuille and Yun Sing Koh and J{\\\"o}rg Wicker and Moritz K Lehmann},\nyear={2024},\nurl={https://openreview.net/forum?id=33UGifHHfg}\n}", "github": "", "project": "", "reviewers": "88C4;RnjU;66Fq;bXYN", "site": "https://openreview.net/forum?id=33UGifHHfg", "pdf_size": 8781379, "rating": "3;3;5;5", "confidence": "4;3;4;4", "soundness": "3;2;2;2", "contribution": "2;2;2;2", "presentation": "3;3;3;4", "wc_summary": "43;72;48;54", "wc_strengths": "17;39;33;55", "wc_weaknesses": "254;138;300;216", "wc_questions": "2;31;46;61", "wc_review": "316;280;427;386", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "226;285;240;181", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 54.25, 10.96300597464035 ], "wc_strengths_avg": [ 36.0, 13.601470508735444 ], "wc_weaknesses_avg": [ 227.0, 59.371710435189584 ], "wc_questions_avg": [ 35.0, 21.805962487356524 ], "wc_review_avg": [ 352.25, 57.57766494049581 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 233.0, 37.1012129181783 ], 
"reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 9, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.5773502691896257, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:leTQgLQ2MKwJ:scholar.google.com/&scioq=Multi-Task+Learning+with+Hypernetworks+and+Task+Metadata&hl=en&as_sdt=0,47", "gs_version_total": 0, "aff_unique_index": "0;0;0;1", "aff_unique_norm": "University of Auckland;University of Waikato", "aff_unique_dep": ";", "aff_unique_url": "https://www.auckland.ac.nz;https://www.waikato.ac.nz", "aff_unique_abbr": "UoA;UoW", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "New Zealand" }, { "title": "Conformal Risk Control", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19529", "id": "33XGfHLtZg", "author_site": "Anastasios Angelopoulos, Stephen Bates, Adam Fisch, Lihua Lei, Tal Schuster", "tldr": "", "abstract": "We extend conformal prediction to control the expected value of any monotone loss function. The algorithm generalizes split conformal prediction together with its coverage guarantee. Like conformal prediction, the conformal risk control procedure is tight up to an $\\mathcal{O}(1/n)$ factor. We also introduce extensions of the idea to distribution shift, quantile risk control, multiple and adversarial risk control, and expectations of U-statistics. Worked examples from computer vision and natural language processing demonstrate the usage of our algorithm to bound the false negative rate, graph distance, and token-level F1-score.", "keywords": "conformal prediction;uncertainty quantification", "primary_area": "probabilistic methods (Bayesian methods, variational inference, sampling, UQ, etc.)", "supplementary_material": "/attachment/0edbe9a906df6f1f354c50be92a440afe03dab24.zip", "author": "Anastasios Nikolas Angelopoulos;Stephen Bates;Adam Fisch;Lihua Lei;Tal Schuster", "authorids": "~Anastasios_Nikolas_Angelopoulos1;~Stephen_Bates1;~Adam_Fisch2;~Lihua_Lei2;~Tal_Schuster1", "gender": "M;;M;Not Specified;", "homepage": "http://angelopoulos.ai;https://stephenbates19.github.io/;https://lihualei71.github.io/;https://people.csail.mit.edu/tals/;https://people.csail.mit.edu/fisch/", "dblp": ";;;190/7491;https://dblp.org/pers/f/Fisch:Adam.html", "google_scholar": "nfX25MMAAAAJ;;https://scholar.google.co.uk/citations?user=-lKb3XwAAAAJ;oo8QRmIAAAAJ;https://scholar.google.com/citations?authorid=LYRkQhMAAAAJ", "orcid": ";0000-0002-3273-8179;;;", "linkedin": "anastasiosa/;;;;", "or_profile": "~Anastasios_Nikolas_Angelopoulos1;~Stephen_Bates1;~Lihua_Lei2;~Tal_Schuster1;~Adam_Fisch1", "aff": "University of California, Berkeley;Massachusetts Institute of Technology;;Google;Massachusetts Institute of Technology", "aff_domain": "berkeley.edu;mit.edu;;google.com;mit.edu", "position": "PhD student;Assistant Professor;;Researcher;PhD student", "bibtex": "@inproceedings{\nangelopoulos2024conformal,\ntitle={Conformal Risk Control},\nauthor={Anastasios Nikolas Angelopoulos and Stephen Bates and Adam Fisch and Lihua Lei and Tal Schuster},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=33XGfHLtZg}\n}", "github": "", "project": "", "reviewers": "fQpV;TBcZ;tJUM;GsY4;pT4W;nYbV", "pdf_size": 1468508, "rating": "6;6;6;8;8;8", "confidence": "3;4;3;4;3;4", "soundness": "3;3;3;4;3;4", "contribution": "3;2;3;4;3;4", "presentation": "3;3;3;4;3;4", 
"wc_summary": "93;45;40;59;75;28", "wc_strengths": "41;36;43;122;160;79", "wc_weaknesses": "151;106;122;540;309;94", "wc_questions": "124;6;155;3;22;18", "wc_review": "409;193;360;724;566;219", "wc_reply_reviewers": "48;15;36;19;192;0", "wc_reply_authors": "733;270;771;726;335;483", "reply_reviewers": "1;1;1;1;1;0", "reply_authors": "1;2;2;1;1;1", "rating_avg": [ 7.0, 1.0 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 3.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 3.1666666666666665, 0.6871842709362768 ], "presentation_avg": [ 3.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 56.666666666666664, 21.974732965132677 ], "wc_strengths_avg": [ 80.16666666666667, 46.53105295272061 ], "wc_weaknesses_avg": [ 220.33333333333334, 159.9777762343535 ], "wc_questions_avg": [ 54.666666666666664, 60.99635690396236 ], "wc_review_avg": [ 411.8333333333333, 186.62923731886767 ], "wc_reply_reviewers_avg": [ 51.666666666666664, 64.59274125025368 ], "wc_reply_authors_avg": [ 553.0, 200.98341556788543 ], "reply_reviewers_avg": [ 0.8333333333333334, 0.37267799624996495 ], "reply_authors_avg": [ 1.3333333333333333, 0.4714045207910317 ], "replies_avg": [ 22, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.33333333333333326, "gs_citation": 155, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14372458069187038582&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=33XGfHLtZg", "pdf": "https://openreview.net/pdf?id=33XGfHLtZg", "email": "berkeley.edu;mit.edu;;google.com;mit.edu", "author_num": 5, "aff_unique_index": "0;1;2;1", "aff_unique_norm": "University of California, Berkeley;Massachusetts Institute of Technology;Google", "aff_unique_dep": ";;Google", "aff_unique_url": "https://www.berkeley.edu;https://web.mit.edu;https://www.google.com", "aff_unique_abbr": "UC Berkeley;MIT;Google", "aff_campus_unique_index": "0;2", "aff_campus_unique": "Berkeley;;Mountain View", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "id": "34QscjTwOc", "title": "Visualizing the Emergence of Primitive Interactions During the Training of DNNs", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Although the learning of deep neural networks (DNNs) is widely believed to be a fitting process without an explicit symbolic structure, previous studies have discovered (Ren et al., 2023a; Li & Zhang, 2023b) and proven (Ren et al., 2023c) that well-trained DNNs usually encode sparse interactions, which can be considered as primitives of the inference. In this study, we redefine the interaction on principal feature components in intermediate-layer features, which significantly simplifies the interaction and enables us to explore the dynamics of interactions throughout the learning of the DNN. Specifically, we visualize how new interactions are gradually learned and how previously learned interactions are gradually forgotten during the training process. 
We categorize all interactions into five distinct groups (reliable, withdrawing, forgetting, betraying, and fluctuating interactions), which provides a novel perspective for understanding the learning process of DNNs.", "keywords": "Visualization;Representation Complexity;Neural Network", "primary_area": "visualization or interpretation of learned representations", "supplementary_material": "", "author": "Jie Ren;Xinhao Zheng;Jiyu Liu;Quanshi Zhang", "authorids": "~Jie_Ren1;~Xinhao_Zheng2;~Jiyu_Liu1;~Quanshi_Zhang1", "gender": "F;M;M;M", "homepage": "https://jie-ren.github.io/;https://github.com/void-zxh;https://github.com/LJY-XCX;http://qszhang.com", "dblp": "r/JieRen-18;;;http://dblp.uni-trier.de/pers/hd/z/Zhang:Quanshi", "google_scholar": "https://scholar.google.com/citations?hl=zh-CN;;;iFFhHK0AAAAJ", "orcid": "0000-0001-9918-3000;;;", "linkedin": ";;;", "or_profile": "~Jie_Ren1;~Xinhao_Zheng2;~Jiyu_Liu1;~Quanshi_Zhang1", "aff": "Shanghai Jiaotong University;Shanghai Jiaotong University;Shanghai Jiaotong University;Shanghai Jiaotong University", "aff_domain": "sjtu.edu.cn;sjtu.edu.cn;sjtu.edu.cn;sjtu.edu.cn", "position": "PhD student;MS student;Undergrad student;Associate Professor", "bibtex": "@misc{\nren2024visualizing,\ntitle={Visualizing the Emergence of Primitive Interactions During the Training of {DNN}s},\nauthor={Jie Ren and Xinhao Zheng and Jiyu Liu and Quanshi Zhang},\nyear={2024},\nurl={https://openreview.net/forum?id=34QscjTwOc}\n}", "github": "", "project": "", "reviewers": "8d78;kGww;UCkY", "site": "https://openreview.net/forum?id=34QscjTwOc", "pdf_size": 19755599, "rating": "3;3;6", "confidence": "4;4;3", "soundness": "2;2;4", "contribution": "2;2;3", "presentation": "3;2;3", "wc_summary": "128;40;132", "wc_strengths": "32;298;197", "wc_weaknesses": "268;438;257", "wc_questions": "208;34;108", "wc_review": "636;810;694", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 4.0, 1.4142135623730951 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.9428090415820634 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 100.0, 42.45782220824175 ], "wc_strengths_avg": [ 175.66666666666666, 109.63677404147853 ], "wc_weaknesses_avg": [ 321.0, 82.85328398239062 ], "wc_questions_avg": [ 116.66666666666667, 71.29905718560067 ], "wc_review_avg": [ 713.3333333333334, 72.33870947762954 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 3, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -1.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:TMrupN3nH0cJ:scholar.google.com/&scioq=Visualizing+the+Emergence+of+Primitive+Interactions+During+the+Training+of+DNNs&hl=en&as_sdt=0,44", "gs_version_total": 0, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "Shanghai Jiao Tong University", "aff_unique_dep": "", "aff_unique_url": "https://www.sjtu.edu.cn", "aff_unique_abbr": "SJTU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "China" }, { "title": "Polynomial Width is Sufficient for Set Representation with High-dimensional Features", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19528", "id": "34STseLBrQ", 
"author_site": "Peihao Wang, Shenghao Yang, Shu Li, Zhangyang Wang, Pan Li", "tldr": "", "abstract": "Set representation has become ubiquitous in deep learning for modeling the inductive bias of neural networks that are insensitive to the input order. DeepSets is the most widely used neural network architecture for set representation. It involves embedding each set element into a latent space with dimension $L$, followed by a sum pooling to obtain a whole-set embedding, and finally mapping the whole-set embedding to the output. In this work, we investigate the impact of the dimension $L$ on the expressive power of DeepSets. Previous analyses either oversimplified high-dimensional features to be one-dimensional features or were limited to complex analytic activations, thereby diverging from practical use or resulting in $L$ that grows exponentially with the set size $N$ and feature dimension $D$. To investigate the minimal value of $L$ that achieves sufficient expressive power, we present two set-element embedding layers: (a) linear + power activation (LP) and (b) linear + exponential activations (LE). We demonstrate that $L$ being $\\operatorname{poly}(N, D)$ is sufficient for set representation using both embedding layers. We also provide a lower bound of $L$ for the LP embedding layer. Furthermore, we extend our results to permutation-equivariant set functions and the complex field.", "keywords": "Set Representation; Permutation Invariance; Permutation Equivariance", "primary_area": "learning on graphs and other geometries & topologies", "supplementary_material": "", "author": "Peihao Wang;Shenghao Yang;Shu Li;Zhangyang Wang;Pan Li", "authorids": "~Peihao_Wang1;~Shenghao_Yang1;~Shu_Li6;~Zhangyang_Wang1;~Pan_Li2", "gender": "M;M;Not Specified;M;", "homepage": "https://peihaowang.github.io/;https://cs.uwaterloo.ca/~s286yang/;https://www.shuli.me/Shu-Li-087d71e8ce9340c5b4f7c08c7babe814;https://vita-group.github.io;", "dblp": "239/4075;41/4482-2;66/6852;119/4026;https://dblp.org/pers/hd/l/Li_0005:Pan", "google_scholar": "fqf2tBsAAAAJ;ocLDM-AAAAAJ;knBDWikAAAAJ;pxFyKAIAAAAJ;IroP0EwAAAAJ", "orcid": ";;;;", "linkedin": "peihao-wang-25a411162/;;;;pan-li-b951105a/", "or_profile": "~Peihao_Wang1;~Shenghao_Yang1;~Shu_Li6;~Zhangyang_Wang1;~Pan_Li2", "aff": "University of Texas, Austin;University of Waterloo;Purdue University;University of Texas at Austin;Purdue University", "aff_domain": "utexas.edu;uwaterloo.ca;purdue.edu;utexas.edu;purdue.edu", "position": "PhD student;PhD student;PhD student;Associate Professor;Assistant Professor", "bibtex": "@inproceedings{\nwang2024polynomial,\ntitle={Polynomial Width is Sufficient for Set Representation with High-dimensional Features},\nauthor={Peihao Wang and Shenghao Yang and Shu Li and Zhangyang Wang and Pan Li},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=34STseLBrQ}\n}", "github": "", "project": "", "reviewers": "XKbR;oY1k;jrmV;a75R", "pdf_size": 10522719, "rating": "5;8;8;8", "confidence": "3;3;3;3", "soundness": "4;4;3;3", "contribution": "3;3;3;3", "presentation": "3;3;2;3", "wc_summary": "964;349;231;31", "wc_strengths": "82;104;278;33", "wc_weaknesses": "502;208;209;166", "wc_questions": "184;1;97;241", "wc_review": "1732;662;815;471", "wc_reply_reviewers": "0;22;0;34", "wc_reply_authors": "815;261;141;535", "reply_reviewers": "0;1;0;1", "reply_authors": "2;1;1;1", "rating_avg": [ 7.25, 1.299038105676658 ], "confidence_avg": [ 3.0, 0.0 ], "soundness_avg": [ 3.5, 
0.5 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 393.75, 348.3040159113874 ], "wc_strengths_avg": [ 124.25, 92.41313488893232 ], "wc_weaknesses_avg": [ 271.25, 134.34912541583589 ], "wc_questions_avg": [ 130.75, 90.78098644540056 ], "wc_review_avg": [ 920.0, 484.38982235385583 ], "wc_reply_reviewers_avg": [ 14.0, 14.628738838327793 ], "wc_reply_authors_avg": [ 438.0, 260.3247971285102 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 6, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=13203073421312026361&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=34STseLBrQ", "pdf": "https://openreview.net/pdf?id=34STseLBrQ", "email": "utexas.edu;uwaterloo.ca;purdue.edu;utexas.edu;purdue.edu", "author_num": 5, "aff_unique_index": "0;1;2;0;2", "aff_unique_norm": "University of Texas at Austin;University of Waterloo;Purdue University", "aff_unique_dep": ";;", "aff_unique_url": "https://www.utexas.edu;https://uwaterloo.ca;https://www.purdue.edu", "aff_unique_abbr": "UT Austin;UW;Purdue", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Austin;", "aff_country_unique_index": "0;1;0;0;0", "aff_country_unique": "United States;Canada" }, { "title": "Beating Price of Anarchy and Gradient Descent without Regret in Potential Games", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19527", "id": "36L7W3ri4U", "author_site": "Iosif Sakos, Stefanos Leonardos, Stelios Stavroulakis, William Overman, Ioannis Panageas, Georgios Piliouras", "tldr": "", "abstract": "Arguably one of the thorniest problems in game theory is that of equilibrium selection. Specifically, in the presence of multiple equilibria do self-interested learning dynamics typically select the socially optimal ones? We study a rich class of continuous-time no-regret dynamics in potential games (PGs). Our class of dynamics, *Q-Replicator Dynamics* (QRD), include gradient descent (GD), log-barrier and replicator dynamics (RD) as special cases. We start by establishing *pointwise convergence* of all QRD to Nash equilibria in almost all PGs. In the case of GD, we show a tight average case performance within a factor of two of optimal, for a class of symmetric $2\\times2$ potential games with unbounded Price of Anarchy (PoA). Despite this positive result, we show that GD is not always the optimal choice even in this restricted setting. Specifically, GD outperforms RD, if and only if *risk-* and *payoff-dominance* equilibria coincide. 
Finally, we experimentally show how these insights extend to all QRD dynamics and that unbounded gaps between average case performance and PoA analysis are common even in larger settings.", "keywords": "q-replicator dynamics;potential games;average price of anarchy;learning", "primary_area": "learning theory", "supplementary_material": "", "author": "Iosif Sakos;Stefanos Leonardos;Stelios Andrew Stavroulakis;William Overman;Ioannis Panageas;Georgios Piliouras", "authorids": "~Iosif_Sakos1;~Stefanos_Leonardos1;~Stelios_Andrew_Stavroulakis1;~William_Overman1;~Ioannis_Panageas1;~Georgios_Piliouras1", "gender": "M;M;;M;;M", "homepage": ";https://stefanosleonardos.com/;https://steliostavroulakis.github.io/;https://panageas.github.io;;https://willoverman.github.io/", "dblp": "271/1082;192/1237;315/4382;139/3829;62/1236;294/4924", "google_scholar": "https://scholar.google.gr/citations?user=69xvSfQAAAAJ;PtiGrVsAAAAJ;PPCdElkAAAAJ;5NiFWuwAAAAJ;;B2XPxEkAAAAJ", "orcid": "0000-0002-1871-9078;;0000-0002-2059-3152;;;", "linkedin": "joseph-sakos-3b3a6a200?lipi=urn%3Ali%3Apage%3Ad_flagship3_profile_view_base_contact_details%3BP9xevRgnRfKhbYYoPyDf3Q%3D%3D;stefanos-leonardos/;https://linkedin.com/in/steliostavroulakis;;;", "or_profile": "~Iosif_Sakos1;~Stefanos_Leonardos1;~Stelios_Andrew_Stavroulakis1;~Ioannis_Panageas1;~Georgios_Piliouras1;~Will_Overman1", "aff": "Singapore University of Technology and Design;King's College London, University of London;University of California, Irvine;Donald Bren School of Information and Computer Sciences, University of California, Irvine;Singapore University of Technology and Design;Stanford University", "aff_domain": "sutd.edu.sg;kcl.ac.uk;uci.edu;ics.uci.edu;sutd.edu.sg;stanford.edu", "position": "PhD student;Lecturer;PhD student;Assistant Professor;Associate Professor;PhD student", "bibtex": "@inproceedings{\nsakos2024beating,\ntitle={Beating Price of Anarchy and Gradient Descent without Regret in Potential Games},\nauthor={Iosif Sakos and Stefanos Leonardos and Stelios Andrew Stavroulakis and William Overman and Ioannis Panageas and Georgios Piliouras},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=36L7W3ri4U}\n}", "github": "", "project": "", "reviewers": "xUnV;ycpS", "pdf_size": 5645636, "rating": "6;8", "confidence": "2;3", "soundness": "4;4", "contribution": "3;3", "presentation": "3;3", "wc_summary": "183;294", "wc_strengths": "52;149", "wc_weaknesses": "49;33", "wc_questions": "253;52", "wc_review": "537;528", "wc_reply_reviewers": "0;0", "wc_reply_authors": "729;562", "reply_reviewers": "0;0", "reply_authors": "1;1", "rating_avg": [ 7.0, 1.0 ], "confidence_avg": [ 2.5, 0.5 ], "soundness_avg": [ 4.0, 0.0 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 238.5, 55.5 ], "wc_strengths_avg": [ 100.5, 48.5 ], "wc_weaknesses_avg": [ 41.0, 8.0 ], "wc_questions_avg": [ 152.5, 100.5 ], "wc_review_avg": [ 532.5, 4.5 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 645.5, 83.5 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 7, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.9999999999999999, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=4530536547724086878&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=36L7W3ri4U", "pdf": "https://openreview.net/pdf?id=36L7W3ri4U", "email": 
"sutd.edu.sg;kcl.ac.uk;uci.edu;ics.uci.edu;sutd.edu.sg;stanford.edu", "author_num": 6, "aff_unique_index": "0;1;2;2;0;3", "aff_unique_norm": "Singapore University of Technology and Design;King's College London;University of California, Irvine;Stanford University", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.sutd.edu.sg;https://www.kcl.ac.uk;https://www.uci.edu;https://www.stanford.edu", "aff_unique_abbr": "SUTD;KCL;UCI;Stanford", "aff_campus_unique_index": "1;1;2", "aff_campus_unique": ";Irvine;Stanford", "aff_country_unique_index": "0;1;2;2;0;2", "aff_country_unique": "Singapore;United Kingdom;United States" }, { "id": "370Bvdd3z7", "title": "EC-Conf: An Ultra-fast Diffusion Model for Molecular Conformation Generation with Equivariant Consistency", "track": "main", "status": "Desk Reject", "tldr": "", "abstract": "Despite recent advancement in 3D molecule conformation generation driven by diffusion models, its high computational cost in iterative diffusion/denoising process limits its application. In this paper, an equivariant consistency model (EC-Conf) was proposed as a fast diffusion method for low-energy conformation generation. In EC-Conf, a modified SE (3)-equivariant transformer model was directly used to encode the Cartesian molecular conformations and a highly efficient consistency diffusion process was carried out to generate molecular conformations. It was demonstrated that, with only one sampling step, it can already achieve comparable quality to other diffusion-based models running with thousands denoising steps. Its performance can be further improved with a few more sampling iterations. The performance of EC-Conf is evaluated on both GEOM-QM9 and GEOM-Drugs sets. Our results demonstrate that the efficiency of EC-Conf for learning the distribution of low energy molecular conformation is at least two magnitudes higher than current SOTA diffusion models and could potentially become a useful tool for conformation generation and sampling. 
In the near future, we will release our code.", "keywords": "fast diffusion model;equivariant consistency;molecule conformation generation", "primary_area": "applications to physical sciences (physics, chemistry, biology, etc.)", "supplementary_material": "/attachment/f686381db6eabba03063ab0b42b7b31d80b416f5.zip", "author": "Zhiguang Fan;Yuedong Yang;Mingyuan Xu;Hongming Chen", "authorids": "~Zhiguang_Fan1;~Yuedong_Yang1;~Mingyuan_Xu1;~Hongming_Chen2", "gender": "M;M;M;M", "homepage": "https://github.com/zhi520/;http://biomed.nscc-gz.cn;;https://github.com/zhi520/EcConf", "dblp": ";98/2972;;", "google_scholar": ";AfjwTKoAAAAJ;NRbE1AoAAAAJ;", "orcid": ";0000-0002-6782-2813;;", "linkedin": ";;;", "or_profile": "~Zhiguang_Fan1;~Yuedong_Yang1;~Mingyuan_Xu1;~Hongming_Chen2", "aff": "SUN YAT-SEN UNIVERSITY;SUN YAT-SEN UNIVERSITY;;", "aff_domain": "sysu.edu.cn;sysu.edu.cn;;", "position": "PhD student;Full Professor;;", "bibtex": "@misc{\nfan2024ecconf,\ntitle={{EC}-Conf: An Ultra-fast Diffusion Model for Molecular Conformation Generation with Equivariant Consistency},\nauthor={Zhiguang Fan and Yuedong Yang and Mingyuan Xu and Hongming Chen},\nyear={2024},\nurl={https://openreview.net/forum?id=370Bvdd3z7}\n}", "github": "", "project": "", "reviewers": "", "site": "https://openreview.net/forum?id=370Bvdd3z7", "pdf_size": 2041176, "rating": "", "confidence": "", "soundness": "", "contribution": "", "presentation": "", "wc_summary": "", "wc_strengths": "", "wc_weaknesses": "", "wc_questions": "", "wc_review": "", "wc_reply_reviewers": "", "wc_reply_authors": "", "reply_reviewers": "", "reply_authors": "", "rating_avg": [ 0, 0 ], "confidence_avg": [ 0, 0 ], "soundness_avg": [ 0, 0 ], "contribution_avg": [ 0, 0 ], "presentation_avg": [ 0, 0 ], "wc_summary_avg": [ 0, 0 ], "wc_strengths_avg": [ 0, 0 ], "wc_weaknesses_avg": [ 0, 0 ], "wc_questions_avg": [ 0, 0 ], "wc_review_avg": [ 0, 0 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 0, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0, "gs_citation": 4, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5808189580291946410&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 16, "aff_unique_index": "0;0", "aff_unique_norm": "Sun Yat-sen University", "aff_unique_dep": "", "aff_unique_url": "http://www.sysu.edu.cn", "aff_unique_abbr": "SYSU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "China" }, { "id": "381QSrWdF2", "title": "Law of Balance and Stationary Distribution of Stochastic Gradient Descent", "track": "main", "status": "Reject", "tldr": "", "abstract": "The stochastic gradient descent (SGD) algorithm is the algorithm we use to train neural networks. However, it remains poorly understood how the SGD navigates the highly nonlinear and degenerate loss landscape of a neural network. In this work, we prove that the minibatch noise of SGD regularizes the solution towards a balanced solution whenever the loss function contains a rescaling symmetry. Because the difference between a simple diffusion process and SGD dynamics is the most significant when symmetries are present, our theory implies that the loss function symmetries constitute an essential probe of how SGD works. We then apply this result to derive the stationary distribution of stochastic gradient flow for a diagonal linear network with arbitrary depth and width. 
The stationary distribution exhibits complicated nonlinear phenomena such as phase transitions, broken ergodicity, and fluctuation inversion. These phenomena are shown to exist uniquely in deep networks, implying a fundamental difference between deep and shallow models.", "keywords": "stochastic gradient descent;stationary distribution;stochastic differential equation;phase transition", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Liu Ziyin;Hongchao Li;Masahito Ueda", "authorids": "~Liu_Ziyin1;~Hongchao_Li2;~Masahito_Ueda1", "gender": ";M;M", "homepage": "https://www.mit.edu/~ziyinl/;https://sites.google.com/view/condmat-hongchaoli;http://cat.phys.s.u-tokyo.ac.jp/index-e.html", "dblp": ";;", "google_scholar": "NpN9oRMAAAAJ;;https://scholar.google.co.jp/citations?user=Xpjx9CwAAAAJ", "orcid": ";;0000-0002-5367-1436", "linkedin": ";;", "or_profile": "~Liu_Ziyin1;~Hongchao_Li2;~Masahito_Ueda1", "aff": "Massachusetts Institute of Technology;;The University of Tokyo", "aff_domain": "mit.edu;;u-tokyo.ac.jp", "position": "Postdoc;;Full Professor", "bibtex": "@misc{\nziyin2024law,\ntitle={Law of Balance and Stationary Distribution of Stochastic Gradient Descent},\nauthor={Liu Ziyin and Hongchao Li and Masahito Ueda},\nyear={2024},\nurl={https://openreview.net/forum?id=381QSrWdF2}\n}", "github": "", "project": "", "reviewers": "8S7u;wHcL;eqby;Y3Mm", "site": "https://openreview.net/forum?id=381QSrWdF2", "pdf_size": 1371746, "rating": "3;5;6;8", "confidence": "4;2;4;3", "soundness": "2;3;4;4", "contribution": "2;2;3;4", "presentation": "2;3;4;4", "wc_summary": "61;33;45;81", "wc_strengths": "56;18;58;82", "wc_weaknesses": "90;45;67;23", "wc_questions": "293;21;3;67", "wc_review": "500;117;173;253", "wc_reply_reviewers": "134;0;0;24", "wc_reply_authors": "2503;515;449;523", "reply_reviewers": "1;0;0;1", "reply_authors": "4;1;1;1", "rating_avg": [ 5.5, 1.8027756377319946 ], "confidence_avg": [ 3.25, 0.82915619758885 ], "soundness_avg": [ 3.25, 0.82915619758885 ], "contribution_avg": [ 2.75, 0.82915619758885 ], "presentation_avg": [ 3.25, 0.82915619758885 ], "wc_summary_avg": [ 55.0, 18.0 ], "wc_strengths_avg": [ 53.5, 22.907422377910613 ], "wc_weaknesses_avg": [ 56.25, 24.933661985356263 ], "wc_questions_avg": [ 96.0, 116.1077086157504 ], "wc_review_avg": [ 260.75, 146.3427056603779 ], "wc_reply_reviewers_avg": [ 39.5, 55.43239125276845 ], "wc_reply_authors_avg": [ 997.5, 869.6750830051417 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.75, 1.299038105676658 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.25087260300212727, "gs_citation": 8, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14809324360039312152&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 3, "aff_unique_index": "0;1", "aff_unique_norm": "Massachusetts Institute of Technology;University of Tokyo", "aff_unique_dep": ";", "aff_unique_url": "https://web.mit.edu;https://www.u-tokyo.ac.jp", "aff_unique_abbr": "MIT;UTokyo", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1", "aff_country_unique": "United States;Japan" }, { "title": "Language Model Self-improvement by Reinforcement Learning Contemplation", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19526", "id": "38E4yUbrgr", "author_site": "Jing-Cheng Pang, Pengyuan Wang, Kaiyuan Li, XiongHui Chen, Jiacheng Xu, Zongzhang Zhang, Yang Yu", "tldr": 
"", "abstract": "Language model self-improvement (LMSI) techniques have recently gained significant attention as they improve language models without requiring external supervision. A common approach is reinforcement learning from AI feedback (RLAIF), which trains a reward model based on AI preference data and employs a reinforcement learning algorithm to train the language model. \nHowever, RLAIF relies on the heuristic assumption that an AI model can provide effective feedback and correct wrong answers, requiring a solid capability of the language model. This paper presents a novel LMSI method, Reinforcement Learning Contemplation (RLC). We disclose that it is simpler for language models to evaluate a sentence than to generate it, even for small language models. Leveraging the gap between the evaluation and generation, RLC evaluates generated answers and updates language model parameters using reinforcement learning to maximize evaluation scores. Through testing on various challenging reasoning tasks and text summarization task, our experiments show that RLC effectively improves language model performance without external supervision, resulting in an answering accuracy increase (from 31.23% to 37.09%) for BigBench-hard reasoning tasks, and a rise in BERTScore for CNN/Daily Mail summarization tasks. Furthermore, RLC can be applied to models of different sizes, showcasing its broad applicability.", "keywords": "Reinforcement learning; language model self-improvement; text evaluation", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/d95b45aacba89101b72096a3248f805ad0e1a028.zip", "author": "Jing-Cheng Pang;Pengyuan Wang;Kaiyuan Li;Xiong-Hui Chen;Jiacheng Xu;Zongzhang Zhang;Yang Yu", "authorids": "~Jing-Cheng_Pang1;~Pengyuan_Wang3;~Kaiyuan_Li2;~Xiong-Hui_Chen1;~Jiacheng_Xu3;~Zongzhang_Zhang1;~Yang_Yu5", "gender": "M;;;M;;M;", "homepage": "https://www.lamda.nju.edu.cn/pangjc;;;http://www.lamda.nju.edu.cn/chenxh/;http://www.lamda.nju.edu.cn/xujc/;http://www.lamda.nju.edu.cn/zhangzz;", "dblp": "254/2679;;;241/7938;188/6025-3;90/8724;", "google_scholar": "R3Y_WrkAAAAJ;;;H5pguCYAAAAJ;;sG7WEAgAAAAJ;", "orcid": ";;;;;;", "linkedin": ";;;;;;", "or_profile": "~Jing-Cheng_Pang1;~Pengyuan_Wang3;~Kaiyuan_Li2;~Xiong-Hui_Chen1;~Jiacheng_Xu3;~Zongzhang_Zhang1;~Yang_Yu5", "aff": "Nanjing University;;;Nanjing University;Nanjing University;Nanjing University;", "aff_domain": "nju.edu.cn;;;nju.edu.cn;nju.edu.cn;nju.edu.cn;", "position": "PhD student;;;PhD student;MS student;Associate Professor;", "bibtex": "@inproceedings{\npang2024language,\ntitle={Language Model Self-improvement by Reinforcement Learning Contemplation},\nauthor={Jing-Cheng Pang and Pengyuan Wang and Kaiyuan Li and Xiong-Hui Chen and Jiacheng Xu and Zongzhang Zhang and Yang Yu},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=38E4yUbrgr}\n}", "github": "", "project": "", "reviewers": "BB78;jzQi;scBc;Rzu4;ksaG", "pdf_size": 1099213, "rating": "3;5;6;8;8", "confidence": "3;4;4;4;3", "soundness": "2;3;3;3;3", "contribution": "2;2;2;3;3", "presentation": "2;4;3;4;3", "wc_summary": "58;62;74;156;145", "wc_strengths": "11;52;37;71;100", "wc_weaknesses": "127;208;47;255;190", "wc_questions": "40;198;104;128;39", "wc_review": "236;520;262;610;474", "wc_reply_reviewers": "0;0;43;185;24", "wc_reply_authors": "863;983;1052;1526;731", "reply_reviewers": "0;0;1;3;1", "reply_authors": "3;3;3;5;2", "rating_avg": [ 6.0, 1.8973665961010275 ], 
"confidence_avg": [ 3.6, 0.4898979485566356 ], "soundness_avg": [ 2.8, 0.39999999999999997 ], "contribution_avg": [ 2.4, 0.4898979485566356 ], "presentation_avg": [ 3.2, 0.7483314773547882 ], "wc_summary_avg": [ 99.0, 42.5205832509386 ], "wc_strengths_avg": [ 54.2, 30.155596495509748 ], "wc_weaknesses_avg": [ 165.4, 72.02943842624347 ], "wc_questions_avg": [ 101.8, 59.51268772287133 ], "wc_review_avg": [ 420.4, 146.857209560852 ], "wc_reply_reviewers_avg": [ 50.4, 69.20866997710618 ], "wc_reply_authors_avg": [ 1031.0, 270.5527674964719 ], "reply_reviewers_avg": [ 1.0, 1.0954451150103321 ], "reply_authors_avg": [ 3.2, 0.9797958971132712 ], "replies_avg": [ 30, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": 0.21516574145596765, "gs_citation": 41, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=8291999413488443176&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=38E4yUbrgr", "pdf": "https://openreview.net/pdf?id=38E4yUbrgr", "email": "nju.edu.cn;;;nju.edu.cn;nju.edu.cn;nju.edu.cn;", "author_num": 7, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "Nanjing University", "aff_unique_dep": "", "aff_unique_url": "https://www.nju.edu.cn", "aff_unique_abbr": "Nanjing U", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "China" }, { "id": "39HaKNXpsu", "title": "Adapt and Diffuse: Sample-adaptive Reconstruction via Latent Diffusion Models", "track": "main", "status": "Reject", "tldr": "", "abstract": "Inverse problems arise in a multitude of applications, where the goal is to recover a clean signal from noisy and possibly (non)linear observations. The difficulty of a reconstruction problem depends on multiple factors, such as the structure of the ground truth signal, the severity of the degradation, the implicit bias of the reconstruction model and the complex interactions between the above factors. This results in natural sample-by-sample variation in the difficulty of a reconstruction task, which is often overlooked by contemporary techniques. Recently, diffusion-based inverse problem solvers have established new state-of-the-art in various reconstruction tasks. Our key observation in this paper is that most existing solvers lack the ability to adapt their compute power to the difficulty of the reconstruction task, resulting in long inference times, subpar performance and wasteful resource allocation. We propose a novel method that we call severity encoding, to estimate the degradation severity of noisy, degraded signals in the latent space of an autoencoder. We show that the estimated severity has strong correlation with the true corruption level and can give useful hints at the difficulty of reconstruction problems on a sample-by-sample basis. Furthermore, we propose a reconstruction method based on latent diffusion models that leverages the predicted degradation severities to fine-tune the reverse diffusion sampling trajectory and thus achieve sample-adaptive inference times. 
We perform numerical experiments on both linear and nonlinear inverse problems and demonstrate that our technique achieves performance comparable to state-of-the-art diffusion-based techniques, with significant improvements in computational efficiency.", "keywords": "inverse problems;diffusion models;image reconstruction;sample-adaptive reconstruction", "primary_area": "generative models", "supplementary_material": "/attachment/bc5b7304cc96bab3acf9bc103f43fdbd46aa5572.zip", "author": "Zalan Fabian;Berk Tinaz;Mahdi Soltanolkotabi", "authorids": "~Zalan_Fabian1;~Berk_Tinaz1;~Mahdi_Soltanolkotabi1", "gender": "M;M;M", "homepage": "https://z-fabian.github.io/;https://berktinaz.github.io/;http://www-bcf.usc.edu/~soltanol/", "dblp": "192/2874;275/8488;75/6691", "google_scholar": "5EKjsXQAAAAJ;gzIzOtAAAAAJ;narJyMAAAAAJ", "orcid": ";;", "linkedin": ";berk-tinaz/;", "or_profile": "~Zalan_Fabian1;~Berk_Tinaz1;~Mahdi_Soltanolkotabi1", "aff": "University of Southern California;Amazon;University of Southern California", "aff_domain": "usc.edu;amazon.com;usc.edu", "position": "Postdoc;Intern;Associate Professor", "bibtex": "@misc{\nfabian2024adapt,\ntitle={Adapt and Diffuse: Sample-adaptive Reconstruction via Latent Diffusion Models},\nauthor={Zalan Fabian and Berk Tinaz and Mahdi Soltanolkotabi},\nyear={2024},\nurl={https://openreview.net/forum?id=39HaKNXpsu}\n}", "github": "", "project": "", "reviewers": "VtJz;Gc37;fcte;Cd1z", "site": "https://openreview.net/forum?id=39HaKNXpsu", "pdf_size": 33178025, "rating": "5;5;6;8", "confidence": "3;4;2;3", "soundness": "2;2;3;3", "contribution": "2;2;2;3", "presentation": "3;2;3;4", "wc_summary": "69;106;151;57", "wc_strengths": "35;9;117;103", "wc_weaknesses": "31;349;120;191", "wc_questions": "26;3;143;84", "wc_review": "161;467;531;435", "wc_reply_reviewers": "24;171;10;13", "wc_reply_authors": "495;995;680;666", "reply_reviewers": "1;1;1;1", "reply_authors": "2;4;2;2", "rating_avg": [ 6.0, 1.224744871391589 ], "confidence_avg": [ 3.0, 0.7071067811865476 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 95.75, 36.656343243700675 ], "wc_strengths_avg": [ 66.0, 45.221676218380054 ], "wc_weaknesses_avg": [ 172.75, 116.48256307276209 ], "wc_questions_avg": [ 64.0, 54.32770932038272 ], "wc_review_avg": [ 398.5, 141.40986528527634 ], "wc_reply_reviewers_avg": [ 54.5, 67.46295279633111 ], "wc_reply_authors_avg": [ 709.0, 180.47298966881442 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 2.5, 0.8660254037844386 ], "replies_avg": [ 21, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.28867513459481287, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=4530409226247603787&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 8, "aff_unique_index": "0;1;0", "aff_unique_norm": "University of Southern California;Amazon", "aff_unique_dep": ";Amazon.com, Inc.", "aff_unique_url": "https://www.usc.edu;https://www.amazon.com", "aff_unique_abbr": "USC;Amazon", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Los Angeles;", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "39VR7gVEJs", "title": "Analyzing Implicit Regularization In Federated Learning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Backward error analysis is a powerful technique that can check how much the path of the gradient flow is modified under the influence of a finite learning rate. 
Through this technique, it is also possible to find an implicit regularizer that affects the convergence behavior of an optimizer. With a backward error analysis, this paper seeks a more intuitive but quantitative way to understand the convergence behaviour under various federated learning algorithms. We prove that the implicit regularizer for FedAvg disperses the gradient of each client from the average gradient, increasing the gradient variance. We then theoretically present that the implicit regularizer of FedAvg hampers the convergence if the variance of gradients from clients decreases following the gradient of the cost function. In order to verify our analysis, we run experiments on FedAvg with and without the drifting term and confirm that FedAvg without the drifting term shows higher test accuracies. Our analysis also explains the convergence behavior of variance reduction methods such as SCAFFOLD, FedDyn, and FedSAM to show that the implicit regularizers of those methods have a smaller or zero drifting effect when the learning rate is small. Especially, we provide a possible reason FedSAM can perform better than FedAvg but might not perform as well as other stable variance reduction methods under data heterogeneity.", "keywords": "federated learning;implicit regularization;backward error analysis;optimization", "primary_area": "optimization", "supplementary_material": "/attachment/7b869b9fa8957c46f777cbba2f0b448dc6a58700.pdf", "author": "Jinwoo Lim;Sangyoon Yu;Suhyun Kim;Soo-Mook Moon", "authorids": "~Jinwoo_Lim1;~Sangyoon_Yu1;~Suhyun_Kim1;~Soo-Mook_Moon1", "gender": "M;M;;M", "homepage": "https://github.com/jinwoolim8180;;https://kdst.tistory.com/;https://altair.snu.ac.kr/smoon/", "dblp": "212/5596;350/3784;45/6898-1;37/4764", "google_scholar": ";RrZWQZUAAAAJ;;", "orcid": ";;;", "linkedin": ";sangyoon-yu-391501225/;;", "or_profile": "~Jinwoo_Lim1;~Sangyoon_Yu1;~Suhyun_Kim1;~Soo-Mook_Moon1", "aff": "Seoul National University;Seoul National University;Korea Institute of Science and Technology;Seoul National University", "aff_domain": "snu.ac.kr;snu.ac.kr;kist.re.kr;snu.ac.kr", "position": "MS student;MS student;Principal Researcher;Full Professor", "bibtex": "@misc{\nlim2024analyzing,\ntitle={Analyzing Implicit Regularization In Federated Learning},\nauthor={Jinwoo Lim and Sangyoon Yu and Suhyun Kim and Soo-Mook Moon},\nyear={2024},\nurl={https://openreview.net/forum?id=39VR7gVEJs}\n}", "github": "", "project": "", "reviewers": "", "site": "https://openreview.net/forum?id=39VR7gVEJs", "pdf_size": 698499, "rating": "", "confidence": "", "soundness": "", "contribution": "", "presentation": "", "wc_summary": "", "wc_strengths": "", "wc_weaknesses": "", "wc_questions": "", "wc_review": "", "wc_reply_reviewers": "", "wc_reply_authors": "", "reply_reviewers": "", "reply_authors": "", "rating_avg": [ 0, 0 ], "confidence_avg": [ 0, 0 ], "soundness_avg": [ 0, 0 ], "contribution_avg": [ 0, 0 ], "presentation_avg": [ 0, 0 ], "wc_summary_avg": [ 0, 0 ], "wc_strengths_avg": [ 0, 0 ], "wc_weaknesses_avg": [ 0, 0 ], "wc_questions_avg": [ 0, 0 ], "wc_review_avg": [ 0, 0 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 0, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:P1OjMWbWBfkJ:scholar.google.com/&scioq=Analyzing+Implicit+Regularization+In+Federated+Learning&hl=en&as_sdt=0,33", "gs_version_total": 
0, "aff_unique_index": "0;0;1;0", "aff_unique_norm": "Seoul National University;Korea Institute of Science and Technology", "aff_unique_dep": ";", "aff_unique_url": "https://www.snu.ac.kr;https://www.kist.re.kr", "aff_unique_abbr": "SNU;KIST", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "South Korea" }, { "title": "Training Unbiased Diffusion Models From Biased Dataset", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19525", "id": "39cPKijBed", "author_site": "Yeongmin Kim, Byeonghu Na, Minsang Park, JoonHo Jang, Dongjun Kim, Wanmo Kang, Il-chul Moon", "tldr": "", "abstract": "With significant advancements in diffusion models, addressing the potential risks of dataset bias becomes increasingly important. Since generated outputs directly suffer from dataset bias, mitigating latent bias becomes a key factor in improving sample quality and proportion. This paper proposes time-dependent importance reweighting to mitigate the bias for the diffusion models. We demonstrate that the time-dependent density ratio becomes more precise than previous approaches, thereby minimizing error propagation in generative learning. While directly applying it to score-matching is intractable, we discover that using the time-dependent density ratio both for reweighting and score correction can lead to a tractable form of the objective function to regenerate the unbiased data density. Furthermore, we theoretically establish a connection with traditional score-matching, and we demonstrate its convergence to an unbiased distribution. The experimental evidence supports the usefulness of the proposed method, which outperforms baselines including time-independent importance reweighting on CIFAR-10, CIFAR-100, FFHQ, and CelebA with various bias settings. 
Our code is available at https://github.com/alsdudrla10/TIW-DSM.", "keywords": "diffusion model;density ratio estimation;dataset bias", "primary_area": "generative models", "supplementary_material": "", "author": "Yeongmin Kim;Byeonghu Na;Minsang Park;JoonHo Jang;Dongjun Kim;Wanmo Kang;Il-chul Moon", "authorids": "~Yeongmin_Kim1;~Byeonghu_Na1;~Minsang_Park1;~JoonHo_Jang1;~Dongjun_Kim1;~Wanmo_Kang1;~Il-chul_Moon1", "gender": "M;M;M;;M;M;", "homepage": "https://sites.google.com/view/yeongmin-space/%ED%99%88;https://sites.google.com/view/byeonghu-na;;https://aailab.kaist.ac.kr/xe2/members_phdstudent/16877;https://sites.google.com/view/dongjun-kim?pli=1;https://sites.google.com/site/wanmokang/;", "dblp": ";276/5100;;241/9686;03/4394;;", "google_scholar": "SBF13JUAAAAJ;https://scholar.google.co.kr/citations?user=mJoqpmEAAAAJ;https://scholar.google.co.kr/citations?user=PhyT2gQAAAAJ;oYbKry4AAAAJ;https://scholar.google.com/citations?hl=ko;;", "orcid": ";0000-0003-3463-2674;;;;;", "linkedin": ";byeonghu-na-17942120b/;;;;;", "or_profile": "~Yeongmin_Kim1;~Byeonghu_Na1;~Minsang_Park1;~JoonHo_Jang1;~Dongjun_Kim1;~Wanmo_Kang1;~Il-chul_Moon1", "aff": "Korea Advanced Institute of Science & Technology;Korea Advanced Institute of Science & Technology;Korea Advanced Institute of Science & Technology;Korea Advanced Institute of Science & Technology;Sony AI;;", "aff_domain": "kaist.ac.kr;kaist.ac.kr;kaist.ac.kr;kaist.ac.kr;sony.com;;", "position": "PhD student;PhD student;MS student;PhD student;Intern;;", "bibtex": "@inproceedings{\nkim2024training,\ntitle={Training Unbiased Diffusion Models From Biased Dataset},\nauthor={Yeongmin Kim and Byeonghu Na and Minsang Park and JoonHo Jang and Dongjun Kim and Wanmo Kang and Il-chul Moon},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=39cPKijBed}\n}", "github": "", "project": "", "reviewers": "WcK7;EYEW;irEP;6Mt9", "pdf_size": 39868109, "rating": "5;5;6;8", "confidence": "3;4;4;4", "soundness": "3;2;3;3", "contribution": "2;2;3;3", "presentation": "3;3;3;4", "wc_summary": "48;58;69;48", "wc_strengths": "93;66;62;134", "wc_weaknesses": "84;321;168;19", "wc_questions": "1;44;11;257", "wc_review": "226;489;310;458", "wc_reply_reviewers": "0;0;84;82", "wc_reply_authors": "604;1321;1434;583", "reply_reviewers": "0;0;1;1", "reply_authors": "4;7;6;4", "rating_avg": [ 6.0, 1.224744871391589 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 55.75, 8.671072598012312 ], "wc_strengths_avg": [ 88.75, 28.71737279069936 ], "wc_weaknesses_avg": [ 148.0, 112.98893751159889 ], "wc_questions_avg": [ 78.25, 104.42072351789179 ], "wc_review_avg": [ 370.75, 107.51598718330219 ], "wc_reply_reviewers_avg": [ 41.5, 41.506023659223246 ], "wc_reply_authors_avg": [ 985.5, 394.10055823355543 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 5.25, 1.299038105676658 ], "replies_avg": [ 31, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": 0.4714045207910316, "gs_citation": 17, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10250792016981496700&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=39cPKijBed", "pdf": "https://openreview.net/pdf?id=39cPKijBed", "email": "kaist.ac.kr;kaist.ac.kr;kaist.ac.kr;kaist.ac.kr;sony.com;;", "author_num": 7, "aff_unique_index": "0;0;0;0;1", 
"aff_unique_norm": "Korea Advanced Institute of Science and Technology;Sony", "aff_unique_dep": ";Sony AI", "aff_unique_url": "https://www.kaist.ac.kr;https://www.sony.com", "aff_unique_abbr": "KAIST;Sony AI", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;1", "aff_country_unique": "South Korea;Japan" }, { "id": "3APJXDoSyS", "title": "The Closer, The Better: Towards Better Representation Learning for Few-Shot Class-Incremental Learning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Aiming to incrementally learn new classes with only few samples while preserving the knowledge of base (old) classes, few-shot class-incremental learning (FSCIL) faces several challenges, such as overfitting and catastrophic forgetting.\nTo bypass the issues, many works have employed a non-parametric classifier: representing each class with the average of features obtained with a fixed feature extractor trained on base classes.\nUnder such formulation, representation learning is critical to tackle the unique challenges of FSCIL: (1) the transferability of the learned representation to new knowledge, (2) the discriminability between all classes, regardless of old or new.\nRecent advances in representation learning, such as contrastive learning, have greatly improved the transferability, which is often attributed to the spread of intra-class features.\nHowever, we observe that solely improving the transferability can harm the discriminability of FSCIL models, as too much spread of features can degrade the quality of the feature-mean class representation. \nUpon the observation and further experimental analysis, we claim that not only we need to increase the intra-class distance, but we also need to decrease the inter-class distance.\nTrying to secure the spread of features and discriminability within a more confined space due to small inter-class distances, the learned representation strikes a good balance between the transferability and discriminability.\nThe strong performance, without any weight update while learning new classes, demonstrates the effective discriminability and transferability of our new representation, founded upon our seemingly counter-intuitive claim: the-Closer-the-Better (CnB).", "keywords": "few-shot learning;incremental learning;representation learing", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "", "author": "Junghun Oh;Sungyong Baik;Kyoung Mu Lee", "authorids": "~Junghun_Oh1;~Sungyong_Baik1;~Kyoung_Mu_Lee2", "gender": "M;M;M", "homepage": ";https://dsybaik-hy.github.io/;https://cv.snu.ac.kr/kmlee/", "dblp": "281/8729;243/2775;17/4029", "google_scholar": "fCFkL9EAAAAJ;lQ4gotkAAAAJ;Hofj9kAAAAAJ", "orcid": ";;", "linkedin": ";;", "or_profile": "~Junghun_Oh1;~Sungyong_Baik1;~Kyoung_Mu_Lee1", "aff": "Seoul National University;Hanyang University;Seoul National University", "aff_domain": "snu.ac.kr;hanyang.ac.kr;snu.ac.kr", "position": "PhD student;Assistant Professor;Full Professor", "bibtex": "@misc{\noh2024the,\ntitle={The Closer, The Better: Towards Better Representation Learning for Few-Shot Class-Incremental Learning},\nauthor={Junghun Oh and Sungyong Baik and Kyoung Mu Lee},\nyear={2024},\nurl={https://openreview.net/forum?id=3APJXDoSyS}\n}", "github": "", "project": "", "reviewers": "JXg4;fd7A;YAmj;h7Ap", "site": "https://openreview.net/forum?id=3APJXDoSyS", "pdf_size": 3460420, "rating": "3;5;5;5", "confidence": "5;4;4;2", "soundness": "3;3;3;2", "contribution": 
"2;3;2;2", "presentation": "3;2;3;3", "wc_summary": "71;100;153;52", "wc_strengths": "43;63;96;25", "wc_weaknesses": "160;83;200;377", "wc_questions": "70;46;114;4", "wc_review": "344;292;563;458", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.5, 0.8660254037844386 ], "confidence_avg": [ 3.75, 1.0897247358851685 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 94.0, 38.11167800031901 ], "wc_strengths_avg": [ 56.75, 26.34743820563965 ], "wc_weaknesses_avg": [ 205.0, 107.84015949543101 ], "wc_questions_avg": [ 58.5, 39.80891859872609 ], "wc_review_avg": [ 414.25, 104.78638986051575 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.6622661785325219, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:7_vC3k1vi54J:scholar.google.com/&scioq=The+Closer,+The+Better:+Towards+Better+Representation+Learning+for+Few-Shot+Class-Incremental+Learning&hl=en&as_sdt=0,44", "gs_version_total": 0, "aff_unique_index": "0;1;0", "aff_unique_norm": "Seoul National University;Hanyang University", "aff_unique_dep": ";", "aff_unique_url": "https://www.snu.ac.kr;https://www.hanyang.ac.kr", "aff_unique_abbr": "SNU;HYU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "South Korea" }, { "id": "3ARfhjGfdF", "title": "Towards Control-Centric Representations in Reinforcement Learning from Images", "track": "main", "status": "Reject", "tldr": "", "abstract": "Image-based Reinforcement Learning is a practical yet challenging task. A major hurdle lies in extracting control-centric representations while disregarding irrelevant information. While approaches that follow the bisimulation principle exhibit the potential in learning state representations to address this issue, they still grapple with the limited expressive capacity of latent dynamics and the inadaptability to sparse reward environments. To address these limitations, we introduce Rebis, which aims to capture control-centric information by integrating reward-free control information alongside reward-specific knowledge. Rebis utilizes a transformer architecture to implicitly model the dynamics and incorporates block-wise masking to eliminate spatiotemporal redundancy. Moreover, Rebis combines bisimulation-based loss with asymmetric reconstruction loss to prevent feature collapse in environments with sparse rewards. 
Empirical studies on two large benchmarks, including Atari games and DeepMind Control Suit, demonstrate that Rebis has superior performance compared to existing methods, proving its effectiveness.", "keywords": "Bisimulation;Reinforcement Learning", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/d1147544da9ccd27c7350c8730e01c1b33d3a073.zip", "author": "Chen Liu;Hongyu Zang;Xin Li;Yong Heng;Yifei Wang;Zhen Fang;Yisen Wang;Mingzhong Wang", "authorids": "~Chen_Liu16;~Hongyu_Zang1;~Xin_Li31;~Yong_Heng1;~Yifei_Wang1;~Zhen_Fang5;~Yisen_Wang1;~Mingzhong_Wang2", "gender": "F;M;F;M;M;M;M;M", "homepage": "https://github.com/LC990512;https://zanghyu.github.io/;https://cs.bit.edu.cn/szdw/jsml/js/lixin/index.htm;;https://yifeiwang77.com;https://github.com/Lucien-Evans-123;https://yisenwang.github.io/;https://www.usc.edu.au/staff/dr-mingzhong-wang", "dblp": ";212/2592.html;09/1365-33.html;https://dblp.uni-trier.de/pid/333/0444;00/555-1;;172/1346-1;12/5272", "google_scholar": ";2kmSy50AAAAJ;https://scholar.google.com/citations?hl=zh-TW;;-CLy6YsAAAAJ;;uMWPDboAAAAJ;Jj30mIUAAAAJ", "orcid": ";;0000-0003-4257-4347;0000-0002-1721-9995;;;;0000-0002-6533-8104", "linkedin": ";;;;;;;", "or_profile": "~Chen_Liu16;~Hongyu_Zang1;~Xin_Li31;~Yong_Heng1;~Yifei_Wang1;~Zhen_Fang5;~Yisen_Wang1;~Mingzhong_Wang2", "aff": "Beijing Institute of Technology;Meituan;Beijing Institute of Technology;;Massachusetts Institute of Technology;Beijing Institute of Technology;Peking University;University of the Sunshine Coast", "aff_domain": "bit.edu.cn;meituan.com;bit.edu.cn;;mit.edu;bit.edu.cn;pku.edu.cn;usc.edu.au", "position": "MS student;Researcher;Associate Professor;;Postdoc;MS student;Assistant Professor;Assistant Professor", "bibtex": "@misc{\nliu2024towards,\ntitle={Towards Control-Centric Representations in Reinforcement Learning from Images},\nauthor={Chen Liu and Hongyu Zang and Xin Li and Yong Heng and Yifei Wang and Zhen Fang and Yisen Wang and Mingzhong Wang},\nyear={2024},\nurl={https://openreview.net/forum?id=3ARfhjGfdF}\n}", "github": "", "project": "", "reviewers": "hpbt;sEtP;6U7G;TC9E", "site": "https://openreview.net/forum?id=3ARfhjGfdF", "pdf_size": 972714, "rating": "3;5;6;8", "confidence": "5;3;4;4", "soundness": "3;2;3;4", "contribution": "2;2;3;3", "presentation": "3;2;4;3", "wc_summary": "63;51;103;76", "wc_strengths": "66;34;98;69", "wc_weaknesses": "362;74;111;62", "wc_questions": "33;170;39;22", "wc_review": "524;329;351;229", "wc_reply_reviewers": "342;85;45;0", "wc_reply_authors": "2346;1894;980;500", "reply_reviewers": "1;1;1;0", "reply_authors": "5;3;2;1", "rating_avg": [ 5.5, 1.8027756377319946 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 73.25, 19.3180614969515 ], "wc_strengths_avg": [ 66.75, 22.664675157610354 ], "wc_weaknesses_avg": [ 152.25, 122.43850497290467 ], "wc_questions_avg": [ 66.0, 60.35312750802563 ], "wc_review_avg": [ 358.25, 106.16820380886172 ], "wc_reply_reviewers_avg": [ 118.0, 132.7761273723556 ], "wc_reply_authors_avg": [ 1430.0, 728.3117464382955 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 2.75, 1.479019945774904 ], "replies_avg": [ 22, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": -0.39223227027636803, "gs_citation": 0, "gs_cited_by_link": 
"https://scholar.google.com/scholar?q=related:9xBPJ_cmW7gJ:scholar.google.com/&scioq=Towards+Control-Centric+Representations+in+Reinforcement+Learning+from+Images&hl=en&as_sdt=0,44", "gs_version_total": 7, "aff_unique_index": "0;1;0;2;0;3;4", "aff_unique_norm": "Beijing Institute of Technology;Meituan;Massachusetts Institute of Technology;Peking University;University of the Sunshine Coast", "aff_unique_dep": ";;;;", "aff_unique_url": "http://www.bit.edu.cn/;https://www.meituan.com;https://web.mit.edu;http://www.pku.edu.cn;https://www.usc.edu.au", "aff_unique_abbr": "BIT;Meituan;MIT;Peking U;USC", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;1;0;0;2", "aff_country_unique": "China;United States;Australia" }, { "id": "3ARp595Ucc", "title": "Beyond Joint Demonstrations: Personalized Expert Guidance for Efficient Multi-Agent Reinforcement Learning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Multi-Agent Reinforcement Learning (MARL) algorithms face the challenge of efficient exploration due to the exponential increase in the size of the joint state-action space. While demonstration-guided learning has proven beneficial in single-agent settings, its direct applicability to MARL is hindered by the practical difficulty of obtaining joint expert demonstrations.\nIn this work, we introduce a novel concept of personalized expert demonstrations that an agent-specific expert provides. These demonstrations are tailored for an individual agent or, more broadly, for an individual type of agent in a heterogeneous team. It is crucial to emphasize that these demonstrations solely pertain to single-agent behaviors and do not encompass any cooperative elements. Consequently, it is essential to note that these demonstrations may not be inherently optimal when employed within a cooperative setting.\nTo bootstrap the learning from the personalized expert demonstrations, we reformulate the MARL problem in occupancy measure space and propose two innovative algorithms, namely expert-guided MARL (EG-MARL) and Generalized EG-MARL (GEG-MARL). These algorithms involve the acquisition of personalized reward signals through demonstrations to guide agent exploration and the fostering of collaborative behaviors through environmental reward feedbacks.\nOur proposed algorithms are evaluated across both discrete and continuous environments. 
The results underscore the capacity of our methods to learn near-optimal policies even when provided with suboptimal demonstrations, and they excel in solving coordinated tasks that challenge state-of-the-art MARL algorithms.", "keywords": "Multi-agent Reinforcement Learning;Learning from Demonstration;Actor-Critic", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/45330b371de6c68e13d663a4537e6d921738db5f.zip", "author": "Peihong Yu;Amrit Bedi;Alec Koppel;Carl Busart;Priya Narayan;Dinesh Manocha;Pratap Tokekar", "authorids": "~Peihong_Yu1;~Amrit_Bedi1;~Alec_Koppel1;carl.e.busart.civ@army.mil;~Priya_Narayan1;~Dinesh_Manocha3;~Pratap_Tokekar1", "gender": "F;M;M;;;M;M", "homepage": "https://peihongyu.com/;https://sites.google.com/view/amritsinghbedi/home;http://koppel.netlify.app/;;https://scholar.google.com/citations?user=Za8YrUsAAAAJ&hl=en;https://www.cs.umd.edu/people/dmanocha;https://tokekar.com/", "dblp": "201/8446;176/2707.html;149/0076;;;m/DineshManocha;", "google_scholar": "rzUHzRgAAAAJ;91WLA6QAAAAJ;8ClxyjIAAAAJ;;;X08l_4IAAAAJ;FKAovywAAAAJ", "orcid": ";;0000-0003-2447-2873;;;0000-0001-7047-9801;", "linkedin": ";;alec-koppel-9860b697/;;;dinesh-manocha-2311846;prataptokekar/", "or_profile": "~Peihong_Yu1;~Amrit_Bedi1;~Alec_Koppel1;carl.e.busart.civ@army.mil;~Priya_Narayan1;~Dinesh_Manocha3;~Pratap_Tokekar1", "aff": "University of Maryland, College Park;University of Maryland, College Park;J.P. Morgan Chase;;;University of Maryland, College Park;University of Maryland, College Park", "aff_domain": "umd.edu;umd.edu;jpmorgan.com;;;umd.edu;umd.edu", "position": "PhD student;Researcher;Research Team Lead;;;Professor;Associate Professor", "bibtex": "@misc{\nyu2024beyond,\ntitle={Beyond Joint Demonstrations: Personalized Expert Guidance for Efficient Multi-Agent Reinforcement Learning},\nauthor={Peihong Yu and Amrit Bedi and Alec Koppel and Carl Busart and Priya Narayan and Dinesh Manocha and Pratap Tokekar},\nyear={2024},\nurl={https://openreview.net/forum?id=3ARp595Ucc}\n}", "github": "", "project": "", "reviewers": "oHLh;C51y;eCAT;G5rt", "site": "https://openreview.net/forum?id=3ARp595Ucc", "pdf_size": 8786283, "rating": "3;3;3;6", "confidence": "3;4;4;3", "soundness": "2;1;1;3", "contribution": "2;2;1;3", "presentation": "3;2;2;3", "wc_summary": "71;63;93;89", "wc_strengths": "26;60;29;58", "wc_weaknesses": "265;51;210;134", "wc_questions": "71;113;58;54", "wc_review": "433;287;390;335", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "22;22;22;22", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 3.75, 1.299038105676658 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 1.75, 0.82915619758885 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 79.0, 12.409673645990857 ], "wc_strengths_avg": [ 43.25, 15.801503093060482 ], "wc_weaknesses_avg": [ 165.0, 80.59466483583141 ], "wc_questions_avg": [ 74.0, 23.37733945512192 ], "wc_review_avg": [ 361.25, 55.17415608779168 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 22.0, 0.0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 8, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=2428337089863033995&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "aff_unique_index": "0;0;1;0;0", "aff_unique_norm": "University of Maryland;JPMorgan Chase & Co.", "aff_unique_dep": 
";", "aff_unique_url": "https://www/umd.edu;https://www.jpmorganchase.com", "aff_unique_abbr": "UMD;JPM", "aff_campus_unique_index": "0;0;0;0", "aff_campus_unique": "College Park;", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "3BUhO4ISkJ", "title": "InstructEdit: Improving Automatic Masks for Diffusion-based Image Editing With User Instructions", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Recent works have explored text-guided image editing using diffusion models and generated edited images based on text prompts. However, the models struggle to accurately locate the regions to be edited and faithfully perform precise edits. In this work, we propose a framework termed InstructEdit that can do fine-grained editing based on user instructions. Our proposed framework has three components: language processor, segmenter, and image editor. The first component, the language processor, processes the user instruction using a large language model. The goal of this processing is to parse the user instruction and output prompts for the segmenter and captions for the image editor. We adopt ChatGPT and optionally BLIP2 for this step. The second component, the segmenter, uses the segmentation prompt provided by the language processor. We employ a state-of-the-art segmentation framework Grounded Segment Anything to automatically generate a high-quality mask based on the segmentation prompt. The third component, the image editor, uses the captions from the language processor and the masks from the segmenter to compute the edited image. We adopt Stable Diffusion and the mask-guided generation from DiffEdit for this purpose. What are the main achievements, outcomes, results? Experiments show that our method outperforms previous editing methods in fine-grained editing applications where the input image contains a complex object or multiple objects. We improve the mask quality over DiffEdit and thus improve the quality of edited images. 
We also show that our framework can accept multiple forms of user instructions as input.", "keywords": "Text-guided image editing;Language models;Diffusion models", "primary_area": "generative models", "supplementary_material": "/attachment/7862385af9e77b777f4cac4ee55b6cc22640d5eb.zip", "author": "Qian Wang;Biao Zhang;Michael Birsak;Peter Wonka", "authorids": "~Qian_Wang19;~Biao_Zhang5;~Michael_Birsak1;~Peter_Wonka1", "gender": "F;;M;M", "homepage": "https://qianwangx.github.io/;https://1zb.github.io;;http://peterwonka.net", "dblp": ";83/3266-5;147/4629;98/5522", "google_scholar": ";h5KukxEAAAAJ;GF0RLAwAAAAJ;https://scholar.google.com.tw/citations?user=0EKXSXgAAAAJ", "orcid": ";;;0000-0003-0627-9746", "linkedin": ";;michael-birsak;", "or_profile": "~Qian_Wang19;~Biao_Zhang5;~Michael_Birsak1;~Peter_Wonka1", "aff": "King Abdullah University of Science and Technology;KAUST;King Abdullah University of Science and Technology;KAUST", "aff_domain": "kaust.edu.sa;kaust.edu.sa;kaust.edu.sa;kaust.edu.sa", "position": "PhD student;Postdoc;Researcher;Full Professor", "bibtex": "@misc{\nwang2024instructedit,\ntitle={InstructEdit: Improving Automatic Masks for Diffusion-based Image Editing With User Instructions},\nauthor={Qian Wang and Biao Zhang and Michael Birsak and Peter Wonka},\nyear={2024},\nurl={https://openreview.net/forum?id=3BUhO4ISkJ}\n}", "github": "", "project": "", "reviewers": "YLK1;6zrz;pqYf;PLFP", "site": "https://openreview.net/forum?id=3BUhO4ISkJ", "pdf_size": 12686786, "rating": "3;3;3;6", "confidence": "4;4;4;4", "soundness": "2;2;3;3", "contribution": "1;2;2;2", "presentation": "2;3;3;3", "wc_summary": "56;37;109;176", "wc_strengths": "63;27;150;72", "wc_weaknesses": "346;135;227;184", "wc_questions": "134;2;120;18", "wc_review": "599;201;606;450", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 3.75, 1.299038105676658 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 94.5, 53.94673298727181 ], "wc_strengths_avg": [ 78.0, 44.84974916317816 ], "wc_weaknesses_avg": [ 223.0, 78.1184997295775 ], "wc_questions_avg": [ 68.5, 58.98092912119984 ], "wc_review_avg": [ 464.0, 164.12952202452794 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 35, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10130802581700303433&as_sdt=80000005&sciodt=0,23&hl=en", "gs_version_total": 6, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "King Abdullah University of Science and Technology", "aff_unique_dep": "", "aff_unique_url": "https://www.kast.kau.edu.sa", "aff_unique_abbr": "KAUST", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "Saudi Arabia" }, { "id": "3CGpIeU212", "title": "Are training trajectories of deep single-spike and deep ReLU network equivalent?", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Communication by binary and sparse spikes is a key factor for the energy efficiency of biological brains. 
However, training deep spiking neural networks (SNNs) with backpropagation is harder than with artificial neural networks (ANNs), which is puzzling given that recent theoretical results provide exact mapping algorithms from ReLU to time-to-first-spike (TTFS) SNNs. Building upon these results, we analyze in theory and in simulation the learning dynamics of TTFS-SNNs. Our analysis highlights that even when an SNN can be mapped exactly to a ReLU network, it cannot always be robustly trained by gradient descent. The reason for that is the emergence of a specific instance of the vanishing-and-exploding gradient problem leading to a bias in the gradient descent trajectory in comparison with the equivalent ANN. After identifying this issue we derive a generic solution for the network initialization and SNN parameterization which guarantees that the SNN can be trained as robustly as its ANN counterpart. Our theoretical findings are illustrated in practice on image classification datasets. Our method achieves the same accuracy as deep ConvNets on CIFAR10 and enables fine-tuning on the much larger PLACES365 dataset without loss of accuracy compared to the ANN. We argue that the combined perspective of conversion and fine-tuning with robust gradient descent in SNN will be decisive to optimize SNNs for hardware implementations needing low latency and resilience to noise and quantization.", "keywords": "deep spiking neural network training;time-to-first-spike;vanishing gradient problem;ReLU network;network initialization", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Ana Stanojevic;Stanis\u0142aw Wo\u017aniak;Guillaume Bellec;Giovanni Cherubini;Angeliki Pantazi;Wulfram Gerstner", "authorids": "~Ana_Stanojevic1;~Stanis\u0142aw_Wo\u017aniak1;~Guillaume_Bellec1;~Giovanni_Cherubini2;~Angeliki_Pantazi1;~Wulfram_Gerstner1", "gender": "F;M;M;M;F;", "homepage": ";;https://guillaumebellec.github.io;https://researcher.watson.ibm.com/researcher/view.php?person=zurich-cbi;https://research.ibm.com/people/angeliki-pantazi;https://lcnwww.epfl.ch/gerstner/", "dblp": "262/5987.html;173/2997;;07/5927;83/1243;g/WGerstner", "google_scholar": "3DNfrZYAAAAJ;axP7kosAAAAJ;fSXUVvAAAAAJ;J6NdeI4AAAAJ;https://scholar.google.ch/citations?user=BEMNIoQAAAAJ;https://scholar.google.ch/citations?user=vSd2RnEAAAAJ", "orcid": ";;0000-0001-7568-4994;0000-0002-0573-2919;0000-0003-4720-4038;0000-0002-4344-2189", "linkedin": "ana--stanojevic/;;;giovanni-cherubini-a379b29/;;", "or_profile": "~Ana_Stanojevic1;~Stanis\u0142aw_Wo\u017aniak1;~Guillaume_Bellec1;~Giovanni_Cherubini2;~Angeliki_Pantazi1;~Wulfram_Gerstner1", "aff": ";IBM Research;Swiss Federal Institute of Technology Lausanne;International Business Machines;International Business Machines;EPFL - EPF Lausanne", "aff_domain": ";ibm.com;epfl.ch;ibm.com;ibm.com;epfl.ch", "position": ";Researcher;Postdoc;Researcher;Principal Researcher;Full Professor", "bibtex": "@misc{\nstanojevic2024are,\ntitle={Are training trajectories of deep single-spike and deep Re{LU} network equivalent?},\nauthor={Ana Stanojevic and Stanis{\\l}aw Wo{\\'z}niak and Guillaume Bellec and Giovanni Cherubini and Angeliki Pantazi and Wulfram Gerstner},\nyear={2024},\nurl={https://openreview.net/forum?id=3CGpIeU212}\n}", "github": "", "project": "", "reviewers": "", "site": "https://openreview.net/forum?id=3CGpIeU212", "pdf_size": 0, "rating": "", "confidence": "", "soundness": "", "contribution": "", "presentation": "", "wc_summary": "", "wc_strengths": 
"", "wc_weaknesses": "", "wc_questions": "", "wc_review": "", "wc_reply_reviewers": "", "wc_reply_authors": "", "reply_reviewers": "", "reply_authors": "", "rating_avg": [ 0, 0 ], "confidence_avg": [ 0, 0 ], "soundness_avg": [ 0, 0 ], "contribution_avg": [ 0, 0 ], "presentation_avg": [ 0, 0 ], "wc_summary_avg": [ 0, 0 ], "wc_strengths_avg": [ 0, 0 ], "wc_weaknesses_avg": [ 0, 0 ], "wc_questions_avg": [ 0, 0 ], "wc_review_avg": [ 0, 0 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 0, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0, "gs_citation": 4, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10709245391331482397&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 2, "aff_unique_index": "0;1;2;2;3", "aff_unique_norm": "IBM;Swiss Federal Institute of Technology Lausanne;International Business Machines Corporation;EPFL", "aff_unique_dep": "IBM Research;;;", "aff_unique_url": "https://www.ibm.com/research;https://www.epfl.ch;https://www.ibm.com;https://www.epfl.ch", "aff_unique_abbr": "IBM;EPFL;IBM;EPFL", "aff_campus_unique_index": "1;1", "aff_campus_unique": ";Lausanne", "aff_country_unique_index": "0;1;0;0;1", "aff_country_unique": "United States;Switzerland" }, { "id": "3D0mOtnHGR", "title": "Preprocessing Enhanced Image Compression for Machine Vision", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Recently, more and more images are compressed and sent to the back-end devices for machine analysis tasks (e.g. object detection) instead of being purely watched by humans. \nHowever, most traditional or learned image codecs are designed to minimize the distortion of the human visual system without considering the increased demand from machine vision systems. In this work, we propose a preprocessing enhanced image compression method for machine vision tasks to address this challenge. Instead of relying on the learned image codecs for end-to-end optimization, our framework is built upon the traditional non-differential codecs, which means it is standard compatible and can be easily deployed in practical applications. Specifically, we propose a neural preprocessing module before the encoder to maintain the useful semantic information for the downstream tasks and suppress the irrelevant information for bitrate saving. Furthermore, our neural preprocessing module is quantization adaptive and can be used in different compression ratios. \nMore importantly, to jointly optimize the preprocessing module with the downstream machine vision tasks, we introduce the proxy network for the traditional non-differential codecs in the back-propagation stage. We provide extensive experiments by evaluating our compression method for several representative downstream tasks with different backbone networks. 
Experimental results show our method achieves a better trade-off between the coding bitrate and the performance of the downstream machine vision tasks by saving about 20\\% bitrate.", "keywords": "image compression;machine vision;preprocessing", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Guo Lu;Xingtong Ge;Tianxiong Zhong;Jing Geng;Guosheng Yu", "authorids": "~Guo_Lu2;~Xingtong_Ge1;~Tianxiong_Zhong1;~Jing_Geng1;~Guosheng_Yu1", "gender": "M;M;M;F;M", "homepage": "https://guolusjtu.github.io/guoluhomepage/;https://xingtongge.github.io/;;;http://www.nohomepage.org", "dblp": "76/7805;;322/3730;;", "google_scholar": "R9iwlJcAAAAJ;Rf8UmtoAAAAJ;;;", "orcid": ";;;0000-0003-4076-6134;", "linkedin": ";xingtong-ge/;;;", "or_profile": "~Guo_Lu2;~Xingtong_Ge1;~Tianxiong_Zhong1;~Jing_Geng1;~Guosheng_Yu1", "aff": "Shanghai Jiaotong University;Beijing Institute of Technology;Beijing Institute of Technology;Beijing Institute of Technology;", "aff_domain": "sjtu.edu.cn;bit.edu.cn;bit.edu.cn;bit.edu.cn;", "position": "Assistant Professor;MS student;MS student;Assistant Professor;", "bibtex": "@misc{\nlu2024preprocessing,\ntitle={Preprocessing Enhanced Image Compression for Machine Vision},\nauthor={Guo Lu and Xingtong Ge and Tianxiong Zhong and Jing Geng and Guosheng Yu},\nyear={2024},\nurl={https://openreview.net/forum?id=3D0mOtnHGR}\n}", "github": "", "project": "", "reviewers": "fHZ6;uQPP;maca", "site": "https://openreview.net/forum?id=3D0mOtnHGR", "pdf_size": 12594433, "rating": "3;3;5", "confidence": "5;5;5", "soundness": "2;2;3", "contribution": "1;2;3", "presentation": "2;2;3", "wc_summary": "55;32;41", "wc_strengths": "20;23;47", "wc_weaknesses": "178;200;174", "wc_questions": "5;3;4", "wc_review": "258;258;266", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 3.6666666666666665, 0.9428090415820634 ], "confidence_avg": [ 5.0, 0.0 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.816496580927726 ], "presentation_avg": [ 2.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 42.666666666666664, 9.46337971105226 ], "wc_strengths_avg": [ 30.0, 12.083045973594572 ], "wc_weaknesses_avg": [ 184.0, 11.430952132988164 ], "wc_questions_avg": [ 4.0, 0.816496580927726 ], "wc_review_avg": [ 260.6666666666667, 3.7712361663282534 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 3, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 26, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10381605748897511859&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 9, "aff_unique_index": "0;1;1;1", "aff_unique_norm": "Shanghai Jiao Tong University;Beijing Institute of Technology", "aff_unique_dep": ";", "aff_unique_url": "https://www.sjtu.edu.cn;http://www.bit.edu.cn/", "aff_unique_abbr": "SJTU;BIT", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "China" }, { "id": "3DPTnFokLp", "title": "Benchmarking Multimodal Variational Autoencoders: CdSprites+ Dataset and Toolkit", "track": "main", "status": "Desk Reject", "tldr": "", "abstract": "Multimodal Variational Autoencoders (VAEs) have been the subject of intense research in the past years as they can integrate multiple modalities into a 
joint representation and can thus serve as a promising tool for both data classification and generation. Several approaches toward multimodal VAE learning have been proposed so far, their comparison and evaluation have however been rather inconsistent. One reason is that the models differ at the implementation level, another problem is that the datasets commonly used in these cases were not initially designed to evaluate multimodal generative models. This paper addresses both mentioned issues. First, we propose a toolkit for systematic multimodal VAE training and comparison. The toolkit currently comprises 4 existing multimodal VAEs and 6 commonly used benchmark datasets along with instructions on how to easily add a new model or a dataset. Second, we present a disentangled bimodal dataset designed to comprehensively evaluate the joint generation and cross-generation capabilities across multiple difficulty levels. We demonstrate the utility of our dataset by comparing the implemented state-of-the-art models.", "keywords": "variational autoencoders;multimodal generative models;multimodal datasets;benchmark toolkits", "primary_area": "datasets and benchmarks", "supplementary_material": "/attachment/bc058164973cba4ee50609720a7f7173ada9dca6.zip", "author": "Gabriela Sejnova;Michal Vavrecka;Karla Stepanova", "authorids": "~Gabriela_Sejnova1;~Michal_Vavrecka1;~Karla_Stepanova1", "gender": "F;;F", "homepage": ";;http://karlastepanova.cz", "dblp": ";;", "google_scholar": ";AhgkbbIAAAAJ;I-PURrEAAAAJ", "orcid": "0000-0002-0045-6425;;0000-0003-4239-2092", "linkedin": ";;", "or_profile": "~Gabriela_Sejnova1;~Michal_Vavrecka1;~Karla_Stepanova1", "aff": ";;", "aff_domain": ";;", "position": ";;", "bibtex": "@misc{\nsejnova2024benchmarking,\ntitle={Benchmarking Multimodal Variational Autoencoders: CdSprites+ Dataset and Toolkit},\nauthor={Gabriela Sejnova and Michal Vavrecka and Karla Stepanova},\nyear={2024},\nurl={https://openreview.net/forum?id=3DPTnFokLp}\n}", "github": "", "project": "", "reviewers": "8MxM;naTF;EZ4B;2Pvg", "site": "https://openreview.net/forum?id=3DPTnFokLp", "pdf_size": 4416460, "rating": "3;5;5;6", "confidence": "5;4;3;3", "soundness": "3;3;3;3", "contribution": "1;2;2;3", "presentation": "3;2;2;3", "wc_summary": "46;98;112;32", "wc_strengths": "37;50;60;31", "wc_weaknesses": "681;327;204;23", "wc_questions": "58;145;78;3", "wc_review": "822;620;454;89", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "399;448;796;174", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 4.75, 1.0897247358851685 ], "confidence_avg": [ 3.75, 0.82915619758885 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 72.0, 33.734255586866 ], "wc_strengths_avg": [ 44.5, 11.280514172678478 ], "wc_weaknesses_avg": [ 308.75, 240.5871723513122 ], "wc_questions_avg": [ 71.0, 50.788778288121875 ], "wc_review_avg": [ 496.25, 268.82371082179486 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 454.25, 222.72446542757712 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 9, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.899228803025897, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=15045849436249823363&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3 }, { "id": "3DdCB6MRvu", "title": "3D Tissue Reconstruction and Generation for Single-Cell Spatial Transcriptomics using Neural Radiance Fields", "track": 
"main", "status": "Withdraw", "tldr": "", "abstract": "Single-cell spatial transcriptomics (scST) is a groundbreaking technique that allows for the exploration of gene expression patterns, cell-cell interactions, and tissue organization at the single-cell level. Traditional approaches in scST reconstruction mainly focus on assigning two-dimensional (2D) coordinates to individual cells within a pre-established region. This often requires a large amount of 2D slice data, such as ssDNAs images, which escalates both costs and the complexity involved in studying and reconstructing the tissue's three-dimensional (3D) organization. Here, we introduce a novel method for scST reconstruction, which is a Neural Radiance Fields (NeRF)-based 3D-aware generative model termed STscan, that aims to reconstruct a 3D scST scene using a minimal amount from 2D images (fewer than 10). Additionally, STscan can identify cell types and their expression levels within this 3D environment. To the best of our knowledge, STscan is the first NeRF-based method specifically designed for single-cell ST reconstruction, and it is the first end-to-end solution capable of directly reconstructing in vitro cell-cell environments from ssDNA images. This approach has the potential to significantly reduce both the complexity and cost associated with scST studies.", "keywords": "Single-Cell Spatial Transcriptomics;Neural Radiance Fields;3D reconstruction", "primary_area": "applications to physical sciences (physics, chemistry, biology, etc.)", "supplementary_material": "", "author": "Yantong Cai;Xiaoxue Chen;Lin Li;Guangchuang Yu;Hao Zhao", "authorids": "~Yantong_Cai1;~Xiaoxue_Chen1;~Lin_Li22;~Guangchuang_Yu1;~Hao_Zhao1", "gender": "F;F;;M;M", "homepage": "https://github.com/yangtcai;https://air.tsinghua.edu.cn/;;https://yulab-smu.top/;https://sites.google.com/view/fromandto", "dblp": "369/6081;;;;08/3737-2.html", "google_scholar": ";;;https://scholar.google.com/citations?hl=zh-CN;ygQznUQAAAAJ", "orcid": "0000-0003-2137-4979;;0000-0002-6522-1889;0000-0002-6485-8781;", "linkedin": ";;;;", "or_profile": "~Yantong_Cai1;~Xiaoxue_Chen1;~Lin_Li22;~Guangchuang_Yu1;~Hao_Zhao1", "aff": "Dermatology Hospital, Southern Medical University;Tsinghua University;Southern Methodist University, Southern Methodist University;Southern Medical University;Peking University", "aff_domain": "smu.edu;tsinghua.edu.cn;smu.edu;smu.edu.cn;pku.edu.cn", "position": "Postdoc;PhD student;MS student;Full Professor;Postdoc", "bibtex": "@misc{\ncai2024d,\ntitle={3D Tissue Reconstruction and Generation for Single-Cell Spatial Transcriptomics using Neural Radiance Fields},\nauthor={Yantong Cai and Xiaoxue Chen and Lin Li and Guangchuang Yu and Hao Zhao},\nyear={2024},\nurl={https://openreview.net/forum?id=3DdCB6MRvu}\n}", "github": "", "project": "", "reviewers": "2SGX;Vcft;TxGH", "site": "https://openreview.net/forum?id=3DdCB6MRvu", "pdf_size": 4712870, "rating": "3;3;5", "confidence": "5;3;4", "soundness": "2;2;3", "contribution": "2;2;2", "presentation": "2;2;2", "wc_summary": "71;127;73", "wc_strengths": "31;21;60", "wc_weaknesses": "188;362;144", "wc_questions": "72;5;124", "wc_review": "362;515;401", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 3.6666666666666665, 0.9428090415820634 ], "confidence_avg": [ 4.0, 0.816496580927726 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.0, 0.0 ], "wc_summary_avg": [ 
90.33333333333333, 25.94010194445829 ], "wc_strengths_avg": [ 37.333333333333336, 16.539514973407037 ], "wc_weaknesses_avg": [ 231.33333333333334, 94.12521211426593 ], "wc_questions_avg": [ 67.0, 48.71002634639676 ], "wc_review_avg": [ 426.0, 64.91532946846992 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 3, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:v5UVPhgjLnYJ:scholar.google.com/&scioq=3D+Tissue+Reconstruction+and+Generation+for+Single-Cell+Spatial+Transcriptomics+using+Neural+Radiance+Fields&hl=en&as_sdt=0,10", "gs_version_total": 0, "aff_unique_index": "0;1;2;0;3", "aff_unique_norm": "Southern Medical University;Tsinghua University;Southern Methodist University;Peking University", "aff_unique_dep": "Dermatology Hospital;;;", "aff_unique_url": "http://www.fsmu.edu.cn;https://www.tsinghua.edu.cn;https://www.smu.edu;http://www.pku.edu.cn", "aff_unique_abbr": ";THU;SMU;Peking U", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;1;0;0", "aff_country_unique": "China;United States" }, { "title": "Chain of Thought Empowers Transformers to Solve Inherently Serial Problems", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19524", "id": "3EWTEy9MTM", "author_site": "Zhiyuan Li, Hong Liu, Denny Zhou, Tengyu Ma", "tldr": "", "abstract": "Generating a sequence of intermediate steps, \\emph{a.k.a.}, a chain of thought (CoT), is a highly effective method to improve the accuracy of large language models (LLMs) on arithmetics and symbolic reasoning tasks. However, the mechanism behind CoT remains unclear. \nThis work provides a theoretical understanding of the power of CoT for decoder-only transformers through the lens of expressiveness. Conceptually, CoT empowers the model with the ability to perform inherently serial computation, which is otherwise lacking in transformers, especially when depth is low. Given input length $n$, previous works have constant-depth transformers with finite precision $\\mathsf{poly}(n)$ embedding size can only solve problems in $\\mathsf{TC}^0$ without CoT. We first show an even tighter expressiveness upper bound for constant-depth transformers with constant-bit precision, which can only solve problems in $\\mathsf{AC}^0$, a proper subset of $ \\mathsf{TC}^0$. However, with $T$ steps of CoT, constant-depth transformers using constant-bit precision and $O(\\log n)$ embedding size can solve any problem solvable by boolean circuits of size $T$. 
Empirically, enabling CoT dramatically improves the accuracy for tasks that are hard for parallel computation, including the composition of permutation groups, iterated squaring, and circuit value problems, especially for low-depth transformers.", "keywords": "Chain of thought;language modeling;circuit complexity;deep learning theory", "primary_area": "learning theory", "supplementary_material": "", "author": "Zhiyuan Li;Hong Liu;Denny Zhou;Tengyu Ma", "authorids": "~Zhiyuan_Li2;~Hong_Liu5;~Denny_Zhou1;~Tengyu_Ma1", "gender": "M;M;M;", "homepage": "https://zhiyuanli.ttic.edu;;http://ai.stanford.edu/~tengyuma/;https://dennyzhou.github.io/", "dblp": "l/ZhiyuanLi;;54/9061;178/3277", "google_scholar": "https://scholar.google.com/citations?hl=en;BUc2uq0AAAAJ;i38QlUwAAAAJ;UwLsYw8AAAAJ", "orcid": ";;;", "linkedin": ";;;", "or_profile": "~Zhiyuan_Li2;~Hong_Liu5;~Tengyu_Ma1;~Dengyong_Zhou2", "aff": "Toyota Technological Institute at Chicago;Stanford University;Facebook AI Research;Google DeepMind", "aff_domain": "ttic.edu;stanford.edu;fb.com;google.com", "position": "Assistant Professor;PhD student;Visiting Scientist;Research Scientist", "bibtex": "@inproceedings{\nli2024chain,\ntitle={Chain of Thought Empowers Transformers to Solve Inherently Serial Problems},\nauthor={Zhiyuan Li and Hong Liu and Denny Zhou and Tengyu Ma},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=3EWTEy9MTM}\n}", "github": "", "project": "", "reviewers": "pRpF;qiA8;zX88;woBt;Aro9;wS3v", "pdf_size": 4402629, "rating": "3;5;6;8;8;8", "confidence": "4;4;4;5;2;2", "soundness": "3;3;4;4;3;3", "contribution": "4;3;2;3;3;3", "presentation": "2;3;3;3;4;3", "wc_summary": "41;163;97;109;137;38", "wc_strengths": "253;38;124;137;68;45", "wc_weaknesses": "317;107;712;434;28;296", "wc_questions": "173;115;111;124;1;3", "wc_review": "784;423;1044;804;234;382", "wc_reply_reviewers": "0;0;0;125;0;0", "wc_reply_authors": "615;497;239;749;24;161", "reply_reviewers": "0;0;0;1;0;0", "reply_authors": "1;1;1;2;1;1", "rating_avg": [ 6.333333333333333, 1.8856180831641267 ], "confidence_avg": [ 3.5, 1.118033988749895 ], "soundness_avg": [ 3.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 3.0, 0.5773502691896257 ], "presentation_avg": [ 3.0, 0.5773502691896257 ], "wc_summary_avg": [ 97.5, 46.03531253288067 ], "wc_strengths_avg": [ 110.83333333333333, 73.64649044968509 ], "wc_weaknesses_avg": [ 315.6666666666667, 222.7724299718337 ], "wc_questions_avg": [ 87.83333333333333, 63.99587660327986 ], "wc_review_avg": [ 611.8333333333334, 284.1879757406276 ], "wc_reply_reviewers_avg": [ 20.833333333333332, 46.58474953124561 ], "wc_reply_authors_avg": [ 380.8333333333333, 258.08552630647245 ], "reply_reviewers_avg": [ 0.16666666666666666, 0.372677996249965 ], "reply_authors_avg": [ 1.1666666666666667, 0.3726779962499649 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.3952847075210475, "gs_citation": 109, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11728270641767049962&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=3EWTEy9MTM", "pdf": "https://openreview.net/pdf?id=3EWTEy9MTM", "email": "ttic.edu;stanford.edu;fb.com;google.com", "author_num": 4, "aff_unique_index": "0;1;2;3", "aff_unique_norm": "Toyota Technological Institute at Chicago;Stanford University;Meta;Google", "aff_unique_dep": ";;Facebook AI Research;Google DeepMind", "aff_unique_url": 
"https://www.tti-chicago.org;https://www.stanford.edu;https://research.facebook.com;https://deepmind.com", "aff_unique_abbr": "TTI Chicago;Stanford;FAIR;DeepMind", "aff_campus_unique_index": "0;1", "aff_campus_unique": "Chicago;Stanford;", "aff_country_unique_index": "0;0;0;1", "aff_country_unique": "United States;United Kingdom" }, { "title": "Self-Supervised Heterogeneous Graph Learning: a Homophily and Heterogeneity View", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19523", "id": "3FJOKjooIj", "author_site": "YUJIE MO, Feiping Nie, Ping Hu, Heng Tao Shen, Zheng Zhang, Xinchao Wang, Xiaofeng Zhu", "tldr": "", "abstract": "Self-supervised heterogeneous graph learning has achieved promising results in various real applications, but it still suffers from the following issues: (i) meta-paths can be employed to capture the homophily in the heterogeneous graph, but meta-paths are human-defined, requiring substantial expert knowledge and computational costs; and (ii) the heterogeneity in the heterogeneous graph is usually underutilized, leading to the loss of task-related information. To solve these issues, this paper proposes to capture both homophily and heterogeneity in the heterogeneous graph without pre-defined meta-paths. Specifically, we propose to learn a self-expressive matrix to capture the homophily from the subspace and nearby neighbors. Meanwhile, we propose to capture the heterogeneity by aggregating the information of nodes from different types. We further design a consistency loss and a specificity loss, respectively, to extract the consistent information between homophily and heterogeneity and to preserve their specific task-related information. We theoretically analyze that the learned homophilous representations exhibit the grouping effect to capture the homophily, and considering both homophily and heterogeneity introduces more task-related information. 
Extensive experimental results verify the superiority of the proposed method on different downstream tasks.", "keywords": "Graph representation learning;Heterogeneous graph;Self-supervised learning", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Yujie Mo;Feiping Nie;Ping Hu;Heng Tao Shen;Zheng Zhang;Xinchao Wang;Xiaofeng Zhu", "authorids": "~Yujie_Mo1;~Feiping_Nie2;~Ping_Hu3;~Heng_Tao_Shen3;~Zheng_Zhang7;~Xinchao_Wang1;~Xiaofeng_Zhu7", "gender": ";M;M;M;M;M;M", "homepage": "https://yujiemo.github.io/;https://dblp.org/pid/80/5755.html;http://feinanshan.github.io;;https://sites.google.com/site/seanzhuxf/;https://cfm.uestc.edu.cn/~shenht/;https://sites.google.com/site/sitexinchaowang/", "dblp": "282/0552;;53/5490-1;181/2621-6.html;60/4671-1;s/HTShen;", "google_scholar": "MH4nZY0AAAAJ;;ddrD2TgAAAAJ;tpVOb2EAAAAJ;https://scholar.google.com/citations?hl=en;https://scholar.google.com.au/citations?user=krryaDkAAAAJ;https://scholar.google.com.tw/citations?user=w69Buq0AAAAJ", "orcid": "0000-0001-7784-6221;;;0000-0003-1470-6998;0000-0001-6840-0578;;", "linkedin": ";;;;;;", "or_profile": "~Yujie_Mo1;~Feiping_Nie2;~Ping_Hu3;~Zheng_Zhang7;~Xiaofeng_Zhu7;~Hengtao_Shen1;~Xinchao_WANG3", "aff": "University of Electronic Science and Technology of China;Northwest Polytechnical University Xi'an;University of Electronic Science and Technology of China;Harbin Institute of Technology;University of Electronic Science and Technology of China;Tongji University;National University of Singapore", "aff_domain": "uestc.edu.cn;nwpu.edu.cn;uestc.edu.cn;hit.edu.cn;uestc.edu.cn;tongji.edu.cn;nus.edu", "position": "PhD student;Full Professor;Full Professor;Full Professor;Full Professor;Full Professor;Assistant Professor", "bibtex": "@inproceedings{\nmo2024selfsupervised,\ntitle={Self-Supervised Heterogeneous Graph Learning: a Homophily and Heterogeneity View},\nauthor={Yujie Mo and Feiping Nie and Ping Hu and Heng Tao Shen and Zheng Zhang and Xinchao Wang and Xiaofeng Zhu},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=3FJOKjooIj}\n}", "github": "", "project": "", "reviewers": "BScY;h7xr;6ShR;rAzi;EpeM;Zp3d", "pdf_size": 7690475, "rating": "6;6;6;8;8;8", "confidence": "4;3;4;4;5;3", "soundness": "3;3;2;3;4;3", "contribution": "3;4;2;4;3;3", "presentation": "3;3;3;3;3;4", "wc_summary": "81;59;58;86;75;93", "wc_strengths": "99;46;28;81;139;126", "wc_weaknesses": "73;88;227;75;91;237", "wc_questions": "89;51;187;58;2;6", "wc_review": "342;244;500;300;307;462", "wc_reply_reviewers": "0;0;164;0;0;0", "wc_reply_authors": "354;331;1712;377;213;973", "reply_reviewers": "0;0;2;0;0;0", "reply_authors": "1;1;4;1;1;2", "rating_avg": [ 7.0, 1.0 ], "confidence_avg": [ 3.8333333333333335, 0.6871842709362768 ], "soundness_avg": [ 3.0, 0.5773502691896257 ], "contribution_avg": [ 3.1666666666666665, 0.6871842709362768 ], "presentation_avg": [ 3.1666666666666665, 0.3726779962499649 ], "wc_summary_avg": [ 75.33333333333333, 13.072447700751718 ], "wc_strengths_avg": [ 86.5, 39.928060308509856 ], "wc_weaknesses_avg": [ 131.83333333333334, 71.17681426482145 ], "wc_questions_avg": [ 65.5, 62.12017922275069 ], "wc_review_avg": [ 359.1666666666667, 91.45931092871602 ], "wc_reply_reviewers_avg": [ 27.333333333333332, 61.11919138499424 ], "wc_reply_authors_avg": [ 660.0, 530.1647542666965 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.74535599249993 ], 
"reply_authors_avg": [ 1.6666666666666667, 1.1055415967851332 ], "replies_avg": [ 21, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": 0.24253562503633294, "gs_citation": 9, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5048017698044699648&as_sdt=800005&sciodt=0,15&hl=en", "gs_version_total": 2, "openreview": "https://openreview.net/forum?id=3FJOKjooIj", "pdf": "https://openreview.net/pdf?id=3FJOKjooIj", "email": "uestc.edu.cn;nwpu.edu.cn;uestc.edu.cn;hit.edu.cn;uestc.edu.cn;tongji.edu.cn;nus.edu", "author_num": 7, "aff_unique_index": "0;1;0;2;0;3;4", "aff_unique_norm": "University of Electronic Science and Technology of China;Northwest Polytechnical University;Harbin Institute of Technology;Tongji University;National University of Singapore", "aff_unique_dep": ";;;;", "aff_unique_url": "https://www.uestc.edu.cn;http://www.nwpu.edu.cn;http://www.hit.edu.cn/;https://www.tongji.edu.cn;https://www.nus.edu.sg", "aff_unique_abbr": "UESTC;NWPU;HIT;Tongji;NUS", "aff_campus_unique_index": "1;2", "aff_campus_unique": ";Xi'an;Harbin", "aff_country_unique_index": "0;0;0;0;0;0;1", "aff_country_unique": "China;Singapore" }, { "id": "3GDKJSQnW2", "title": "Pivotal Prompt Tuning for Video Dynamic Editing", "track": "main", "status": "Reject", "tldr": "", "abstract": "Text-conditioned image editing has recently provided high-quality edits on images based on diffusion frameworks. Unfortunately, this success did not carry over to video editing, which continues to be challenging. Video editing is limited to rigid editing such as object overlay and style transfer. This paper proposes pivotal dynamic editing (PDEdit) for performing spatial-temporal non-rigid video editing based only on the target text, which has never been attempted before. PDEdit is capable of changing the motion of an object/person in the video, either at a specific moment or throughout the video, while preserving the temporal consistency of edited motions and a high level of fidelity to the original input video. In contrast to previous works, the proposed method performs editing based only on the input video and target text. It does not require any other auxiliary inputs (e.g., object masks or source video captions). Based on the video diffusion model, PDEdit using the proposed prompt pivoting leverages the target text prompt for editing the input video. The quality and adaptability of the proposed method on numerous input videos from different domains show the proposed to be highly effective. It can produce high-fidelity video edits under a single unified PDEdit framework. The code for this work will be made publicly available.", "keywords": "Video Editing;Multi-modal video generation;Prompt Analysis;Diffusion model", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/8c5f85ae029cba91c9ab3b50f72e63a6c0436ca0.zip", "author": "Sunjae Yoon;GwanHyeong Koo;Ji Woo Hong;Joshua Tian Jin Tee;Chang D. 
Yoo", "authorids": "~Sunjae_Yoon1;~GwanHyeong_Koo1;~Ji_Woo_Hong1;~Joshua_Tian_Jin_Tee1;~Chang_D._Yoo1", "gender": "M;M;M;M;M", "homepage": "https://dbstjswo505.github.io/;https://kookie12.github.io/;https://slsp.kaist.ac.kr/xe/;;https://sanctusfactory.com/family.php", "dblp": "273/3911;358/7119;312/8033;;31/7819", "google_scholar": "2A2lRoUAAAAJ;https://scholar.google.co.kr/citations?user=qDCTLZgAAAAJ;;x90yFvMAAAAJ;gFWgUQEAAAAJ", "orcid": "0000-0001-7458-5273;;0000-0002-3758-0307;;0000-0002-0756-7179", "linkedin": "sunjae-yoon-133294333/;;;;", "or_profile": "~Sunjae_Yoon1;~GwanHyeong_Koo1;~Ji_Woo_Hong1;~Joshua_Tian_Jin_Tee1;~Chang_D._Yoo1", "aff": "Korea Advanced Institute of Science and Technology (KAIST);Korea Advanced Institute of Science and Technology (KAIST);Korea Advanced Institute of Science & Technology;KAIST, Korea Advanced Institute of Science & Technology;Korea Advanced Institute of Science & Technology", "aff_domain": "kaist.ac.kr;kaist.ac.kr;kaist.ac.kr;ee.kaist.ac.kr;kaist.ac.kr", "position": "PhD student;MS student;PhD student;PhD student;Full Professor", "bibtex": "@misc{\nyoon2024pivotal,\ntitle={Pivotal Prompt Tuning for Video Dynamic Editing},\nauthor={Sunjae Yoon and GwanHyeong Koo and Ji Woo Hong and Joshua Tian Jin Tee and Chang D. Yoo},\nyear={2024},\nurl={https://openreview.net/forum?id=3GDKJSQnW2}\n}", "github": "", "project": "", "reviewers": "q1QA;9TJK;UHtg;1N5p", "site": "https://openreview.net/forum?id=3GDKJSQnW2", "pdf_size": 11715902, "rating": "5;5;5;5", "confidence": "4;4;4;3", "soundness": "3;3;2;1", "contribution": "3;3;2;2", "presentation": "3;3;2;2", "wc_summary": "54;47;46;45", "wc_strengths": "18;27;50;28", "wc_weaknesses": "131;151;87;90", "wc_questions": "39;5;85;16", "wc_review": "242;230;268;179", "wc_reply_reviewers": "148;0;0;51", "wc_reply_authors": "619;613;368;355", "reply_reviewers": "2;0;0;1", "reply_authors": "3;1;1;1", "rating_avg": [ 5.0, 0.0 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.25, 0.82915619758885 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 48.0, 3.5355339059327378 ], "wc_strengths_avg": [ 30.75, 11.776565713313877 ], "wc_weaknesses_avg": [ 114.75, 27.206387117733954 ], "wc_questions_avg": [ 36.25, 30.70321644388418 ], "wc_review_avg": [ 229.75, 32.36027657483786 ], "wc_reply_reviewers_avg": [ 49.75, 60.42505688867823 ], "wc_reply_authors_avg": [ 488.75, 127.35064781931814 ], "reply_reviewers_avg": [ 0.75, 0.82915619758885 ], "reply_authors_avg": [ 1.5, 0.8660254037844386 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:LFWtCGLN1ZoJ:scholar.google.com/&scioq=Pivotal+Prompt+Tuning+for+Video+Dynamic+Editing&hl=en&as_sdt=0,44", "gs_version_total": 0, "aff_unique_index": "0;0;0;0;0", "aff_unique_norm": "Korea Advanced Institute of Science and Technology", "aff_unique_dep": "", "aff_unique_url": "https://www.kaist.ac.kr", "aff_unique_abbr": "KAIST", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "South Korea" }, { "id": "3GunDQNKFJ", "title": "Learning-Retrieval-Revision For Large Language Model Domain Adaptation", "track": "main", "status": "Reject", "tldr": "", "abstract": "While large language models (LLMs) like GPT-4 have recently demonstrated astonishing zero-shot capabilities in general domain tasks, they often generate content with hallucinations in specific 
domains such as Chinese law, hindering their application in these areas. This is typically due to the absence of training data that encompasses such a specific domain, preventing GPT-4 from acquiring in-domain knowledge. A pressing challenge is that it\u2019s not plausible to continue training LLMs of such scale on in-domain data.\n\nThis paper introduces a simple and effective domain adaptation framework for GPT-4 by reformulating generation as an adapt-retrieve-revise process. The initial step is to adapt an affordable 7B LLM to the target domain by continuing learning on public in-domain data. When solving a task, we leverage the adapted LLM to generate a draft answer given a task query. Then, the draft answers will be used to retrieve supporting evidence candidates from an external in-domain knowledge base. Finally, the draft answer and retrieved evidence are concatenated into a whole prompt to let GPT-4 assess the evidence and revise the draft answer to generate the final answer.\n\nOur proposal combines the advantages of the efficiency of adapting a smaller 7B model with the evidence-assessing capability of GPT-4 and effectively prevents GPT-4 from generating hallucinatory content. In the zero-shot setting of four Chinese legal tasks, our method improves accuracy by 33.3% compared to the direct generation by GPT-4. When compared to two stronger retrieval-based baselines, our method outperforms them by 15.4% and 23.9%. Our code will be released.", "keywords": "large language models;domain adaptation;retrieval-based generation", "primary_area": "generative models", "supplementary_material": "", "author": "Zhen Wan;Yating Zhang;Yexiang Wang;Fei Cheng;Sadao Kurohashi", "authorids": "~Zhen_Wan1;~Yating_Zhang1;~Yexiang_Wang1;~Fei_Cheng2;~Sadao_Kurohashi1", "gender": "M;F;;M;M", "homepage": ";;;https://researchmap.jp/chengfei?lang=en;https://nlp.ist.i.kyoto-u.ac.jp/member/kuro/index.html", "dblp": ";29/5889;;06/5591-2.html;42/2149", "google_scholar": "OH_1qwMAAAAJ;;;https://scholar.google.com/citations?hl=en;https://scholar.google.co.jp/citations?user=gpKS5P0AAAAJ", "orcid": ";;;;0000-0001-5398-8399", "linkedin": "zhen-wan-8531251ab/;;;;", "or_profile": "~Zhen_Wan1;~Yating_Zhang1;~Yexiang_Wang1;~Fei_Cheng2;~Sadao_Kurohashi1", "aff": "Kyoto University;;;Kyoto University;Kyoto University", "aff_domain": "kyoto-u.ac.jp;;;kyoto-u.ac.jp;kyoto-u.ac.jp", "position": "PhD student;;;Associate Professor;Full Professor", "bibtex": "@misc{\nwan2024learningretrievalrevision,\ntitle={Learning-Retrieval-Revision For Large Language Model Domain Adaptation},\nauthor={Zhen Wan and Yating Zhang and Yexiang Wang and Fei Cheng and Sadao Kurohashi},\nyear={2024},\nurl={https://openreview.net/forum?id=3GunDQNKFJ}\n}", "github": "", "project": "", "reviewers": "kf7S;CEqV;TieX;n3Gy", "site": "https://openreview.net/forum?id=3GunDQNKFJ", "pdf_size": 756366, "rating": "3;5;5;6", "confidence": "3;4;4;4", "soundness": "2;3;2;3", "contribution": "2;2;3;3", "presentation": "2;2;3;2", "wc_summary": "102;126;83;92", "wc_strengths": "63;101;38;72", "wc_weaknesses": "650;106;167;56", "wc_questions": "21;77;3;40", "wc_review": "836;410;291;260", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "802;709;649;583", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 4.75, 1.0897247358851685 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 100.75, 16.052647756678645 ], 
"wc_strengths_avg": [ 68.5, 22.522211259110417 ], "wc_weaknesses_avg": [ 244.75, 237.25026343504868 ], "wc_questions_avg": [ 35.25, 27.42603689926782 ], "wc_review_avg": [ 449.25, 230.20357838226582 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 685.75, 80.56480310905005 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 10, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.9271726499455306, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:6C9WMJbxT4oJ:scholar.google.com/&scioq=Learning-Retrieval-Revision+For+Large+Language+Model+Domain+Adaptation&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;0", "aff_unique_norm": "Kyoto University", "aff_unique_dep": "", "aff_unique_url": "https://www.kyoto-u.ac.jp", "aff_unique_abbr": "Kyoto U", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "Japan" }, { "title": "On Harmonizing Implicit Subpopulations", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19522", "id": "3GurO0kRue", "author_site": "Feng Hong, Jiangchao Yao, YUEMING LYU, Zhihan Zhou, Ivor Tsang, Ya Zhang, Yanfeng Wang", "tldr": "", "abstract": "Machine learning algorithms learned from data with skewed distributions usually suffer from poor generalization, especially when minority classes matter as much as, or even more than majority ones. This is more challenging on class-balanced data that has some hidden imbalanced subpopulations, since prevalent techniques mainly conduct class-level calibration and cannot perform subpopulation-level adjustments without subpopulation annotations. Regarding implicit subpopulation imbalance, we reveal that the key to alleviating the detrimental effect lies in effective subpopulation discovery with proper rebalancing. We then propose a novel subpopulation-imbalanced learning method called Scatter and HarmonizE (SHE). Our method is built upon the guiding principle of optimal data partition, which involves assigning data to subpopulations in a manner that maximizes the predictive information from inputs to labels. With theoretical guarantees and empirical evidences, SHE succeeds in identifying the hidden subpopulations and encourages subpopulation-balanced predictions. 
Extensive experiments on various benchmark datasets show the effectiveness of SHE.", "keywords": "imbalanced learning;subpopulation imbalance", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Feng Hong;Jiangchao Yao;Yueming Lyu;Zhihan Zhou;Ivor Tsang;Ya Zhang;Yanfeng Wang", "authorids": "~Feng_Hong1;~Jiangchao_Yao1;~Yueming_Lyu1;~Zhihan_Zhou2;~Ivor_Tsang1;~Ya_Zhang1;~Yanfeng_Wang1", "gender": "M;M;M;;F;M;M", "homepage": ";https://sunarker.github.io/;https://yueminglyu.github.io/;;https://annzhanglion.github.io/;https://cmic.sjtu.edu.cn/wangyanfeng/;https://www.a-star.edu.sg/cfar/about-cfar/management/prof-ivor-tsang", "dblp": "68/1260-4;166/5900;;226/5688-2;85/3714-2;55/5407-1.html;35/5873", "google_scholar": "DCTAaNQAAAAJ;w8oDh9QAAAAJ;uQXB6-oAAAAJ;;pbjw9sMAAAAJ;https://scholar.google.com/citations?hl=zh-CN;rJMOlVsAAAAJ", "orcid": ";;;0000-0002-9475-465X;0000-0002-5390-9053;0000-0002-3196-2347;", "linkedin": ";;;;;;", "or_profile": "~Feng_Hong1;~Jiangchao_Yao1;~Yueming_Lyu1;~Zhihan_Zhou2;~Ya_Zhang1;~Yanfeng_Wang1;~Ivor_W_Tsang1", "aff": "Shanghai Jiaotong University;Shanghai Artificial Intelligence Laboratory;Agency for Science, Technology and Research (A*STAR);Shanghai Jiaotong University;Shanghai Jiaotong University;Shanghai Jiaotong University;A*STAR", "aff_domain": "sjtu.edu.cn;pjlab.org.cn;astar.edu.sg;sjtu.edu.cn;sjtu.edu.cn;sjtu.edu.cn;cfar.a-star.edu.sg", "position": "PhD student;Researcher;Researcher;PhD student;Professor;Full Professor;Principal Researcher", "bibtex": "@inproceedings{\nhong2024on,\ntitle={On Harmonizing Implicit Subpopulations},\nauthor={Feng Hong and Jiangchao Yao and Yueming Lyu and Zhihan Zhou and Ivor Tsang and Ya Zhang and Yanfeng Wang},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=3GurO0kRue}\n}", "github": "", "project": "", "reviewers": "Dvju;FihB;acbx;TvvJ", "pdf_size": 4553670, "rating": "6;6;6;8", "confidence": "3;3;3;3", "soundness": "3;3;3;3", "contribution": "3;3;3;3", "presentation": "2;2;3;3", "wc_summary": "94;287;87;58", "wc_strengths": "74;185;112;21", "wc_weaknesses": "163;368;115;55", "wc_questions": "189;90;40;213", "wc_review": "520;930;354;347", "wc_reply_reviewers": "499;37;0;0", "wc_reply_authors": "2000;1373;1366;1666", "reply_reviewers": "2;1;0;0", "reply_authors": "6;4;3;4", "rating_avg": [ 6.5, 0.8660254037844386 ], "confidence_avg": [ 3.0, 0.0 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 131.5, 90.78683825313006 ], "wc_strengths_avg": [ 98.0, 59.728552636071804 ], "wc_weaknesses_avg": [ 175.25, 117.67832213283805 ], "wc_questions_avg": [ 133.0, 70.77075667251269 ], "wc_review_avg": [ 537.75, 236.81466909801006 ], "wc_reply_reviewers_avg": [ 134.0, 211.2735194007995 ], "wc_reply_authors_avg": [ 1601.25, 260.11283609233897 ], "reply_reviewers_avg": [ 0.75, 0.82915619758885 ], "reply_authors_avg": [ 4.25, 1.0897247358851685 ], "replies_avg": [ 27, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 8, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10533268120873124048&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 2, "openreview": "https://openreview.net/forum?id=3GurO0kRue", "pdf": "https://openreview.net/pdf?id=3GurO0kRue", "email": "sjtu.edu.cn;pjlab.org.cn;astar.edu.sg;sjtu.edu.cn;sjtu.edu.cn;sjtu.edu.cn;cfar.a-star.edu.sg", 
"author_num": 7, "aff_unique_index": "0;1;2;0;0;0;2", "aff_unique_norm": "Shanghai Jiao Tong University;Shanghai Artificial Intelligence Laboratory;Agency for Science, Technology and Research", "aff_unique_dep": ";;", "aff_unique_url": "https://www.sjtu.edu.cn;http://www.shailab.org/;https://www.a-star.edu.sg", "aff_unique_abbr": "SJTU;Shanghai AI Lab;A*STAR", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;1;0;0;0;1", "aff_country_unique": "China;Singapore" }, { "id": "3IyC5lQTSi", "title": "Fairness Through Matching for better group fairness", "track": "main", "status": "Reject", "tldr": "", "abstract": "Group unfairness, which refers to socially unacceptable bias favoring certain groups (e.g., white, male), is frequently observed ethical concern in AI.\nVarious algorithms have been developed to mitigate such group unfairness in trained models.\nHowever, a significant limitation of existing algorithms for group fairness is that trained group-fair models can discriminate against specific subsets or not be fair for individuals in the same sensitive group.\nThe primary goal of this research is to develop a method to find a good group-fair model in the sense that it discriminates less against subsets and treats individuals in the same sensitive group more fairly.\nFor this purpose, we introduce a new measure of group fairness called Matched Demographic Parity (MDP). \nAn interesting feature of MDP is that it corresponds a matching function (a function matching two individuals from two different sensitive groups) to each group-fair model. \nThen, we propose a learning algorithm to seek a group-fair model whose corresponding matching function matches similar individuals well.\nTheoretical justifications are fully provided, and experiments are conducted to illustrate the superiority of the proposed algorithm.", "keywords": "Fairness;Matched demographic parity", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/3b874a33fda93b1c3ee3758183d9f2dcb0e149ae.zip", "author": "Kunwoong Kim;Insung Kong;Jongjin Lee;Minwoo Chae;Yongdai Kim", "authorids": "~Kunwoong_Kim1;~Insung_Kong1;~Jongjin_Lee1;~Minwoo_Chae1;~Yongdai_Kim1", "gender": "M;M;M;M;M", "homepage": "https://sites.google.com/view/insungkong/home;;https://sds.postech.ac.kr/;;", "dblp": ";;185/1370;93/734;296/1715", "google_scholar": "NYdp2FQAAAAJ;https://scholar.google.com/citations?view_op=list_works;B3P2AqUAAAAJ;;", "orcid": ";;0000-0002-6495-9558;;", "linkedin": ";;;;", "or_profile": "~Insung_Kong1;~Jongjin_Lee1;~Minwoo_Chae1;~Yongdai_Kim1;~Kun_woong_Kim1", "aff": "Seoul National University;Seoul National University;POSTECH;Seoul National University;Seoul National University", "aff_domain": "snu.ac.kr;snu.ac.kr;postech.ac.kr;snu.ac.kr;snu.ac.kr", "position": "PhD student;PhD student;Associate Professor;Full Professor;PhD student", "bibtex": "@misc{\nkim2024fairness,\ntitle={Fairness Through Matching for better group fairness},\nauthor={Kunwoong Kim and Insung Kong and Jongjin Lee and Minwoo Chae and Yongdai Kim},\nyear={2024},\nurl={https://openreview.net/forum?id=3IyC5lQTSi}\n}", "github": "", "project": "", "reviewers": "diD4;9FFn;ZKn5", "site": "https://openreview.net/forum?id=3IyC5lQTSi", "pdf_size": 5719711, "rating": "5;6;6", "confidence": "4;3;2", "soundness": "3;4;3", "contribution": "2;3;3", "presentation": "2;3;2", "wc_summary": "46;26;59", "wc_strengths": "35;25;59", "wc_weaknesses": "231;168;300", "wc_questions": "8;77;9", 
"wc_review": "320;296;427", "wc_reply_reviewers": "0;14;236", "wc_reply_authors": "1181;679;865", "reply_reviewers": "0;1;1", "reply_authors": "3;1;2", "rating_avg": [ 5.666666666666667, 0.4714045207910317 ], "confidence_avg": [ 3.0, 0.816496580927726 ], "soundness_avg": [ 3.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 43.666666666666664, 13.572848714334887 ], "wc_strengths_avg": [ 39.666666666666664, 14.2672897060218 ], "wc_weaknesses_avg": [ 233.0, 53.907327887774215 ], "wc_questions_avg": [ 31.333333333333332, 32.293790252754306 ], "wc_review_avg": [ 347.6666666666667, 56.94636853117931 ], "wc_reply_reviewers_avg": [ 83.33333333333333, 108.10283170306975 ], "wc_reply_authors_avg": [ 908.3333333333334, 207.218617782176 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 2.0, 0.816496580927726 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.8660254037844385, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:maQ1k8I0q_MJ:scholar.google.com/&scioq=Fairness+Through+Matching+for+better+group+fairness&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;1;0;0", "aff_unique_norm": "Seoul National University;Pohang University of Science and Technology", "aff_unique_dep": ";", "aff_unique_url": "https://www.snu.ac.kr;https://www.postech.ac.kr", "aff_unique_abbr": "SNU;POSTECH", "aff_campus_unique_index": "1", "aff_campus_unique": ";Pohang", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "South Korea" }, { "id": "3J7foqnJkA", "title": "Understanding Parameter Saliency via Extreme Value Theory", "track": "main", "status": "Reject", "tldr": "", "abstract": "Deep neural networks are being increasingly implemented throughout society in recent years. 
It is useful to identify which parameters trigger misclassification in diagnosing undesirable model behaviors.\nThe concept of parameter saliency is proposed and used to diagnose convolutional neural networks (CNNs) by ranking \nconvolution filters that may have caused misclassification on the basis of parameter saliency.\nIt is also shown that fine-tuning the top ranking salient filters efficiently corrects misidentification on ImageNet.\nHowever, there is still a knowledge gap in terms of understanding why parameter saliency ranking can find the filters inducing misidentification.\nIn this work, we attempt to bridge the gap by analyzing parameter saliency ranking from a statistical viewpoint, namely, extreme value theory.\nWe first show that the existing work implicitly assumes that the gradient norm computed for each filter follows a normal distribution.\nThen, we clarify the relationship between parameter saliency and the score based on the peaks-over-threshold (POT) method, which is often used to model extreme values.\nFinally, we reformulate parameter saliency in terms of the POT method, where this reformulation is regarded as statistical anomaly detection and does not require the implicit assumptions of the existing formulation of parameter saliency.\nOur experimental results demonstrate that our reformulation can detect malicious filters as well.\nFurthermore, we show that the existing parameter saliency method exhibits a bias against the depth of layers in deep neural networks.\nIn particular, this bias has the potential to inhibit the discovery of filters that cause misidentification in situations where domain shift occurs.\nIn contrast, parameter saliency based on POT shows less of this bias.", "keywords": "parameter saliency;extreme value theory;XAI", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Shuo Wang;Issei Sato", "authorids": "~Shuo_Wang30;~Issei_Sato2", "gender": "M;", "homepage": "https://www.ml.is.s.u-tokyo.ac.jp/members-en;https://www.ml.is.s.u-tokyo.ac.jp/issei-sato-en", "dblp": ";", "google_scholar": ";", "orcid": ";", "linkedin": ";", "or_profile": "~Shuo_Wang30;~Issei_Sato2", "aff": "The University of Tokyo;The University of Tokyo", "aff_domain": "u-tokyo.ac.jp;u-tokyo.ac.jp", "position": "MS student;Full Professor", "bibtex": "@misc{\nwang2024understanding,\ntitle={Understanding Parameter Saliency via Extreme Value Theory},\nauthor={Shuo Wang and Issei Sato},\nyear={2024},\nurl={https://openreview.net/forum?id=3J7foqnJkA}\n}", "github": "", "project": "", "reviewers": "nAUC;HPzx;8wd7", "site": "https://openreview.net/forum?id=3J7foqnJkA", "pdf_size": 4673009, "rating": "5;6;6", "confidence": "4;3;2", "soundness": "3;3;2", "contribution": "2;3;3", "presentation": "3;2;3", "wc_summary": "61;44;67", "wc_strengths": "85;29;68", "wc_weaknesses": "127;481;163", "wc_questions": "50;32;53", "wc_review": "323;586;351", "wc_reply_reviewers": "0;50;114", "wc_reply_authors": "756;499;1395", "reply_reviewers": "0;1;2", "reply_authors": "2;2;3", "rating_avg": [ 5.666666666666667, 0.4714045207910317 ], "confidence_avg": [ 3.0, 0.816496580927726 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 57.333333333333336, 9.741092797468305 ], "wc_strengths_avg": [ 60.666666666666664, 23.442601296689656 ], "wc_weaknesses_avg": [ 257.0, 159.0723106011854 ], 
"wc_questions_avg": [ 45.0, 9.273618495495704 ], "wc_review_avg": [ 420.0, 117.93501035174697 ], "wc_reply_reviewers_avg": [ 54.666666666666664, 46.65714188512718 ], "wc_reply_authors_avg": [ 883.3333333333334, 376.70884719575616 ], "reply_reviewers_avg": [ 1.0, 0.816496580927726 ], "reply_authors_avg": [ 2.3333333333333335, 0.4714045207910317 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.8660254037844385, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:Dq8yVgWrnjQJ:scholar.google.com/&scioq=Understanding+Parameter+Saliency+via+Extreme+Value+Theory&hl=en&as_sdt=0,44", "gs_version_total": 4, "aff_unique_index": "0;0", "aff_unique_norm": "University of Tokyo", "aff_unique_dep": "", "aff_unique_url": "https://www.u-tokyo.ac.jp", "aff_unique_abbr": "UTokyo", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "Japan" }, { "title": "The Marginal Value of Momentum for Small Learning Rate SGD", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19521", "id": "3JjJezzVkT", "author_site": "Runzhe Wang, Sadhika Malladi, Tianhao Wang, Kaifeng Lyu, Zhiyuan Li", "tldr": "", "abstract": "Momentum is known to accelerate the convergence of gradient descent in strongly convex settings without stochastic gradient noise. In stochastic optimization, such as training neural networks, folklore suggests that momentum may help deep learning optimization by reducing the variance of the stochastic gradient update, but previous theoretical analyses do not find momentum to offer any provable acceleration. Theoretical results in this paper clarify the role of momentum in stochastic settings where the learning rate is small and gradient noise is the dominant source of instability, suggesting that SGD with and without momentum behave similarly in the short and long time horizons. 
Experiments show that momentum indeed has limited benefits for both optimization and generalization in practical training regimes where the optimal learning rate is not very large, including small- to medium-batch training from scratch on ImageNet and fine-tuning language models on downstream tasks.", "keywords": "momentum;SGD;dynamics", "primary_area": "optimization", "supplementary_material": "", "author": "Runzhe Wang;Sadhika Malladi;Tianhao Wang;Kaifeng Lyu;Zhiyuan Li", "authorids": "~Runzhe_Wang2;~Sadhika_Malladi2;~Tianhao_Wang1;~Kaifeng_Lyu2;~Zhiyuan_Li2", "gender": ";F;M;M;M", "homepage": "https://wang-runzhe.github.io;https://www.cs.princeton.edu/~smalladi/;https://tianhaowang.ttic.edu;https://kaifeng.ac/;https://zhiyuanli.ttic.edu", "dblp": ";176/9810;145/3288-2;220/3283;l/ZhiyuanLi", "google_scholar": ";9HCmTcwAAAAJ;m45LD1kAAAAJ;843JJtgAAAAJ;https://scholar.google.com/citations?hl=en", "orcid": ";;;;", "linkedin": ";;;;", "or_profile": "~Runzhe_Wang2;~Sadhika_Malladi2;~Tianhao_Wang1;~Kaifeng_Lyu2;~Zhiyuan_Li2", "aff": "Princeton University;Princeton University;Yale University;Princeton University;Toyota Technological Institute at Chicago", "aff_domain": "princeton.edu;princeton.edu;yale.edu;princeton.edu;ttic.edu", "position": "PhD student;PhD student;PhD student;PhD student;Assistant Professor", "bibtex": "@inproceedings{\nwang2024the,\ntitle={The Marginal Value of Momentum for Small Learning Rate {SGD}},\nauthor={Runzhe Wang and Sadhika Malladi and Tianhao Wang and Kaifeng Lyu and Zhiyuan Li},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=3JjJezzVkT}\n}", "github": "", "project": "", "reviewers": "EHVB;ReS6;fSFX;RZuq", "pdf_size": 997611, "rating": "5;5;6;6", "confidence": "3;3;3;3", "soundness": "2;3;3;3", "contribution": "2;2;3;3", "presentation": "3;2;3;3", "wc_summary": "89;31;104;92", "wc_strengths": "174;38;98;44", "wc_weaknesses": "411;98;27;85", "wc_questions": "2;32;143;65", "wc_review": "676;199;372;286", "wc_reply_reviewers": "139;0;0;0", "wc_reply_authors": "764;586;269;463", "reply_reviewers": "1;0;0;0", "reply_authors": "2;1;1;1", "rating_avg": [ 5.5, 0.5 ], "confidence_avg": [ 3.0, 0.0 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 79.0, 28.275431031197385 ], "wc_strengths_avg": [ 88.5, 54.61455849862745 ], "wc_weaknesses_avg": [ 155.25, 150.05728072972667 ], "wc_questions_avg": [ 60.5, 52.58564442887431 ], "wc_review_avg": [ 383.25, 179.74617520270075 ], "wc_reply_reviewers_avg": [ 34.75, 60.188765563018485 ], "wc_reply_authors_avg": [ 520.5, 180.37530318754838 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 12, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11356245156123228102&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=3JjJezzVkT", "pdf": "https://openreview.net/pdf?id=3JjJezzVkT", "email": "princeton.edu;princeton.edu;yale.edu;princeton.edu;ttic.edu", "author_num": 5, "aff_unique_index": "0;0;1;0;2", "aff_unique_norm": "Princeton University;Yale University;Toyota Technological Institute at Chicago", "aff_unique_dep": ";;", "aff_unique_url": "https://www.princeton.edu;https://www.yale.edu;https://www.tti-chicago.org", "aff_unique_abbr": 
"Princeton;Yale;TTI Chicago", "aff_campus_unique_index": "1", "aff_campus_unique": ";Chicago", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "3Jl0sjmZx9", "title": "Large Multimodal Model for Real-World Radiology Report Generation", "track": "main", "status": "Reject", "tldr": "", "abstract": "While automatic report generation has demonstrated promising results using deep learning-based methods, deploying these algorithms in real-world scenarios remains challenging. Compared to conventional report generation, real-world report generation requires model to follow the instruction from the radiologists and consider contextual information. Thus, this paper focuses on developing a practical report generation method that supports real-world clinical practice. To tackle the challenges posed by the limited availability of clinical data, we propose a GPT-based unified data generation pipeline designed to produce high-quality data. Consequently, we present a new benchmark dataset MIMIC-R3G, comprising five representative tasks pertinent to real-world medical report generation. We propose Domain-enhanced Multi-modal Model (DeMMo), where an additional medical domain vision encoder is incorporated into the general domain multimodal LLM to enhance its ability on specific domains. This approach aims to harness the specialized capabilities of the medical domain vision encoder while leveraging the robustness and versatility of the general domain multi-modal LLM. Comprehensive experiments demonstrate that our approach attains competitive performance across all real-world tasks compared to existing interactive report generation frameworks and state-of-the-art encoder-decoder style report generation models.", "keywords": "Report Generation;Large Vision Language Model", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Brian Nlong Zhao;XINYANG JIANG;Xufang Luo;Yifan Yang;Bo Li;Zilong Wang;Javier Alvarez-Valle;Matthew P. 
Lungren;Dongsheng Li;Lili Qiu", "authorids": "~Brian_Nlong_Zhao1;~XINYANG_JIANG2;~Xufang_Luo1;~Yifan_Yang9;~Bo_Li23;~Zilong_Wang8;~Javier_Alvarez-Valle1;~Matthew_P._Lungren1;~Dongsheng_Li2;~Lili_Qiu1", "gender": "M;M;F;M;M;M;M;;M;F", "homepage": ";;;https://www.microsoft.com/en-us/research/people/yifanyang/;https://www.brianboli.com/;;;;http://recmind.cn;https://www.cs.utexas.edu/~lili/", "dblp": "205/7046.html;155/6316;218/7350;83/89-4;50/3402-80;42/898-6;281/7037;;254/0830-2.html;", "google_scholar": "IhqFMeUAAAAJ;JiTfWVMAAAAJ;;;1_zc1-IAAAAJ;;https://scholar.google.co.uk/citations?user=ojoRDc4AAAAJ;z1UtMSYAAAAJ;VNg5rA8AAAAJ;https://scholar.google.com.tw/citations?user=16posrQAAAAJ", "orcid": ";;;;;0000-0002-6760-1471;0000-0003-0906-4177;;0000-0003-3103-8442;", "linkedin": ";xinyang-jiang-ab5416b0/;;yifyang/;brianbo1121/;;javieralvarezvalle/;;;", "or_profile": "~Brian_Nlong_Zhao1;~XINYANG_JIANG2;~Xufang_Luo1;~Yifan_Yang9;~Bo_Li23;~Zilong_Wang8;~Javier_Alvarez-Valle1;~Matthew_P._Lungren1;~Dongsheng_Li2;~Lili_Qiu1", "aff": "Microsoft Research Asia;Microsoft;Microsoft Research;Microsoft;Nanyang Technological University;Microsoft Research;Microsoft;Microsoft;Microsoft Research Asia;University of Texas at Austin", "aff_domain": "microsoft.com;microsoft.com;microsoft.com;microsoft.com;ntu.edu.sg;microsoft.com;microsoft.com;microsoft.com;microsoft.com;cs.utexas.edu", "position": "Intern;Senior Researcher;Researcher;Researcher;PhD student;Researcher;Senior Director of Biomedical Imaging;Principal Researcher;Principal Researcher;Full Professor", "bibtex": "@misc{\nzhao2024large,\ntitle={Large Multimodal Model for Real-World Radiology Report Generation},\nauthor={Brian Nlong Zhao and XINYANG JIANG and Xufang Luo and Yifan Yang and Bo Li and Zilong Wang and Javier Alvarez-Valle and Matthew P. 
Lungren and Dongsheng Li and Lili Qiu},\nyear={2024},\nurl={https://openreview.net/forum?id=3Jl0sjmZx9}\n}", "github": "", "project": "", "reviewers": "watP;8G3W;GGyY;NXpC;uSN9", "site": "https://openreview.net/forum?id=3Jl0sjmZx9", "pdf_size": 22146813, "rating": "3;5;5;5;8", "confidence": "5;4;4;4;2", "soundness": "1;2;3;2;3", "contribution": "1;2;2;2;3", "presentation": "1;3;3;3;4", "wc_summary": "50;41;72;85;50", "wc_strengths": "21;36;89;50;60", "wc_weaknesses": "86;97;177;313;31", "wc_questions": "19;115;162;36;44", "wc_review": "176;289;500;484;185", "wc_reply_reviewers": "0;0;0;254;0", "wc_reply_authors": "620;680;845;1646;173", "reply_reviewers": "0;0;0;1;0", "reply_authors": "1;1;2;3;1", "rating_avg": [ 5.2, 1.6 ], "confidence_avg": [ 3.8, 0.9797958971132712 ], "soundness_avg": [ 2.2, 0.7483314773547882 ], "contribution_avg": [ 2.0, 0.6324555320336759 ], "presentation_avg": [ 2.8, 0.9797958971132712 ], "wc_summary_avg": [ 59.6, 16.304600577751057 ], "wc_strengths_avg": [ 51.2, 23.025203582161875 ], "wc_weaknesses_avg": [ 140.8, 97.91915032311096 ], "wc_questions_avg": [ 75.2, 54.38161454021019 ], "wc_review_avg": [ 326.8, 140.703091650468 ], "wc_reply_reviewers_avg": [ 50.8, 101.6 ], "wc_reply_authors_avg": [ 792.8, 481.1259294613002 ], "reply_reviewers_avg": [ 0.2, 0.4 ], "reply_authors_avg": [ 1.6, 0.8 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 10, 0 ], "corr_rating_confidence": -0.9951052080056662, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=2585879695080037135&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 0, "aff_unique_index": "0;0;0;0;1;0;0;0;0;2", "aff_unique_norm": "Microsoft;Nanyang Technological University;University of Texas at Austin", "aff_unique_dep": "Research;;", "aff_unique_url": "https://www.microsoft.com/en-us/research/group/asia;https://www.ntu.edu.sg;https://www.utexas.edu", "aff_unique_abbr": "MSR Asia;NTU;UT Austin", "aff_campus_unique_index": "0;0;2", "aff_campus_unique": "Asia;;Austin", "aff_country_unique_index": "0;1;1;1;2;1;1;1;0;1", "aff_country_unique": "China;United States;Singapore" }, { "id": "3JoQqW35GQ", "title": "Training-free Linear Image Inversion via Flows", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Training-free linear inversion involves the use of a pretrained generative model and---through appropriate modifications to the generation process---solving inverse problems without any finetuning of the generative model. \nWhile recent prior methods have explored the use of diffusion models, they still require the manual tuning of many hyperparameters for different inverse problems. 
\nIn this work, we propose a training-free method for image inversion using pretrained flow models, leveraging the simplicity and efficiency of Flow Matching models, using theoretically-justified weighting schemes and thereby significantly reducing the amount of manual tuning.\nIn particular, we draw inspiration from two main sources: adopting prior gradient correction methods to the flow regime, and a solver scheme based on conditional Optimal Transport paths.\nAs pretrained diffusion models are widely accessible, we also show how to practically adapt diffusion models for our method.\nEmpirically, our approach requires no problem-specific tuning across an extensive suite of noisy linear image inversion problems on high-dimensional datasets, ImageNet-64/128 and AFHQ-256, and we observe that our flow-based method for image inversion significantly improves upon closely-related diffusion-based linear inversion methods.", "keywords": "inverse problems;linear image inversion;continuous normalizing flows;flow matching;diffusion models", "primary_area": "generative models", "supplementary_material": "", "author": "Ashwini Pokle;Matthew J. Muckley;Ricky T. Q. Chen;Brian Karrer", "authorids": "~Ashwini_Pokle1;~Matthew_J._Muckley1;~Ricky_T._Q._Chen1;~Brian_Karrer1", "gender": "F;M;M;M", "homepage": "https://ashwinipokle.github.io/;https://mmuckley.github.io/;;http://www.rtqichen.com", "dblp": "228/5527;158/8226;27/7164;228/6698", "google_scholar": "o_1YtVoAAAAJ;Iz9v6dcAAAAJ;Wewcpo4AAAAJ;7MxQd6UAAAAJ", "orcid": ";0000-0002-6525-8817;;", "linkedin": ";matthew-muckley-33a9b558/;;", "or_profile": "~Ashwini_Pokle1;~Matthew_J._Muckley1;~Brian_Karrer1;~Tian_Qi_Chen2", "aff": "Carnegie Mellon University;Meta;Meta Fundamental AI Research (FAIR);FAIR Labs, Meta AI", "aff_domain": "andrew.cmu.edu;fb.com;meta.com;meta.com", "position": "PhD student;Research Engineer;Researcher;Researcher", "bibtex": "@misc{\npokle2024trainingfree,\ntitle={Training-free Linear Image Inversion via Flows},\nauthor={Ashwini Pokle and Matthew J. Muckley and Ricky T. Q. 
Chen and Brian Karrer},\nyear={2024},\nurl={https://openreview.net/forum?id=3JoQqW35GQ}\n}", "github": "", "project": "", "reviewers": "pako;tnhX;STfT;4dCg", "site": "https://openreview.net/forum?id=3JoQqW35GQ", "pdf_size": 46014074, "rating": "6;8;8;8", "confidence": "5;4;3;3", "soundness": "3;3;4;3", "contribution": "2;3;4;3", "presentation": "3;3;4;2", "wc_summary": "62;63;46;48", "wc_strengths": "50;26;59;74", "wc_weaknesses": "174;63;63;82", "wc_questions": "161;2;15;26", "wc_review": "447;154;183;230", "wc_reply_reviewers": "24;0;0;70", "wc_reply_authors": "1694;108;260;266", "reply_reviewers": "1;0;0;1", "reply_authors": "3;1;1;3", "rating_avg": [ 7.5, 0.8660254037844386 ], "confidence_avg": [ 3.75, 0.82915619758885 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 3.0, 0.7071067811865476 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 54.75, 7.790218225441442 ], "wc_strengths_avg": [ 52.25, 17.41228014936585 ], "wc_weaknesses_avg": [ 95.5, 45.98097432634502 ], "wc_questions_avg": [ 51.0, 64.07417576528005 ], "wc_review_avg": [ 253.5, 114.96195022702076 ], "wc_reply_reviewers_avg": [ 23.5, 28.578838324886476 ], "wc_reply_authors_avg": [ 582.0, 645.127894296937 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 2.0, 1.0 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.8703882797784891, "gs_citation": 14, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=13056289113879813403&as_sdt=400005&sciodt=0,14&hl=en", "gs_version_total": 0, "aff_unique_index": "0;1;1;1", "aff_unique_norm": "Carnegie Mellon University;Meta", "aff_unique_dep": ";Meta Platforms, Inc.", "aff_unique_url": "https://www.cmu.edu;https://meta.com", "aff_unique_abbr": "CMU;Meta", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "id": "3K3aWRpRNq", "title": "Reducing Atomic Clashes in Geometric Diffusion Models for 3D Structure-Based Drug Design", "track": "main", "status": "Reject", "tldr": "", "abstract": "In the domain of Three-dimensional Structure-Based Drug Design (3D SBDD), the 3D spatial structures of target pockets serve as inputs for the generation of molecular geometric graphs. The Geometric Diffusion Model (GDM) has been recognized as the state-of-the-art (SOTA) method in 3D SBDD, attributed to its exceptional generation capabilities on geometric graphs. However, the inherent data-driven nature of GDM occasionally neglects critical inter-molecular interactions, such as Van der Waals force and Hydrogen Bonding. Such omissions could produce molecules that violate established physical principles. Particular evidence is that GDMs exhibit atomic clashes during generation due to the overly close proximity of generated molecules to protein structures. To address this, our paper introduces a novel constrained sampling process designed to obviate such undesirable collisions. By integrating a non-convex constraint within the current Langevin Dynamics (LD) of GDM and utilizing the proximal regularization techniques, we force molecular coordinates to obey the imposed physical constraints. Notably, the proposed method requires no modifications to the training process of GDMs. 
Empirical evaluations show a significant reduction in atomic clashes via the proposed method compared to the original LD process of GDMs.", "keywords": "Structure Based Drug Design;Geometric Molecular Generation;Diffusion Models", "primary_area": "generative models", "supplementary_material": "", "author": "Jian Ma;Peilin Zhao;Tingyang Xu;Qifeng Bai", "authorids": "~Jian_Ma8;~Peilin_Zhao2;~Tingyang_Xu1;~Qifeng_Bai1", "gender": "M;;M;M", "homepage": "https://github.com/small-jian-house;;;https://molaical.github.io", "dblp": ";84/8411;157/0940;", "google_scholar": ";https://scholar.google.com.hk/citations?user=HPeX_YcAAAAJ;6gIs5YMAAAAJ;https://scholar.google.com.hk/citations?user=7w7Vwh0AAAAJ", "orcid": ";0000-0001-8543-3953;0009-0002-0106-8376;0000-0002-8498-0936", "linkedin": ";;;", "or_profile": "~Jian_Ma8;~Peilin_Zhao2;~Tingyang_Xu1;~Qifeng_Bai1", "aff": "Lanzhou University;Tencent;Tencent AI Lab;Lanzhou University", "aff_domain": "lzu.edu.cn;tencent.com;tencent.com;lzu.edu.cn", "position": "MS student;Researcher;Researcher;Full Professor", "bibtex": "@misc{\nma2024reducing,\ntitle={Reducing Atomic Clashes in Geometric Diffusion Models for 3D Structure-Based Drug Design},\nauthor={Jian Ma and Peilin Zhao and Tingyang Xu and Qifeng Bai},\nyear={2024},\nurl={https://openreview.net/forum?id=3K3aWRpRNq}\n}", "github": "", "project": "", "reviewers": "2tn2;7c1E;xcbL;F9wF", "site": "https://openreview.net/forum?id=3K3aWRpRNq", "pdf_size": 10540917, "rating": "3;3;3;6", "confidence": "3;4;3;4", "soundness": "2;2;2;2", "contribution": "2;1;2;2", "presentation": "2;2;1;2", "wc_summary": "77;107;68;95", "wc_strengths": "10;33;73;132", "wc_weaknesses": "145;71;235;61", "wc_questions": "1;27;42;125", "wc_review": "233;238;418;413", "wc_reply_reviewers": "49;0;77;20", "wc_reply_authors": "641;329;772;443", "reply_reviewers": "1;0;1;1", "reply_authors": "2;1;2;1", "rating_avg": [ 3.75, 1.299038105676658 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 1.75, 0.4330127018922193 ], "wc_summary_avg": [ 86.75, 15.20485119953497 ], "wc_strengths_avg": [ 62.0, 46.27634384866635 ], "wc_weaknesses_avg": [ 128.0, 69.77822009767804 ], "wc_questions_avg": [ 48.75, 46.40245144386232 ], "wc_review_avg": [ 325.5, 90.03471552684553 ], "wc_reply_reviewers_avg": [ 36.5, 29.159046623646667 ], "wc_reply_authors_avg": [ 546.25, 171.60911252028546 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.5773502691896257, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5797390712744065041&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 0, "aff_unique_index": "0;1;1;0", "aff_unique_norm": "Lanzhou University;Tencent", "aff_unique_dep": ";Tencent Holdings Limited", "aff_unique_url": "https://www.lzu.edu.cn;https://www.tencent.com", "aff_unique_abbr": "LZU;Tencent", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "China" }, { "title": "On Representation Complexity of Model-based and Model-free Reinforcement Learning", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19520", "id": "3K3s9qxSn7", "author_site": "Hanlin Zhu, Baihe Huang, Stuart Russell", "tldr": "", "abstract": "We study the representation complexity of model-based and model-free reinforcement learning (RL) in the context of 
circuit complexity. We prove theoretically that there exists a broad class of MDPs such that their underlying transition and reward functions can be represented by constant depth circuits with polynomial size, while the optimal $Q$-function suffers an exponential circuit complexity in constant-depth circuits. By drawing attention to the approximation errors and building connections to complexity theory, our theory provides unique insights into why model-based algorithms usually enjoy better sample complexity than model-free algorithms from a novel representation complexity perspective: in some cases, the ground-truth rule (model) of the environment is simple to represent, while other quantities, such as $Q$-function, appear complex. We empirically corroborate our theory by comparing the approximation error of the transition kernel, reward function, and optimal $Q$-function in various Mujoco environments, which demonstrates that the approximation errors of the transition kernel and reward function are consistently lower than those of the optimal $Q$-function. To the best of our knowledge, this work is the first to study the circuit complexity of RL, which also provides a rigorous framework for future research.", "keywords": "model-based and model-free RL;representation complexity;circuit complexity;approximation error", "primary_area": "learning theory", "supplementary_material": "/attachment/636c407cfdbdbea5f6bf0356c85553601435ca7d.pdf", "author": "Hanlin Zhu;Baihe Huang;Stuart Russell", "authorids": "~Hanlin_Zhu2;~Baihe_Huang1;~Stuart_Russell1", "gender": "M;;M", "homepage": "https://hanlinzhu.com/;;https://people.eecs.berkeley.edu/~russell/", "dblp": ";279/4131;", "google_scholar": "yDVn5LEAAAAJ;chICXXMAAAAJ;https://scholar.google.com.tw/citations?user=KJGrjCAAAAAJ", "orcid": ";;", "linkedin": ";;", "or_profile": "~Hanlin_Zhu2;~Baihe_Huang1;~Stuart_Russell1", "aff": "Electrical Engineering & Computer Science Department, University of California Berkeley;University of California, Berkeley;University of California, Berkeley", "aff_domain": "eecs.berkeley.edu;berkeley.edu;berkeley.edu", "position": "PhD student;PhD student;Full Professor", "bibtex": "@inproceedings{\nzhu2024on,\ntitle={On Representation Complexity of Model-based and Model-free Reinforcement Learning},\nauthor={Hanlin Zhu and Baihe Huang and Stuart Russell},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=3K3s9qxSn7}\n}", "github": "", "project": "", "reviewers": "kBCH;zTQ7;9wTj", "pdf_size": 6585554, "rating": "5;6;8", "confidence": "2;4;2", "soundness": "2;3;3", "contribution": "2;3;3", "presentation": "3;3;3", "wc_summary": "101;86;77", "wc_strengths": "77;42;34", "wc_weaknesses": "34;111;46", "wc_questions": "14;97;33", "wc_review": "226;336;190", "wc_reply_reviewers": "13;143;24", "wc_reply_authors": "456;959;424", "reply_reviewers": "1;2;1", "reply_authors": "2;2;2", "rating_avg": [ 6.333333333333333, 1.247219128924647 ], "confidence_avg": [ 2.6666666666666665, 0.9428090415820634 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 88.0, 9.899494936611665 ], "wc_strengths_avg": [ 51.0, 18.672618098881223 ], "wc_weaknesses_avg": [ 63.666666666666664, 33.82635395992631 ], "wc_questions_avg": [ 48.0, 35.505868059613285 ], "wc_review_avg": [ 250.66666666666666, 62.10385566845982 ], "wc_reply_reviewers_avg": [ 60.0, 
58.86141916966211 ], "wc_reply_authors_avg": [ 613.0, 245.00748287892486 ], "reply_reviewers_avg": [ 1.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 2.0, 0.0 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.18898223650461365, "gs_citation": 7, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=7439446087400089778&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 8, "openreview": "https://openreview.net/forum?id=3K3s9qxSn7", "pdf": "https://openreview.net/pdf?id=3K3s9qxSn7", "email": "eecs.berkeley.edu;berkeley.edu;berkeley.edu", "author_num": 3, "aff_unique_index": "0;0;0", "aff_unique_norm": "University of California, Berkeley", "aff_unique_dep": "Electrical Engineering & Computer Science Department", "aff_unique_url": "https://www.berkeley.edu", "aff_unique_abbr": "UC Berkeley", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Berkeley", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "title": "The Reasonableness Behind Unreasonable Translation Capability of Large Language Model", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19519", "id": "3KDbIWT26J", "author_site": "Tingchen Fu, lemao liu, Deng Cai, Guoping Huang, Shuming Shi, Rui Yan", "tldr": "", "abstract": "Multilingual large language models trained on non-parallel data yield impressive translation capabilities. Existing studies demonstrate that incidental sentence-level bilingualism within pre-training data contributes to the LLM's translation abilities. However, it has also been observed that LLM's translation capabilities persist even when incidental sentence-level bilingualism are excluded from the training corpus.\nIn this study, we comprehensively investigate the unreasonable effectiveness and the underlying mechanism for LLM's translation abilities, specifically addressing the question why large language models learn to translate without parallel data, using the BLOOM model series as a representative example. Through extensive experiments, our findings suggest the existence of unintentional bilingualism in the pre-training corpus, especially word alignment data significantly contributes to the large language model's acquisition of translation ability. Moreover, the translation signal derived from word alignment data is comparable to that from sentence-level bilingualism. Additionally, we study the effects of monolingual data and parameter-sharing in assisting large language model to learn to translate. 
Together, these findings present another piece of the broader puzzle of trying to understand how large language models acquire translation capability.", "keywords": "large language model;translation;unintentional bilingualism", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Tingchen Fu;Lemao Liu;Deng Cai;Guoping Huang;Shuming Shi;Rui Yan", "authorids": "~Tingchen_Fu1;~Lemao_Liu3;~Deng_Cai1;~Guoping_Huang2;~Shuming_Shi1;~Rui_Yan2", "gender": "M;M;M;M;M;M", "homepage": ";https://jcyk.github.io/;;;https://gsai.ruc.edu.cn/english/ruiyan;https://lemaoliu.github.io/homepage/", "dblp": "318/0986;c/DCai-2;165/3047;s/ShumingShi;19/2405-1;41/10887.html", "google_scholar": ";KpbRLYcAAAAJ;xSkkA7UAAAAJ;Lg31AKMAAAAJ;eLw6g-UAAAAJ;", "orcid": ";;;;0000-0002-3356-6823;", "linkedin": "%E5%BB%B7%E7%90%9B-%E4%BB%98-b00435181/;;guoping-huang-473708b9/;;;", "or_profile": "~Tingchen_Fu1;~Deng_Cai1;~Guoping_Huang2;~Shuming_Shi1;~Rui_Yan2;~lemao_liu1", "aff": "Renmin University of China;Tencent AI Lab;;Tencent AI Lab;Renmin University of China;Tencent", "aff_domain": "ruc.edu.cn;tencent.com;;tencent.com;ruc.edu.cn;tencent.com", "position": "MS student;Research Scientist;;Principal Researcher;Associate Professor;Researcher", "bibtex": "@inproceedings{\nfu2024the,\ntitle={The Reasonableness Behind Unreasonable Translation Capability of Large Language Model},\nauthor={Tingchen Fu and Lemao Liu and Deng Cai and Guoping Huang and Shuming Shi and Rui Yan},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=3KDbIWT26J}\n}", "github": "", "project": "", "reviewers": "5xLr;6ach;stf2;ZA8F", "pdf_size": 574040, "rating": "5;6;6;6", "confidence": "3;4;4;3", "soundness": "3;3;3;3", "contribution": "3;3;3;3", "presentation": "3;3;4;3", "wc_summary": "134;26;85;90", "wc_strengths": "87;17;131;26", "wc_weaknesses": "65;31;191;192", "wc_questions": "98;317;190;23", "wc_review": "384;391;597;331", "wc_reply_reviewers": "0;37;0;0", "wc_reply_authors": "580;1886;1043;1185", "reply_reviewers": "0;1;0;0", "reply_authors": "1;4;2;2", "rating_avg": [ 5.75, 0.4330127018922193 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 83.75, 38.408169703853375 ], "wc_strengths_avg": [ 65.25, 46.54231945230061 ], "wc_weaknesses_avg": [ 119.75, 72.75085910145667 ], "wc_questions_avg": [ 157.0, 109.68819444224616 ], "wc_review_avg": [ 425.75, 101.55632673546242 ], "wc_reply_reviewers_avg": [ 9.25, 16.021469970012117 ], "wc_reply_authors_avg": [ 1173.5, 468.2576747902804 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 2.25, 1.0897247358851685 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.5773502691896257, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=15514343039983960443&as_sdt=400005&sciodt=0,14&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=3KDbIWT26J", "pdf": "https://openreview.net/pdf?id=3KDbIWT26J", "email": "ruc.edu.cn;tencent.com;;tencent.com;ruc.edu.cn;tencent.com", "author_num": 6, "aff_unique_index": "0;1;1;0;1", "aff_unique_norm": "Renmin University of China;Tencent", "aff_unique_dep": ";Tencent AI Lab", "aff_unique_url": "http://www.ruc.edu.cn;https://ai.tencent.com", "aff_unique_abbr": "RUC;Tencent AI Lab", 
"aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "China" }, { "id": "3KmfUE31sc", "title": "Reconstruction as Sequence for Efficient Unified Unsupervised Anomaly Detection", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Unsupervised anomaly detection is highly desirable in industrial manufacturing processes due to the rarity of anomalies in real-world scenarios. Recent research has been focused on developing a unified framework for achieving multi-class anomaly detection. However, existing advanced feature-reconstruction-based methods often suffer from a lack of sufficient contextual awareness, thereby compromising the quality of the reconstruction. To address this challenge, we introduce a novel Reconstruction as Sequence (RAS) framework, which enhances the contextual correspondence during feature reconstruction through a sequence modelling perspective. In particular, based on the transformer technique, we integrate a specialized RASFormer block into the RAS framework. This block enables the capture of spatial relationships among different image regions and enhances temporal dependencies throughout the reconstruction process. By incorporating the RASFormer block, our RAS method achieves superior contextual awareness capabilities, leading to exceptional performance and faster inference speed. Experimental results show that our proposed RAS method significantly outperforms competing methods while exhibiting a maximal improvement of 29\\% in inference throughput. These results indicate the best trade-off between effectiveness and efficiency, further demonstrating the superiority and practicality of our method.", "keywords": "Anomaly Detection;Reconstruction;Transformer;Unsupervised Learning", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Hui-Yue Yang;Hui Chen;Zijia Lin;Jungong Han;Guiguang Ding", "authorids": "~Hui-Yue_Yang2;~Hui_Chen7;~Zijia_Lin1;~Jungong_Han1;~Guiguang_Ding1", "gender": ";M;M;M;M", "homepage": ";https://huichen24.github.io/;https://sites.google.com/site/linzijia72/;https://jungonghan.github.io/;http://ise.thss.tsinghua.edu.cn/MIG/dgg.html", "dblp": ";;78/9911;98/6127;51/740", "google_scholar": ";erpvWcIAAAAJ;ghUYrHkAAAAJ;hNi1gxAAAAAJ;https://scholar.google.com.tw/citations?user=B7F3yt4AAAAJ", "orcid": "0000-0002-9458-5788;0000-0003-4180-5801;0000-0002-1390-7424;0000-0003-4361-956X;0000-0003-0137-9975", "linkedin": ";;;;", "or_profile": "~Hui-Yue_Yang2;~Hui_Chen7;~Zijia_Lin1;~Jungong_Han1;~Guiguang_Ding1", "aff": "Tsinghua University;Tsinghua University;Kuaishou Technology;University of Sheffield;Tsinghua University", "aff_domain": "tsinghua.edu.cn;mail.tsinghua.edu.cn;kuaishou.com;sheffield.ac.uk;tsinghua.edu.cn", "position": "PhD student;Researcher;NLP expert;Full Professor;Full Professor", "bibtex": "@misc{\nyang2024reconstruction,\ntitle={Reconstruction as Sequence for Efficient Unified Unsupervised Anomaly Detection},\nauthor={Hui-Yue Yang and Hui Chen and Zijia Lin and Jungong Han and Guiguang Ding},\nyear={2024},\nurl={https://openreview.net/forum?id=3KmfUE31sc}\n}", "github": "", "project": "", "reviewers": "xekD;rUeR;5D2p;m5gg", "site": "https://openreview.net/forum?id=3KmfUE31sc", "pdf_size": 1272973, "rating": "3;3;5;6", "confidence": "5;4;4;4", "soundness": "3;2;3;3", "contribution": "2;1;2;3", "presentation": "3;3;2;3", "wc_summary": "45;186;78;70", "wc_strengths": 
"14;37;27;54", "wc_weaknesses": "162;252;87;198", "wc_questions": "9;7;1;8", "wc_review": "230;482;193;330", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.25, 1.299038105676658 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 94.75, 54.07113370366854 ], "wc_strengths_avg": [ 33.0, 14.611639196202457 ], "wc_weaknesses_avg": [ 174.75, 59.93903152370749 ], "wc_questions_avg": [ 6.25, 3.112474899497183 ], "wc_review_avg": [ 308.75, 111.87800275299877 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.5555555555555555, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:BSrZnEDOxKIJ:scholar.google.com/&scioq=Reconstruction+as+Sequence+for+Efficient+Unified+Unsupervised+Anomaly+Detection&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;1;2;0", "aff_unique_norm": "Tsinghua University;Kuaishou Technology;University of Sheffield", "aff_unique_dep": ";;", "aff_unique_url": "https://www.tsinghua.edu.cn;https://www.kuaishou.com;https://www.sheffield.ac.uk", "aff_unique_abbr": "THU;Kuaishou;Sheffield", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;1;0", "aff_country_unique": "China;United Kingdom" }, { "id": "3LFy3dUS86", "title": "P2RBOX:A SINGLE POINT IS ALL YOU NEED TRAINING ORIENTED OBJECT DETECTOR", "track": "main", "status": "Reject", "tldr": "", "abstract": "Oriented object detection, a specialized subfield in computer vision, finds applications across diverse scenarios, excelling particularly when dealing with objects of arbitrary orientations. Conversely, point annotation, which treats objects as single points, offers a cost-effective alternative to rotated and horizontal bounding boxes but sacrifices performance due to the loss of size and orientation information. In this study, we introduce the P2RBox network, which leverages point annotations and a mask generator to create mask proposals, followed by filtration through our Inspector Module and Constrainer Module. This process selects high-quality masks, which are subsequently converted into rotated box annotations for training a fully supervised detector. Specifically, we've thoughtfully crafted an Inspector Module rooted in multi-instance learning principles to evaluate the semantic score of masks. We've also proposed a more robust mask quality assessment in conjunction with the Constrainer Module. Furthermore, we've introduced a Symmetry Axis Estimation (SAE) Module inspired by the spectral theorem for symmetric matrices to transform the top-performing mask proposal into rotated bounding boxes. P2RBox performs well with three fully supervised rotated object detectors: RetinaNet, Rotated FCOS, and Oriented R-CNN. By combining with Oriented R-CNN, P2RBox achieves 62.26% on DOTA-v1.0 test dataset. 
As far as we know, this is the first attempt at training an oriented object detector with point supervision.", "keywords": "point-supervised rotated object detector", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/12da55ba9240a7bc4fe02052990810b9ddb2cb5d.pdf", "author": "Guangming Cao;Xuehui Yu;Wenwen Yu;Xumeng Han;Guorong Li;Jianbin Jiao;Zhenjun Han", "authorids": "~Guangming_Cao1;~Xuehui_Yu1;~Wenwen_Yu2;~Xumeng_Han1;~Guorong_Li1;~Jianbin_Jiao1;~Zhenjun_Han1", "gender": "M;;M;F;M;M;M", "homepage": "https://github.com/guangminglftg;http://vision.ucas.ac.cn/;;https://people.ucas.edu.cn/~GuorongLi?language=en;http://lamp.ucas.ac.cn/;https://people.ucas.ac.cn/~hanzhj;https://yinglang.github.io/", "dblp": ";;297/3745;28/4782;;11/2938;243/8603", "google_scholar": ";;https://scholar.google.cz/citations?user=LWu_FiQAAAAJ;AiuGlVQAAAAJ;;0rK4yTcAAAAJ;WYrxoBEAAAAJ", "orcid": ";;0000-0002-1636-463X;0000-0003-3954-2387;;;", "linkedin": ";;;;;;", "or_profile": "~Guangming_Cao1;~Wenwen_Yu2;~Xumeng_Han1;~Guorong_Li1;~Jianbin_Jiao1;~Zhenjun_Han1;~hui_ying2", "aff": "University of Chinese Academy of Sciences;University of Chinese Academy of Sciences;University of Chinese Academy of Sciences;University of Chinese Academy of Sciences;University of Chinese Academy of Sciences;University of Chinese Academy of Sciences;University of Chinese Academy of Sciences", "aff_domain": "ucas.ac.cn;ucas.ac.cn;ucas.ac.cn;ucas.ac.cn;ucas.ac.cn;ucas.ac.cn;mails.ucas.ac.cn", "position": "MS student;MS student;PhD student;Full Professor;Full Professor;Associate Professor;PhD student", "bibtex": "@misc{\ncao2024prboxa,\ntitle={P2{RBOX}:A {SINGLE} {POINT} {IS} {ALL} {YOU} {NEED} {TRAINING} {ORIENTED} {OBJECT} {DETECTOR}},\nauthor={Guangming Cao and Xuehui Yu and Wenwen Yu and Xumeng Han and Guorong Li and Jianbin Jiao and Zhenjun Han},\nyear={2024},\nurl={https://openreview.net/forum?id=3LFy3dUS86}\n}", "github": "", "project": "", "reviewers": "KHmW;4XWe;oNSm;a8aF;JsqB;hRnG", "site": "https://openreview.net/forum?id=3LFy3dUS86", "pdf_size": 7901729, "rating": "3;3;3;3;5;6", "confidence": "4;5;5;3;4;4", "soundness": "2;2;2;3;3;3", "contribution": "1;2;2;3;2;4", "presentation": "2;2;2;3;3;3", "wc_summary": "40;91;75;80;60;68", "wc_strengths": "20;50;66;24;58;97", "wc_weaknesses": "30;232;342;231;186;142", "wc_questions": "15;4;153;27;87;83", "wc_review": "105;377;636;362;391;390", "wc_reply_reviewers": "0;0;59;18;0;49", "wc_reply_authors": "228;645;652;464;577;439", "reply_reviewers": "0;0;1;1;0;1", "reply_authors": "1;1;1;1;1;1", "rating_avg": [ 3.8333333333333335, 1.2133516482134197 ], "confidence_avg": [ 4.166666666666667, 0.6871842709362768 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.3333333333333335, 0.9428090415820634 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 69.0, 16.14517471774978 ], "wc_strengths_avg": [ 52.5, 26.03683288471673 ], "wc_weaknesses_avg": [ 193.83333333333334, 95.20227004763186 ], "wc_questions_avg": [ 61.5, 51.87083316598388 ], "wc_review_avg": [ 376.8333333333333, 153.65265662815236 ], "wc_reply_reviewers_avg": [ 21.0, 24.358434541926815 ], "wc_reply_authors_avg": [ 500.8333333333333, 146.6599430277023 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.1665741511631924, "gs_citation": 0, "gs_cited_by_link": 
"https://scholar.google.com/scholar?q=related:1EacpzyPU6UJ:scholar.google.com/&scioq=P2RBOX:A+SINGLE+POINT+IS+ALL+YOU+NEED+TRAINING+ORIENTED+OBJECT+DETECTOR&hl=en&as_sdt=0,47", "gs_version_total": 0, "aff_unique_index": "0;0;0;0;0;0;0", "aff_unique_norm": "University of Chinese Academy of Sciences", "aff_unique_dep": "", "aff_unique_url": "http://www.ucas.ac.cn", "aff_unique_abbr": "UCAS", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0;0", "aff_country_unique": "China" }, { "id": "3LLkES6nNs", "title": "Infinitely Deep Residual Networks: Unveiling Wide Neural ODEs as Gaussian Processes", "track": "main", "status": "Reject", "tldr": "", "abstract": "While Neural Ordinary Differential Equations (Neural ODEs) have demonstrated practical numerical success, our theoretical understanding of them remains limited. Notably, we still lack convergence results and prediction performance estimates for Neural ODEs trained using gradient-based methods. Inspired by numerical analysis, one might investigate Neural ODEs by studying the limiting behavior of Residual Networks (ResNets) as depth $\\ell$ approaches to infinity. However, a significant challenge arises due to the prevalent use of shared parameters in Neural ODEs. Consequently, the corresponding ResNets possess \\textit{infinite depth} and \\textit{shared weights} across all layers. This characteristic prevents the direct application of methods relying on Stochastic Differential Equations (SDEs) to ResNets.\n\nIn this paper, we analyze Neural ODEs using an infinitely deep ResNet with shared weights. Our analysis is rooted in asymptotic analysis from random matrix theory (RMT). Consequently, we establish the Neural Network and Gaussian Process (NNGP) correspondence for Neural ODEs, regardless of whether the parameters are shared. Remarkably, the resulting Gaussian processes (GPs) exhibit distinct behaviors depending on the use of parameter sharing, setting them apart from other neural network architectures such as feed-forward, convolutional, and recurrent networks. Moreover, we prove that, in the presence of these divergent GPs, NNGP kernels are strictly positive definite when non-polynomial activation functions are applied. These findings lay the foundation for exploring the training and generalization of Neural ODEs, paving the way for future research in this domain. Additionally, we furnish an efficient dynamic programming algorithm for calculating the covariance matrix for given input data. 
Finally, we conduct a series of numerical experiments to support our theoretical findings.", "keywords": "Neural ODE;Gaussian Process;Neural Tangent Kernel;Neural Network and Gaussian Process Correspondence;Kernel Methods", "primary_area": "probabilistic methods (Bayesian methods, variational inference, sampling, UQ, etc.)", "supplementary_material": "/attachment/3c0d9fc08306e107fc3e5b73970b5ebd6b0cc75c.pdf", "author": "Tianxiang Gao;Xiaokai Huo;Hailiang Liu;Hongyang Gao", "authorids": "~Tianxiang_Gao2;~Xiaokai_Huo1;~Hailiang_Liu1;~Hongyang_Gao1", "gender": "M;M;M;M", "homepage": "https://gaotx-cs.github.io/;;https://faculty.sites.iastate.edu/hliu/;https://faculty.sites.iastate.edu/hygao/", "dblp": "118/3814;;;200/7985", "google_scholar": "iNLlIbQAAAAJ;;Wq7IGEIAAAAJ;jGmq0aEAAAAJ", "orcid": ";0000-0001-8131-2310;;0000-0002-9020-9080", "linkedin": ";;;hongyang-gao-74924690/", "or_profile": "~Tianxiang_Gao2;~Xiaokai_Huo1;~Hailiang_Liu1;~Hongyang_Gao1", "aff": "Iowa State University;Iowa State University;Iowa State University;Iowa State University", "aff_domain": "iastate.edu;iastate.edu;iastate.edu;iastate.edu", "position": "PhD student;Postdoc;Full Professor;Assistant Professor", "bibtex": "@misc{\ngao2024infinitely,\ntitle={Infinitely Deep Residual Networks: Unveiling Wide Neural {ODE}s as Gaussian Processes},\nauthor={Tianxiang Gao and Xiaokai Huo and Hailiang Liu and Hongyang Gao},\nyear={2024},\nurl={https://openreview.net/forum?id=3LLkES6nNs}\n}", "github": "", "project": "", "reviewers": "ECfA;igTL;CRfF;TYVT", "site": "https://openreview.net/forum?id=3LLkES6nNs", "pdf_size": 1664231, "rating": "3;3;5;6", "confidence": "3;3;3;3", "soundness": "2;3;3;3", "contribution": "2;2;2;3", "presentation": "1;3;2;2", "wc_summary": "29;21;101;52", "wc_strengths": "36;53;77;30", "wc_weaknesses": "43;73;157;154", "wc_questions": "91;3;277;45", "wc_review": "199;150;612;281", "wc_reply_reviewers": "36;0;201;10", "wc_reply_authors": "623;1050;1643;330", "reply_reviewers": "1;0;2;1", "reply_authors": "1;2;3;1", "rating_avg": [ 4.25, 1.299038105676658 ], "confidence_avg": [ 3.0, 0.0 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.0, 0.7071067811865476 ], "wc_summary_avg": [ 50.75, 31.163881337214722 ], "wc_strengths_avg": [ 49.0, 18.23458252881047 ], "wc_weaknesses_avg": [ 106.75, 49.90177852541931 ], "wc_questions_avg": [ 104.0, 104.61835403025609 ], "wc_review_avg": [ 310.5, 180.25329400596263 ], "wc_reply_reviewers_avg": [ 61.75, 81.4627982578551 ], "wc_reply_authors_avg": [ 911.5, 493.8747310806658 ], "reply_reviewers_avg": [ 1.0, 0.7071067811865476 ], "reply_authors_avg": [ 1.75, 0.82915619758885 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:xqrBVCds7aIJ:scholar.google.com/&scioq=Infinitely+Deep+Residual+Networks:+Unveiling+Wide+Neural+ODEs+as+Gaussian+Processes&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "Iowa State University", "aff_unique_dep": "", "aff_unique_url": "https://www.iastate.edu", "aff_unique_abbr": "ISU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "title": "CrIBo: Self-Supervised Learning via Cross-Image Object-Level Bootstrapping", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19518", "id": "3M0GXoUEzP", 
"author_site": "Tim Lebailly, Thomas Stegm\u00fcller, Behzad Bozorgtabar, Jean-Philippe Thiran, Tinne Tuytelaars", "tldr": "", "abstract": "Leveraging nearest neighbor retrieval for self-supervised representation learning has proven beneficial with object-centric images. However, this approach faces limitations when applied to scene-centric datasets, where multiple objects within an image are only implicitly captured in the global representation. Such global bootstrapping can lead to undesirable entanglement of object representations. Furthermore, even object-centric datasets stand to benefit from a finer-grained bootstrapping approach. In response to these challenges, we introduce a novel $\\textbf{Cr}$oss-$\\textbf{I}$mage Object-Level $\\textbf{Bo}$otstrapping method tailored to enhance dense visual representation learning. By employing object-level nearest neighbor bootstrapping throughout the training, CrIBo emerges as a notably strong and adequate candidate for in-context learning, leveraging nearest neighbor retrieval at test time. CrIBo shows state-of-the-art performance on the latter task while being highly competitive in more standard downstream segmentation tasks. Our code and pretrained models are publicly available at https://github.com/tileb1/CrIBo.", "keywords": "self-supervised learning;representation learning", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Tim Lebailly;Thomas Stegm\u00fcller;Behzad Bozorgtabar;Jean-Philippe Thiran;Tinne Tuytelaars", "authorids": "~Tim_Lebailly1;~Thomas_Stegm\u00fcller1;~Behzad_Bozorgtabar1;~Jean-Philippe_Thiran1;~Tinne_Tuytelaars1", "gender": "M;;M;M;", "homepage": ";https://people.epfl.ch/thomas.stegmuller?lang=en;https://behzadbozorgtabar.com/;https://people.epfl.ch/jean-philippe.thiran;", "dblp": "276/0970;313/9959;59/10419;t/JeanPhilippeThiran;", "google_scholar": "tQnods8AAAAJ;;kxAk6AoAAAAJ;mII-l2cAAAAJ;", "orcid": ";;0000-0002-5759-4896;0000-0003-2938-9657;", "linkedin": "tim-lebailly/;;behzad-bozorgtabar-72838560/;;", "or_profile": "~Tim_Lebailly1;~Thomas_Stegm\u00fcller1;~Behzad_Bozorgtabar1;~Jean-Philippe_Thiran1;~Tinne_Tuytelaars1", "aff": "Meta Facebook;EPFL - EPF Lausanne;Swiss Federal Institute of Technology Lausanne;University of Lausanne;", "aff_domain": "meta.com;epfl.ch;epfl.ch;unil.ch;", "position": "Intern;PhD student;Lecturer;Associate Professor;", "bibtex": "@inproceedings{\nlebailly2024cribo,\ntitle={Cr{IB}o: Self-Supervised Learning via Cross-Image Object-Level Bootstrapping},\nauthor={Tim Lebailly and Thomas Stegm{\\\"u}ller and Behzad Bozorgtabar and Jean-Philippe Thiran and Tinne Tuytelaars},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=3M0GXoUEzP}\n}", "github": "", "project": "", "reviewers": "w5sb;4jZr;sFy5;FBUq", "pdf_size": 8393658, "rating": "6;8;8;10", "confidence": "5;5;4;4", "soundness": "3;3;3;4", "contribution": "3;3;3;4", "presentation": "4;3;3;4", "wc_summary": "84;80;89;95", "wc_strengths": "82;93;113;105", "wc_weaknesses": "322;232;116;164", "wc_questions": "58;279;8;81", "wc_review": "546;684;326;445", "wc_reply_reviewers": "129;163;29;37", "wc_reply_authors": "1005;736;175;664", "reply_reviewers": "1;1;2;1", "reply_authors": "3;2;2;1", "rating_avg": [ 8.0, 1.4142135623730951 ], "confidence_avg": [ 4.5, 0.5 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 3.25, 0.4330127018922193 ], 
"presentation_avg": [ 3.5, 0.5 ], "wc_summary_avg": [ 87.0, 5.612486080160912 ], "wc_strengths_avg": [ 98.25, 11.776565713313877 ], "wc_weaknesses_avg": [ 208.5, 77.41285422977246 ], "wc_questions_avg": [ 106.5, 103.03033533867585 ], "wc_review_avg": [ 500.25, 131.5985847188335 ], "wc_reply_reviewers_avg": [ 89.5, 57.8338136387356 ], "wc_reply_authors_avg": [ 645.0, 299.6422867353672 ], "reply_reviewers_avg": [ 1.25, 0.4330127018922193 ], "reply_authors_avg": [ 2.0, 0.7071067811865476 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.7071067811865476, "gs_citation": 7, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11621237308825909642&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=3M0GXoUEzP", "pdf": "https://openreview.net/pdf?id=3M0GXoUEzP", "email": "meta.com;epfl.ch;epfl.ch;unil.ch;", "author_num": 5, "aff_unique_index": "0;1;2;3", "aff_unique_norm": "Meta;EPFL;Swiss Federal Institute of Technology Lausanne;University of Lausanne", "aff_unique_dep": "Meta Platforms, Inc.;;;", "aff_unique_url": "https://meta.com;https://www.epfl.ch;https://www.epfl.ch;https://www.unil.ch", "aff_unique_abbr": "Meta;EPFL;EPFL;UNIL", "aff_campus_unique_index": "1;1", "aff_campus_unique": ";Lausanne", "aff_country_unique_index": "0;1;1;1", "aff_country_unique": "United States;Switzerland" }, { "id": "3NMYMLL92j", "title": "Brain encoding models based on binding multiple modalities across audio, language, and vision", "track": "main", "status": "Reject", "tldr": "", "abstract": "Multimodal associative learning of sensory stimuli (images, text, audio) has created powerful representations for these modalities that work across a multitude of tasks with simple task heads without even (fine)tuning features on target datasets. Such representations are being increasingly used to study neural activity and understand how our brain responds to such stimuli. While previous work has focused on static images, deep understanding of a video involves not just recognizing the individual objects present in each frame, but also requires a detailed semantic description of their interactions over time and their narrative roles. In this paper, we seek to evaluate whether new multimodally aligned features (like ImageBind) are better than previous ones in explaining fMRI responses to external stimuli, thereby allowing for a better understanding of how the brain and its different areas process external stimuli, converting them into meaningful high-level understanding, and actionable signals. In addition, we explore whether generative AI based modality conversion helps to disentangle the semantic part of the visual stimulus allowing for a more granular localization of such processing in the brain. Towards this end, given a dataset of fMRI responses from subjects watching short video clips, we first generate detailed multi-event video captions. Next, we synthesize audio from these generated text captions using a text-to-speech model. Further, we use a joint embedding across different modalities (audio, text and video) using the recently proposed ImageBind model. We use this joint embedding to train encoding models that predict fMRI brain responses. We infer from our experimental findings and computational results that the visual system's primary goal may revolve around converting visual input into comprehensive semantic scene descriptions. 
Further, multimodal feature alignment helps obtain richer representations for all modalities (audio, text and video) leading to improved performance compared to unimodal representations across well-known multimodal processing brain regions.", "keywords": "Multimodal Transformers;fMRI;ImageBind;cognitive neuroscience;brain encoding;movie clips;NLP;language models", "primary_area": "applications to neuroscience & cognitive science", "supplementary_material": "", "author": "Khushbu Pahwa;SUBBA REDDY OOTA;Advaith Malladi;Maneesh Kumar Singh;Manish Gupta;Bapi Raju Surampudi", "authorids": "~Khushbu_Pahwa1;~SUBBA_REDDY_OOTA1;~Advaith_Malladi1;~Maneesh_Kumar_Singh1;~Manish_Gupta1;~Bapi_Raju_Surampudi1", "gender": "F;M;M;M;M;", "homepage": ";https://sites.google.com/view/subbareddyoota300/home?authuser=0;https://advaithmall.github.io/;https://arxiv.org/search/?query=Singh%2C+Maneesh&searchtype=author&abstracts=show&order=-announced_date_first&size=50;https://sites.google.com/view/manishg/;", "dblp": "299/8490;190/1709;372/4611;263/9205-1;g/ManishGupta1.html;", "google_scholar": "https://scholar.google.com/citations?hl=en;https://scholar.google.co.in/citations?user=4Uz0LngAAAAJ;https://scholar.google.co.in/citations?user=uZZrApkAAAAJ;hdQhiFgAAAAJ;https://scholar.google.co.in/citations?user=eX9PSu0AAAAJ;", "orcid": ";0000-0002-5975-622X;;0000-0002-7414-1813;0000-0002-2843-3110;", "linkedin": "khushbupahwa;subba-reddy-oota-11a91254/;advaith-malladi-30175326b/;maneesh-singh-3523ab9/;manishsgupta/;", "or_profile": "~Khushbu_Pahwa1;~SUBBA_REDDY_OOTA1;~Advaith_Malladi1;~Maneesh_Kumar_Singh1;~Manish_Gupta1;~Bapi_Raju_Surampudi1", "aff": "Rice University;MPI-SWS;International Institute of Information Technology, Hyderabad, International Institute of Information Technology Hyderabad;Spector Inc;Microsoft;", "aff_domain": "rice.edu;mpi-sws.org;research.iiit.ac.in;spector.com;microsoft.com;", "position": "MS student;Visiting Scholar;Undergrad student;Head, AI Research & Technologies;Principal Researcher;", "bibtex": "@misc{\npahwa2024brain,\ntitle={Brain encoding models based on binding multiple modalities across audio, language, and vision},\nauthor={Khushbu Pahwa and SUBBA REDDY OOTA and Advaith Malladi and Maneesh Kumar Singh and Manish Gupta and Bapi Raju Surampudi},\nyear={2024},\nurl={https://openreview.net/forum?id=3NMYMLL92j}\n}", "github": "", "project": "", "reviewers": "77Kr;TnaU;bZKi", "site": "https://openreview.net/forum?id=3NMYMLL92j", "pdf_size": 2841931, "rating": "1;3;8", "confidence": "5;5;5", "soundness": "1;2;3", "contribution": "1;2;3", "presentation": "1;3;3", "wc_summary": "68;45;82", "wc_strengths": "44;31;47", "wc_weaknesses": "214;253;17", "wc_questions": "133;18;53", "wc_review": "459;347;199", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "2014;0;0", "reply_reviewers": "0;0;0", "reply_authors": "3;0;0", "rating_avg": [ 4.0, 2.943920288775949 ], "confidence_avg": [ 5.0, 0.0 ], "soundness_avg": [ 2.0, 0.816496580927726 ], "contribution_avg": [ 2.0, 0.816496580927726 ], "presentation_avg": [ 2.3333333333333335, 0.9428090415820634 ], "wc_summary_avg": [ 65.0, 15.253414918196734 ], "wc_strengths_avg": [ 40.666666666666664, 6.944222218666553 ], "wc_weaknesses_avg": [ 161.33333333333334, 103.2935407252339 ], "wc_questions_avg": [ 68.0, 48.13176359397884 ], "wc_review_avg": [ 335.0, 106.48317550987417 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 671.3333333333334, 949.4087048731378 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 1.4142135623730951 
], "replies_avg": [ 9, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:w356AAv04OEJ:scholar.google.com/&scioq=Brain+encoding+models+based+on+binding+multiple+modalities+across+audio,+language,+and+vision&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;1;2;3;4", "aff_unique_norm": "Rice University;Max Planck Institute for Software Systems;International Institute of Information Technology, Hyderabad;Spector Inc;Microsoft", "aff_unique_dep": ";;;;Microsoft Corporation", "aff_unique_url": "https://www.rice.edu;https://www.mpi-sws.org;https://iiit Hyderabad.ac.in;;https://www.microsoft.com", "aff_unique_abbr": "Rice;MPI-SWS;IIIT Hyderabad;;Microsoft", "aff_campus_unique_index": "1", "aff_campus_unique": ";Hyderabad", "aff_country_unique_index": "0;1;2;0;0", "aff_country_unique": "United States;Germany;India" }, { "id": "3NXhwkZGjz", "title": "Source-Free Unsupervised Domain Adaptation with Hypothesis Consolidation of Prediction Rationale", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Source-Free Unsupervised Domain Adaptation (SFUDA) is a challenging task where a model needs to be adapted to a new domain without access to target domain labels or source domain data. The primary difficulty in this task is that the model's predictions may be inaccurate, and using these inaccurate predictions for model adaptation can lead to misleading results. To address this issue, this paper proposes a novel approach that considers multiple prediction hypotheses for each sample and investigates the rationale behind each hypothesis. By consolidating these hypothesis rationales, we identify the most likely correct hypotheses, which we then use as a pseudo-labeled set to support a semi-supervised learning procedure for model adaptation. To achieve the optimal performance, we propose a three-step adaptation process: model pre-adaptation, hypothesis consolidation, and semi-supervised learning. 
Extensive experimental results demonstrate that our approach achieves state-of-the-art performance in the SFUDA task and can be easily integrated into existing approaches to improve their performance.", "keywords": "Source-Free Unsupervised Domain Adaptation;Hypothesis Consolidation;Prediction Rationale", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "", "author": "Yangyang Shu;Lingqiao Liu;Xiaofeng Cao;Qi Chen;Bowen Zhang;Ziqin Zhou;Anton van den Hengel", "authorids": "~Yangyang_Shu1;~Lingqiao_Liu3;~Xiaofeng_Cao2;~Qi_Chen4;~Bowen_Zhang3;~Ziqin_Zhou1;~Anton_van_den_Hengel1", "gender": "M;M;M;M;F;;M", "homepage": "https://ganperf.github.io/yangyangshu.github.io/;https://sites.google.com/site/lingqiaoliu83/;https://chenqi008.github.io/;;;;https://xiaofengcaoml.github.io/", "dblp": "201/7247.html;45/7776;66/6320-14;;;v/AntonvandenHengel;117/3982-2.html", "google_scholar": "TpdRFZIAAAAJ;Y2xu62UAAAAJ;OgKU77kAAAAJ;;uS_cqPUAAAAJ;https://scholar.google.com.au/citations?user=nMGZ2ZQAAAAJ;", "orcid": ";;0000-0001-8732-8049;0000-0001-6180-6815;0000-0002-5736-1232;0000-0003-3027-8364;", "linkedin": ";;qi-chen-4b1a72287;;;;", "or_profile": "~Yangyang_Shu1;~Lingqiao_Liu3;~Qi_Chen4;~Bowen_Zhang3;~Ziqin_Zhou1;~Anton_van_den_Hengel1;~Xiaofeng_Cao1", "aff": "University of Adelaide;University of Adelaide;University of Adelaide;University of Adelaide;University of Adelaide;University of Adelaide;Jilin University", "aff_domain": "adelaide.edu.au;adelaide.edu.au;adelaide.edu.au;adelaide.edu.au;adelaide.edu.au;adelaide.edu.au;jlu.edu.cn", "position": "Postdoc;Associate Professor;PhD student;PhD student;PhD student;Professor;Associate Professor", "bibtex": "@misc{\nshu2024sourcefree,\ntitle={Source-Free Unsupervised Domain Adaptation with Hypothesis Consolidation of Prediction Rationale},\nauthor={Yangyang Shu and Lingqiao Liu and Xiaofeng Cao and Qi Chen and Bowen Zhang and Ziqin Zhou and Anton van den Hengel},\nyear={2024},\nurl={https://openreview.net/forum?id=3NXhwkZGjz}\n}", "github": "", "project": "", "reviewers": "MZzB;qsm3;oDf4;Pcxi;8pzv", "site": "https://openreview.net/forum?id=3NXhwkZGjz", "pdf_size": 4559014, "rating": "3;3;5;5;6", "confidence": "4;4;4;5;3", "soundness": "1;2;3;2;3", "contribution": "2;2;2;3;3", "presentation": "1;2;2;3;3", "wc_summary": "334;25;29;84;78", "wc_strengths": "63;9;39;49;41", "wc_weaknesses": "1322;81;152;130;188", "wc_questions": "131;2;38;2;2", "wc_review": "1850;117;258;265;309", "wc_reply_reviewers": "0;0;0;0;0", "wc_reply_authors": "0;0;0;0;0", "reply_reviewers": "0;0;0;0;0", "reply_authors": "0;0;0;0;0", "rating_avg": [ 4.4, 1.2 ], "confidence_avg": [ 4.0, 0.6324555320336759 ], "soundness_avg": [ 2.2, 0.7483314773547882 ], "contribution_avg": [ 2.4, 0.4898979485566356 ], "presentation_avg": [ 2.2, 0.7483314773547882 ], "wc_summary_avg": [ 110.0, 114.59668407070075 ], "wc_strengths_avg": [ 40.2, 17.735839421916292 ], "wc_weaknesses_avg": [ 374.6, 474.9667777855626 ], "wc_questions_avg": [ 35.0, 49.98399743918047 ], "wc_review_avg": [ 559.8, 648.3176381990544 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.2635231383473649, "gs_citation": 0, "gs_cited_by_link": 
"https://scholar.google.com/scholar?q=related:9bEJlcm1BzAJ:scholar.google.com/&scioq=Source-Free+Unsupervised+Domain+Adaptation+with+Hypothesis+Consolidation+of+Prediction+Rationale&hl=en&as_sdt=0,5", "gs_version_total": 4, "aff_unique_index": "0;0;0;0;0;0;1", "aff_unique_norm": "University of Adelaide;Jilin University", "aff_unique_dep": ";", "aff_unique_url": "https://www.adelaide.edu.au;http://www.jlu.edu.cn", "aff_unique_abbr": "Adelaide;JLU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0;1", "aff_country_unique": "Australia;China" }, { "title": "Don't Play Favorites: Minority Guidance for Diffusion Models", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19517", "id": "3NmO9lY4Jn", "author_site": "Soobin Um, Suhyeon Lee, Jong Chul YE", "tldr": "", "abstract": "We explore the problem of generating minority samples using diffusion models. The minority samples are instances that lie on low-density regions of a data manifold. Generating a sufficient number of such minority instances is important, since they often contain some unique attributes of the data. However, the conventional generation process of the diffusion models mostly yields majority samples (that lie on high-density regions of the manifold) due to their high likelihoods, making themselves ineffective and time-consuming for the minority generating task. In this work, we present a novel framework that can make the generation process of the diffusion models focus on the minority samples. We first highlight that Tweedie's denoising formula yields favorable results for majority samples. The observation motivates us to introduce a metric that describes the uniqueness of a given sample. To address the inherent preference of the diffusion models w.r.t. the majority samples, we further develop *minority guidance*, a sampling technique that can guide the generation process toward regions with desired likelihood levels. Experiments on benchmark real datasets demonstrate that our minority guidance can greatly improve the capability of generating high-quality minority samples over existing generative samplers. We showcase that the performance benefit of our framework persists even in demanding real-world scenarios such as medical imaging, further underscoring the practical significance of our work. 
Code is available at https://github.com/soobin-um/minority-guidance.", "keywords": "diffusion models;fairness;generative models;minority generation", "primary_area": "generative models", "supplementary_material": "/attachment/c0ea9b6ed7ee3d7f288e6eeba0e0f3b0b3cb6134.zip", "author": "Soobin Um;Suhyeon Lee;Jong Chul Ye", "authorids": "~Soobin_Um1;~Suhyeon_Lee2;~Jong_Chul_Ye1", "gender": ";M;M", "homepage": "https://sites.google.com/view/soobinum;https://github.com/hyn2028;https://bispl.weebly.com/", "dblp": "339/0076;342/2820;15/5613", "google_scholar": ";V9rMrFQAAAAJ;HNMjoNEAAAAJ", "orcid": ";;", "linkedin": ";;", "or_profile": "~Soobin_Um1;~Suhyeon_Lee2;~Jong_Chul_Ye1", "aff": "Korea Advanced Institute of Science & Technology;Korea Advanced Institute of Science & Technology;Korea Advanced Institute of Science & Technology", "aff_domain": "kaist.ac.kr;kaist.ac.kr;kaist.ac.kr", "position": "PhD student;MS student;Full Professor", "bibtex": "@inproceedings{\num2024dont,\ntitle={Don't Play Favorites: Minority Guidance for Diffusion Models},\nauthor={Soobin Um and Suhyeon Lee and Jong Chul Ye},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=3NmO9lY4Jn}\n}", "github": "", "project": "", "reviewers": "mz51;xCB3;Xf5u;F8nE", "pdf_size": 27130256, "rating": "3;6;6;6", "confidence": "5;4;4;4", "soundness": "2;3;3;3", "contribution": "2;3;3;2", "presentation": "3;3;3;2", "wc_summary": "55;84;96;64", "wc_strengths": "42;36;154;42", "wc_weaknesses": "266;184;157;150", "wc_questions": "89;4;2;71", "wc_review": "452;308;409;327", "wc_reply_reviewers": "289;11;0;13", "wc_reply_authors": "1762;566;428;1091", "reply_reviewers": "3;1;0;1", "reply_authors": "5;2;1;2", "rating_avg": [ 5.25, 1.299038105676658 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 74.75, 16.145819892467525 ], "wc_strengths_avg": [ 68.5, 49.42418436352794 ], "wc_weaknesses_avg": [ 189.25, 46.09433262343647 ], "wc_questions_avg": [ 41.5, 39.02883549377306 ], "wc_review_avg": [ 374.0, 58.89397252690635 ], "wc_reply_reviewers_avg": [ 78.25, 121.77720435286729 ], "wc_reply_authors_avg": [ 961.75, 524.0736470191952 ], "reply_reviewers_avg": [ 1.25, 1.0897247358851685 ], "reply_authors_avg": [ 2.5, 1.5 ], "replies_avg": [ 22, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -1.0, "gs_citation": 18, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=9567931568206842834&as_sdt=40005&sciodt=0,10&hl=en", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=3NmO9lY4Jn", "pdf": "https://openreview.net/pdf?id=3NmO9lY4Jn", "email": "kaist.ac.kr;kaist.ac.kr;kaist.ac.kr", "author_num": 3, "aff_unique_index": "0;0;0", "aff_unique_norm": "Korea Advanced Institute of Science and Technology", "aff_unique_dep": "", "aff_unique_url": "https://www.kaist.ac.kr", "aff_unique_abbr": "KAIST", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "South Korea" }, { "title": "GIO: Gradient Information Optimization for Training Dataset Selection", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19516", "id": "3NnfJnbJT2", "author_site": "Dante Everaert, Christopher Potts", "tldr": "", "abstract": "It is often advantageous to train models on a subset of the available train examples, because the examples 
are of variable quality or because one would like to train with fewer examples, without sacrificing performance. We present Gradient Information Optimization (GIO), a scalable, task-agnostic approach to this data selection problem that requires only a small set of (unlabeled) examples representing a target distribution. GIO begins from a natural, information-theoretic objective that is intractable in practice. Our contribution is in showing that it can be made highly scalable through a simple relaxation of the objective and a highly efficient implementation. In experiments with machine translation, spelling correction, and image recognition, we show that GIO delivers outstanding results with very small train sets. These findings are robust to different representation models and hyperparameters for GIO itself. GIO is task- and domain-agnostic and can be applied out-of-the-box to new datasets and domains. We open source a pip-installable implementation of the algorithm as \"pip install grad-info-opt\".", "keywords": "data selection;data-centric AI;information theory;kl divergence;gradient;natural language processing;computer vision", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/c15baefa602a6cff4257f111c50fd9f07d2752fa.zip", "author": "Dante Everaert;Christopher Potts", "authorids": "~Dante_Everaert1;~Christopher_Potts1", "gender": "M;M", "homepage": "https://www.amazon.science/author/dante-everaert;http://web.stanford.edu/~cgpotts/", "dblp": ";13/2617", "google_scholar": ";3j08YoAAAAAJ", "orcid": ";0000-0002-7978-6055", "linkedin": "dante-everaert/;", "or_profile": "~Dante_Everaert1;~Christopher_Potts1", "aff": "Amazon;Stanford University", "aff_domain": "amazon.com;stanford.edu", "position": "Researcher;Full Professor", "bibtex": "@inproceedings{\neveraert2024gio,\ntitle={{GIO}: Gradient Information Optimization for Training Dataset Selection},\nauthor={Dante Everaert and Christopher Potts},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=3NnfJnbJT2}\n}", "github": "", "project": "", "reviewers": "C7wm;u6CK;NSKq;Km99", "pdf_size": 3358561, "rating": "6;6;8;8", "confidence": "3;4;3;3", "soundness": "2;3;3;4", "contribution": "2;3;3;4", "presentation": "1;4;3;3", "wc_summary": "90;43;82;163", "wc_strengths": "18;52;40;127", "wc_weaknesses": "109;186;158;135", "wc_questions": "120;67;396;24", "wc_review": "337;348;676;449", "wc_reply_reviewers": "67;0;242;22", "wc_reply_authors": "887;864;1556;549", "reply_reviewers": "1;0;2;1", "reply_authors": "2;2;4;1", "rating_avg": [ 7.0, 1.0 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 3.0, 0.7071067811865476 ], "presentation_avg": [ 2.75, 1.0897247358851685 ], "wc_summary_avg": [ 94.5, 43.36184959154764 ], "wc_strengths_avg": [ 59.25, 40.97178907492325 ], "wc_weaknesses_avg": [ 147.0, 28.416544476765644 ], "wc_questions_avg": [ 151.75, 145.0592551338935 ], "wc_review_avg": [ 452.5, 136.22132725825278 ], "wc_reply_reviewers_avg": [ 82.75, 95.06149325568161 ], "wc_reply_authors_avg": [ 964.0, 366.95299426493307 ], "reply_reviewers_avg": [ 1.0, 0.7071067811865476 ], "reply_authors_avg": [ 2.25, 1.0897247358851685 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 11, "gs_cited_by_link": 
"https://scholar.google.com/scholar?cites=295988787452368742&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=3NnfJnbJT2", "pdf": "https://openreview.net/pdf?id=3NnfJnbJT2", "email": "amazon.com;stanford.edu", "author_num": 2, "aff_unique_index": "0;1", "aff_unique_norm": "Amazon;Stanford University", "aff_unique_dep": "Amazon.com, Inc.;", "aff_unique_url": "https://www.amazon.com;https://www.stanford.edu", "aff_unique_abbr": "Amazon;Stanford", "aff_campus_unique_index": "1", "aff_campus_unique": ";Stanford", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "id": "3Ok7ccvtf3", "title": "UNLEARNING THE UNWANTED DATA FROM A PERSONALIZED RECOMMENDATION MODEL", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Recommender Systems (RS) learn user behavior by monitoring their activities on the online platform. In a few scenarios, users consume the content but don\u2019t want to get their recommendations because a). They consumed the content by mistake, and those interactions have been utilized in personalizing the model; b) The content was consumed by someone else on their behalf; c) Data acquisition was faulty because of machine failure; d) The user has lost interest in the service, etc. Out of any of these reasons, the user wants the data that was used for generating the recommendation to be unlearned by RS. The constraints with this unlearning are 1) The user\u2019s other data should be intact, 2) Personalized experience should not be affected, and 3) We can not afford training from scratch. To solve the stated problem, a few unlearning strategies have already been proposed, but unlearning the matrix factorization-based model is not much explored. In this work, we propose a solution of unlearning from the faulty recommendation model (m1) by diluting the impact of unwanted data. To do so, we first correct the unwanted data and pre- pare an intermediate tiny model m2, referred to as the rescue model. Further, we apply the convolution fusion function (CFF) on the latent features acquired using m1 , m2 . The performance of the proposed method is evaluated on multiple public datasets. 
We observed that the proposed method outperforms SOTA benchmark models on recommendation tasks.", "keywords": "machine unlearning;recommendation system;matrix factorization", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Narayan Chaturvedi;Brijraj Singh;Niranjan Pedanekar", "authorids": "~Narayan_Chaturvedi1;~Brijraj_Singh1;~Niranjan_Pedanekar1", "gender": "M;;M", "homepage": ";;", "dblp": ";;131/9354", "google_scholar": ";;UksQ7SEAAAAJ", "orcid": ";;", "linkedin": "narayan-chaturvedi-phd-a3a89311/;;", "or_profile": "~Narayan_Chaturvedi1;~Brijraj_Singh1;~Niranjan_Pedanekar1", "aff": ";;Sony", "aff_domain": ";;sony.com", "position": ";;Principal Researcher", "bibtex": "@misc{\nanonymous2024unlearning,\ntitle={{UNLEARNING} {THE} {UNWANTED} {DATA} {FROM} A {PERSONALIZED} {RECOMMENDATION} {MODEL}},\nauthor={Anonymous},\nyear={2024},\nurl={https://openreview.net/forum?id=3Ok7ccvtf3}\n}", "github": "", "project": "", "reviewers": "n57L;o6ud;HcxE;GJxA", "site": "https://openreview.net/forum?id=3Ok7ccvtf3", "pdf_size": 782045, "rating": "3;3;3;5", "confidence": "3;4;3;2", "soundness": "3;1;1;2", "contribution": "3;2;1;3", "presentation": "1;1;2;2", "wc_summary": "165;86;45;51", "wc_strengths": "88;36;18;79", "wc_weaknesses": "161;318;204;168", "wc_questions": "136;12;54;45", "wc_review": "550;452;321;343", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "271;228;370;276", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 3.5, 0.8660254037844386 ], "confidence_avg": [ 3.0, 0.7071067811865476 ], "soundness_avg": [ 1.75, 0.82915619758885 ], "contribution_avg": [ 2.25, 0.82915619758885 ], "presentation_avg": [ 1.5, 0.5 ], "wc_summary_avg": [ 86.75, 47.814093110713706 ], "wc_strengths_avg": [ 55.25, 29.13224158900238 ], "wc_weaknesses_avg": [ 212.75, 62.9181015288923 ], "wc_questions_avg": [ 61.75, 45.630992757116296 ], "wc_review_avg": [ 416.5, 91.65833295451101 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 286.25, 51.8284429632996 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 10, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.816496580927726, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:aBJC3RT9gScJ:scholar.google.com/&scioq=UNLEARNING+THE+UNWANTED+DATA+FROM+A+PERSONALIZED+RECOMMENDATION+MODEL&hl=en&as_sdt=0,21", "gs_version_total": 0, "aff_unique_index": "0", "aff_unique_norm": "Sony Corporation", "aff_unique_dep": "", "aff_unique_url": "https://www.sony.com", "aff_unique_abbr": "Sony", "aff_country_unique_index": "0", "aff_country_unique": "Japan" }, { "id": "3OtVLnXfmS", "title": "GenNBV: Generalizable Next-Best-View Policy for Active 3D Reconstruction", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Even with the recent advances in neural radiance rendering (NeRF) enable high-quality digitization of large-scale scenes, the image-capturing process is time-consuming and labor-intensive. Previous works attempt to automate this process using active 3D reconstruction, with the Next-Best-View (NBV) policy being the most well-known. However, the majority of NBV policies are rule-based and only apply to a predefined limited action space, limiting their generalization ability. In this work, we propose \\emph{GenNBV}, a novel framework that endows the first free-space NBV policy with generalizability through end-to-end training. 
This policy is reinforcement learning (RL)-based and empowers a 3D scanning drone to capture from any viewpoint and interact with the environment across diverse scenarios, even those involving unseen structures during training. We also proposed a novel scene representation using action, geometric, and semantic embeddings, to further boost generalizability. To evaluate this NBV policy, we also establish a benchmark using the Isaac Gym simulator with the Houses3K and OmniObject3D datasets. Experiments demonstrate that our approach achieves a 98.26\\% and 83.61\\% coverage ratio on unseen buildings from these datasets, respectively, outperforming prior solutions.", "keywords": "Active 3D Reconstruction;Next-Best-View Prediction;Generalization;Reinforcement Learning", "primary_area": "applications to robotics, autonomy, planning", "supplementary_material": "/attachment/9dfbf6260f90878614e4964a296792957ed2a888.pdf", "author": "Xiao Chen;Quanyi Li;Tai Wang;Tianfan Xue;Jiangmiao Pang", "authorids": "~Xiao_Chen6;~Quanyi_Li1;~Tai_Wang2;~Tianfan_Xue2;~Jiangmiao_Pang1", "gender": "M;M;M;M;M", "homepage": "https://xiao-chen.tech;https://quanyili.github.io;https://tianfan.info;https://oceanpang.github.io/;https://tai-wang.github.io/", "dblp": ";270/7691;54/8652;231/7630;", "google_scholar": "SW2HLB0AAAAJ;Ty49X3UAAAAJ;RfSQKrIAAAAJ;https://scholar.google.com/citations?authuser=0;JmbbZWIAAAAJ", "orcid": ";;0000-0001-5031-6618;0000-0002-6711-9319;", "linkedin": "xiao-chen-%E9%99%88%E9%AA%81-3b4a731a0/;https://www.linkedin.com/mwlite/in/quanyi-li-2b7985183;tianfan-xue-54016716;;%E6%B3%B0-%E7%8E%8B-2b2738147/", "or_profile": "~Xiao_Chen6;~Quanyi_Li1;~Tianfan_Xue2;~Jiangmiao_Pang1;~Tai_WANG1", "aff": "Shanghai Artificial Intelligence Laboratory;University of Edinburgh;The Chinese University of Hong Kong;Shanghai AI Laboratory ;Shanghai AI Laboratory", "aff_domain": "pjlab.org.cn;ed.ac.uk;cuhk.edu.hk;pjlab.org.cn;pjlab.org.cn", "position": "Intern;MS student;Assistant Professor;Research Scientist;Research Scientist", "bibtex": "@misc{\nchen2024gennbv,\ntitle={Gen{NBV}: Generalizable Next-Best-View Policy for Active 3D Reconstruction},\nauthor={Xiao Chen and Quanyi Li and Tai Wang and Tianfan Xue and Jiangmiao Pang},\nyear={2024},\nurl={https://openreview.net/forum?id=3OtVLnXfmS}\n}", "github": "", "project": "", "reviewers": "k3Gz;NscJ;gNx2;7e87", "site": "https://openreview.net/forum?id=3OtVLnXfmS", "pdf_size": 5341135, "rating": "3;3;5;6", "confidence": "5;3;4;2", "soundness": "1;2;2;3", "contribution": "1;1;2;3", "presentation": "1;2;2;3", "wc_summary": "81;67;76;58", "wc_strengths": "26;47;113;34", "wc_weaknesses": "178;152;225;249", "wc_questions": "1;20;61;6", "wc_review": "286;286;475;347", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.25, 1.299038105676658 ], "confidence_avg": [ 3.5, 1.118033988749895 ], "soundness_avg": [ 2.0, 0.7071067811865476 ], "contribution_avg": [ 1.75, 0.82915619758885 ], "presentation_avg": [ 2.0, 0.7071067811865476 ], "wc_summary_avg": [ 70.5, 8.789197915623474 ], "wc_strengths_avg": [ 55.0, 34.31471987354698 ], "wc_weaknesses_avg": [ 201.0, 38.11167800031901 ], "wc_questions_avg": [ 22.0, 23.569047498785352 ], "wc_review_avg": [ 348.5, 77.16378684331141 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 
-0.6024640760767093, "gs_citation": 9, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=7471704688960664825&as_sdt=5,31&sciodt=0,31&hl=en", "gs_version_total": 8, "aff_unique_index": "0;1;2;3;3", "aff_unique_norm": "Shanghai Artificial Intelligence Laboratory;University of Edinburgh;Chinese University of Hong Kong;Shanghai AI Laboratory", "aff_unique_dep": ";;;", "aff_unique_url": "http://www.shailab.org/;https://www.ed.ac.uk;https://www.cuhk.edu.hk;https://www.shanghai-ai-lab.com", "aff_unique_abbr": "Shanghai AI Lab;Edinburgh;CUHK;SAIL", "aff_campus_unique_index": "1", "aff_campus_unique": ";Hong Kong SAR", "aff_country_unique_index": "0;1;0;0;0", "aff_country_unique": "China;United Kingdom" }, { "id": "3OzQhhPLyW", "title": "Meta-Value Learning: a General Framework for Learning with Learning Awareness", "track": "main", "status": "Reject", "tldr": "", "abstract": "Gradient-based learning in multi-agent systems is difficult because the gradient derives from a first-order model which does not account for the interaction between agents\u2019 learning processes. LOLA (Foerster et al., 2018) accounts for this by differentiating through one step of optimization. We propose to judge joint policies by their long-term prospects as measured by the meta-value, a discounted sum over the returns of future optimization iterates. We apply a form of Q-learning to the meta-game of optimization, in a way that avoids the need to explicitly represent the continuous action space of policy updates. The resulting method, MeVa, is consistent and far-sighted, and does not require REINFORCE estimators. We analyze the behavior of our method on a toy game and compare to prior work on repeated matrix games.", "keywords": "multi-agent reinforcement learning;meta-learning", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/413519cca839887d6e9de828a80799fb29af6808.zip", "author": "Tim Cooijmans;Milad Aghajohari;Aaron Courville", "authorids": "~Tim_Cooijmans1;~Milad_Aghajohari1;~Aaron_Courville3", "gender": "M;M;", "homepage": ";;", "dblp": "153/5756;241/5265;56/1688", "google_scholar": "https://scholar.google.ca/citations?user=Ec6vKzwAAAAJ;;https://scholar.google.ca/citations?user=km6CP8cAAAAJ", "orcid": ";;", "linkedin": ";milad-aghajohari-6b9a669b/;", "or_profile": "~Tim_Cooijmans1;~Milad_Aghajohari1;~Aaron_Courville3", "aff": "University of Montreal;Montreal Institute for Learning Algorithms, University of Montreal, Universit\u00e9 de Montr\u00e9al;Universit\u00e9 de Montr\u00e9al", "aff_domain": "umontreal.ca;mila.umontreal.ca; ", "position": "PhD student;Researcher;Assistant Professor", "bibtex": "@misc{\ncooijmans2024metavalue,\ntitle={Meta-Value Learning: a General Framework for Learning with Learning Awareness},\nauthor={Tim Cooijmans and Milad Aghajohari and Aaron Courville},\nyear={2024},\nurl={https://openreview.net/forum?id=3OzQhhPLyW}\n}", "github": "", "project": "", "reviewers": "1uYc;c4Mz;VzC1;ZYT4;zqYk;rsw5", "site": "https://openreview.net/forum?id=3OzQhhPLyW", "pdf_size": 1773301, "rating": "5;5;5;5;5;6", "confidence": "4;4;4;3;5;2", "soundness": "3;2;2;3;3;3", "contribution": "2;2;3;3;3;3", "presentation": "3;3;2;3;3;2", "wc_summary": "133;117;183;84;62;103", "wc_strengths": "24;74;44;103;42;153", "wc_weaknesses": "254;183;98;154;220;86", "wc_questions": "121;41;725;51;97;45", "wc_review": "532;415;1050;392;421;387", "wc_reply_reviewers": "458;12;0;0;0;0", "wc_reply_authors": "1148;532;1076;322;0;314", "reply_reviewers": "2;1;0;0;0;0", "reply_authors": 
"3;2;2;1;0;1", "rating_avg": [ 5.166666666666667, 0.37267799624996495 ], "confidence_avg": [ 3.6666666666666665, 0.9428090415820634 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 113.66666666666667, 38.41729934403105 ], "wc_strengths_avg": [ 73.33333333333333, 43.786096220401085 ], "wc_weaknesses_avg": [ 165.83333333333334, 60.713580761546986 ], "wc_questions_avg": [ 180.0, 245.48659162297778 ], "wc_review_avg": [ 532.8333333333334, 236.27485172052388 ], "wc_reply_reviewers_avg": [ 78.33333333333333, 169.84862541556103 ], "wc_reply_authors_avg": [ 565.3333333333334, 417.00786030428196 ], "reply_reviewers_avg": [ 0.5, 0.7637626158259734 ], "reply_authors_avg": [ 1.5, 0.9574271077563381 ], "replies_avg": [ 21, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.7905694150420948, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=18278300865798388679&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 3, "aff_unique_index": "0;0;1", "aff_unique_norm": "University of Montreal;Universit\u00e9 de Montr\u00e9al", "aff_unique_dep": ";", "aff_unique_url": "https://wwwumontreal.ca;https://www.umontreal.ca", "aff_unique_abbr": "UM;UdeM", "aff_campus_unique_index": "1", "aff_campus_unique": ";Montreal", "aff_country_unique_index": "0;0;0", "aff_country_unique": "Canada" }, { "id": "3P87ptzvTm", "title": "Optimal Multiple Transport with Applications to Visual Matching, Model Fusion and Beyond", "track": "main", "status": "Reject", "tldr": "", "abstract": "Optimal transport (OT) has wide applications including machine learning. It concerns finding the optimal mapping for Monge OT (or coupling for Kantorovich OT) between two probability measures. This paper generalizes the classic pairwise OT to the so-called Optimal Multiple Transportation (OMT) accepting more than two probability measures as input. We formulate the problem as minimizing the transportation costs between each pair of distributions and meanwhile requiring cycle-consistency of transportation among probability measures. In particular, we present both the Monge and Kantorovich formulations of OMT and obtain the approximate solution with added entropic and cycle-consistency regularization, for which an iterative Sinkhorn-based algorithm (ROMT-Sinkhorn) is proposed. We empirically show the superiority of our approach on two popular tasks: visual multi-point matching (MPM) and multi-model fusion (MMF). In MPM, our OMT solver directly utilizes the cosine distance between learned features of points obtained from off-the-shelf graph matching neural networks as the pairwise cost. We leverage the ROMT-Sinkhorn algorithm to learn multiple matchings. For MMF, we focus on the problem of fusing three models and employ ROMT-Sinkhorn instead of the Sinkhorn algorithm to learn the alignment between layers. Both tasks achieve competitive results with ROMT-Sinkhorn. Furthermore, we showcase the potential of our approach in addressing the travel salesman problem (TSP) by searching for the optimal path on the probability matrix instead of the distance matrix. 
Source code will be made publicly available.", "keywords": "Optimal Transport; Sinkhorn Algorithm; Cycle-Consistency; Visual Matching; Model Fusion", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Liangliang Shi;Jiale Hong;Junchi Yan", "authorids": "~Liangliang_Shi1;~Jiale_Hong1;~Junchi_Yan2", "gender": "M;;", "homepage": ";;", "dblp": "89/8730;;", "google_scholar": "Qf1k8lUAAAAJ;;", "orcid": "0000-0001-7033-4207;;", "linkedin": ";;", "or_profile": "~Liangliang_Shi1;~Jiale_Hong1;~Junchi_Yan2", "aff": "Shanghai Jiaotong University;;", "aff_domain": "sjtu.edu.cn;;", "position": "PhD student;;", "bibtex": "@misc{\nshi2024optimal,\ntitle={Optimal Multiple Transport with Applications to Visual Matching, Model Fusion and Beyond},\nauthor={Liangliang Shi and Jiale Hong and Junchi Yan},\nyear={2024},\nurl={https://openreview.net/forum?id=3P87ptzvTm}\n}", "github": "", "project": "", "reviewers": "aQyc;uVEA;16yx;2Gzs", "site": "https://openreview.net/forum?id=3P87ptzvTm", "pdf_size": 2003963, "rating": "5;5;5;5", "confidence": "4;3;4;4", "soundness": "3;2;3;2", "contribution": "3;2;2;2", "presentation": "3;3;3;3", "wc_summary": "104;142;103;110", "wc_strengths": "24;48;40;60", "wc_weaknesses": "58;246;274;32", "wc_questions": "514;3;49;524", "wc_review": "700;439;466;726", "wc_reply_reviewers": "227;0;137;133", "wc_reply_authors": "1319;1316;1169;774", "reply_reviewers": "1;0;1;1", "reply_authors": "3;3;3;2", "rating_avg": [ 5.0, 0.0 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 114.75, 15.958931668504631 ], "wc_strengths_avg": [ 43.0, 13.076696830622021 ], "wc_weaknesses_avg": [ 152.5, 108.34551213594405 ], "wc_questions_avg": [ 272.5, 247.06122722920324 ], "wc_review_avg": [ 582.75, 130.92244841890178 ], "wc_reply_reviewers_avg": [ 124.25, 80.98572405060042 ], "wc_reply_authors_avg": [ 1144.5, 222.33589453797154 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 2.75, 0.4330127018922193 ], "replies_avg": [ 23, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:8wExtdxwTNgJ:scholar.google.com/&scioq=Optimal+Multiple+Transport+with+Applications+to+Visual+Matching,+Model+Fusion+and+Beyond&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0", "aff_unique_norm": "Shanghai Jiao Tong University", "aff_unique_dep": "", "aff_unique_url": "https://www.sjtu.edu.cn", "aff_unique_abbr": "SJTU", "aff_country_unique_index": "0", "aff_country_unique": "China" }, { "id": "3POV2mBEVl", "title": "Principal Component Analysis for Cross-Sectionally Correlated Pricing Errors", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "We propose a new estimator for factor pricing models which we refer to as Principal Component Analysis for Cross-Sectionally Correlated Pricing Errors (PCA-XC). Our estimator aims to find the factor pricing model that well explains the time-series variation of asset returns and well handles the correlations of cross-section of pricing errors that we present exist in real-world data. The proposed estimator is defined by a new regularized minimization problem in which finding a solution is difficult. This contrasts with other related estimators whose corresponding minimization problem admits an analytic solution. 
To this end, we propose an approximate algorithm that solves our proposed minimization problem based on the alternating least squares method.", "keywords": "Unsupervised Learning;Optimization;Principal Component Analysis;Asset Pricing;Factor Pricing Model", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/ec72d22295ee66fa7ec2a96690c83dbb0e7f47c5.zip", "author": "Hyuksoo Kim;Saejoon Kim", "authorids": "~Hyuksoo_Kim1;~Saejoon_Kim1", "gender": ";", "homepage": ";http://fml.sogang.ac.kr", "dblp": "174/8206;10/1669", "google_scholar": "PtP1JioAAAAJ;https://scholar.google.com/scholar?hl=en", "orcid": "0000-0003-0088-3846;", "linkedin": ";", "or_profile": "~Hyuksoo_Kim1;~Saejoon_Kim1", "aff": "Sogang University;Sogang University", "aff_domain": "sogang.ac.kr;sogang.ac.kr", "position": "PhD student;Full Professor", "bibtex": "@misc{\nkim2024principal,\ntitle={Principal Component Analysis for Cross-Sectionally Correlated Pricing Errors},\nauthor={Hyuksoo Kim and Saejoon Kim},\nyear={2024},\nurl={https://openreview.net/forum?id=3POV2mBEVl}\n}", "github": "", "project": "", "reviewers": "D5h2;dcRp;ihuY;mR2q", "site": "https://openreview.net/forum?id=3POV2mBEVl", "pdf_size": 793880, "rating": "3;3;3;5", "confidence": "5;3;3;3", "soundness": "1;3;3;2", "contribution": "1;2;2;2", "presentation": "1;3;2;2", "wc_summary": "136;161;36;94", "wc_strengths": "2;29;23;73", "wc_weaknesses": "2;90;89;142", "wc_questions": "2;66;6;91", "wc_review": "142;346;154;400", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 3.5, 0.8660254037844386 ], "confidence_avg": [ 3.5, 0.8660254037844386 ], "soundness_avg": [ 2.25, 0.82915619758885 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 2.0, 0.7071067811865476 ], "wc_summary_avg": [ 106.75, 47.34646238104807 ], "wc_strengths_avg": [ 31.75, 25.839649765428323 ], "wc_weaknesses_avg": [ 80.75, 50.26616655365714 ], "wc_questions_avg": [ 41.25, 38.310409812477864 ], "wc_review_avg": [ 260.5, 114.18734605900953 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.3333333333333333, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:53q6tVa291wJ:scholar.google.com/&scioq=Principal+Component+Analysis+for+Cross-Sectionally+Correlated+Pricing+Errors&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "Sogang University", "aff_unique_dep": "", "aff_unique_url": "https://www.sogang.ac.kr", "aff_unique_abbr": "Sogang", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "South Korea" }, { "id": "3PWYAlAQxv", "title": "Neural Networks Trained by Weight Permutation are Universal Approximators", "track": "main", "status": "Reject", "tldr": "", "abstract": "The universal approximation property is fundamental to the success of neural networks, and has traditionally been achieved by networks without any constraints on their parameters. However, recent experimental research proposed an innovative permutation-based training method, which can achieve desired classification performance without modifying the exact values of the weights. 
In this paper, we prove that the permutation training method can guide a ReLU network to approximate one-dimensional continuous functions. Our numerical results under more diverse scenarios also validate the effectiveness of the permutation training method in regression tasks. Moreover, the notable observations during weight permutation suggest that permutation training can provide a novel tool for describing network learning behavior.", "keywords": "Universal approximation property;permutation training;physical neural networks;learning behavior", "primary_area": "learning theory", "supplementary_material": "/attachment/6522417374125b49514926c7ea20bb691c7d2f0d.zip", "author": "Gaohang Chen;Zhonghua Qiao;Yongqiang Cai", "authorids": "~Gaohang_Chen1;~Zhonghua_Qiao1;~Yongqiang_Cai1", "gender": "M;M;M", "homepage": ";https://www.polyu.edu.hk/ama/profile/zhqiao/;", "dblp": ";;228/6809", "google_scholar": ";;https://scholar.google.com/citations?hl=en", "orcid": "0000-0002-9133-0376;;0000-0002-2666-0539", "linkedin": ";;", "or_profile": "~Gaohang_Chen1;~Zhonghua_Qiao1;~Yongqiang_Cai1", "aff": "Hong Kong Polytechnic University;;Beijing Normal University", "aff_domain": "polyu.edu.hk;;bnu.edu.cn", "position": "PhD student;;Lecturer", "bibtex": "@misc{\nchen2024neural,\ntitle={Neural Networks Trained by Weight Permutation are Universal Approximators},\nauthor={Gaohang Chen and Zhonghua Qiao and Yongqiang Cai},\nyear={2024},\nurl={https://openreview.net/forum?id=3PWYAlAQxv}\n}", "github": "", "project": "", "reviewers": "5HxL;BYmb;XdGX;S6yU", "site": "https://openreview.net/forum?id=3PWYAlAQxv", "pdf_size": 5895261, "rating": "5;5;6;8", "confidence": "4;3;3;3", "soundness": "3;3;3;3", "contribution": "2;2;3;4", "presentation": "3;3;3;3", "wc_summary": "40;74;50;76", "wc_strengths": "44;53;110;119", "wc_weaknesses": "48;158;48;179", "wc_questions": "72;97;35;92", "wc_review": "204;382;243;466", "wc_reply_reviewers": "107;49;0;15", "wc_reply_authors": "731;962;781;883", "reply_reviewers": "1;1;0;1", "reply_authors": "2;2;2;2", "rating_avg": [ 6.0, 1.224744871391589 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.75, 0.82915619758885 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 60.0, 15.427248620541512 ], "wc_strengths_avg": [ 81.5, 33.30540496676178 ], "wc_weaknesses_avg": [ 108.25, 60.705745197633476 ], "wc_questions_avg": [ 74.0, 24.38237068047322 ], "wc_review_avg": [ 323.75, 105.46178217724182 ], "wc_reply_reviewers_avg": [ 42.75, 41.12405014100629 ], "wc_reply_authors_avg": [ 839.25, 89.57224737607068 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 2.0, 0.0 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.4714045207910316, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=4235409972258229367&as_sdt=5,48&sciodt=0,48&hl=en", "gs_version_total": 3, "aff_unique_index": "0;1", "aff_unique_norm": "Hong Kong Polytechnic University;Beijing Normal University", "aff_unique_dep": ";", "aff_unique_url": "https://www.polyu.edu.hk;https://www.bnu.edu.cn", "aff_unique_abbr": "PolyU;BNU", "aff_campus_unique_index": "0", "aff_campus_unique": "Hong Kong SAR;", "aff_country_unique_index": "0;0", "aff_country_unique": "China" }, { "id": "3PaVCdeEmW", "title": "Align after Pre-train: Improving Multilingual Generative Models with Cross-lingual Alignment", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Multilingual generative models obtain 
remarkable cross-lingual capabilities through pre-training on large-scale corpora. However, they still exhibit a performance bias toward high-resource languages, and learn isolated distributions of sentence representations across languages. To bridge this gap, we propose a simple yet effective alignment framework exploiting pairs of translation sentences. It aligns the internal sentence representations across different languages via multilingual contrastive learning and aligns model outputs by answering prompts in different languages. Experimental results demonstrate that even with less than 0.1\u2030 of pre-training tokens, our alignment framework significantly boosts the cross-lingual abilities of generative models and mitigates the performance gap. Further analysis reveals that it results in a better internal multilingual representation distribution of multilingual models.", "keywords": "Cross-lingual alignment;In-context learning;Multilingual generative model", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Chong Li;Shaonan Wang;Jiajun Zhang;Chengqing Zong", "authorids": "~Chong_Li6;~Shaonan_Wang1;~Jiajun_Zhang1;~Chengqing_Zong1", "gender": "M;F;M;M", "homepage": ";https://wangshaonan.github.io/;http://www.nlpr.ia.ac.cn/cip/jjzhang.htm;http://www.nlpr.ia.ac.cn/cip/english/zong.htm", "dblp": ";29/8236;71/6950-1.html;38/6093", "google_scholar": "https://scholar.google.com.hk/citations?user=aftZkxsAAAAJ;ydFT-G8AAAAJ;93zngeYAAAAJ;l8lvKOQAAAAJ", "orcid": "0009-0000-0708-7493;;;", "linkedin": ";;;", "or_profile": "~Chong_Li6;~Shaonan_Wang1;~Jiajun_Zhang1;~Chengqing_Zong1", "aff": "Institute of automation, Chinese Academy of Sciences;;Institute of Automation, Chinese Academy of Sciences;Institute of Automation, Chinese Academy of Sciences", "aff_domain": "ia.ac.cn;;ia.ac.cn;ia.ac.cn", "position": "PhD student;;Full Professor;Researcher", "bibtex": "@misc{\nli2024align,\ntitle={Align after Pre-train: Improving Multilingual Generative Models with Cross-lingual Alignment},\nauthor={Chong Li and Shaonan Wang and Jiajun Zhang and Chengqing Zong},\nyear={2024},\nurl={https://openreview.net/forum?id=3PaVCdeEmW}\n}", "github": "", "project": "", "reviewers": "GUFo;ehYp;1odi", "site": "https://openreview.net/forum?id=3PaVCdeEmW", "pdf_size": 1270084, "rating": "3;5;6", "confidence": "4;4;4", "soundness": "2;3;3", "contribution": "2;2;2", "presentation": "3;3;3", "wc_summary": "74;73;95", "wc_strengths": "64;83;111", "wc_weaknesses": "289;171;171", "wc_questions": "7;50;58", "wc_review": "434;377;435", "wc_reply_reviewers": "0;89;139", "wc_reply_authors": "1005;667;793", "reply_reviewers": "0;1;1", "reply_authors": "3;2;3", "rating_avg": [ 4.666666666666667, 1.247219128924647 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 80.66666666666667, 10.143416036468626 ], "wc_strengths_avg": [ 86.0, 19.30457631409368 ], "wc_weaknesses_avg": [ 210.33333333333334, 55.62573345334174 ], "wc_questions_avg": [ 38.333333333333336, 22.395436042987765 ], "wc_review_avg": [ 415.3333333333333, 27.108834148463284 ], "wc_reply_reviewers_avg": [ 76.0, 57.48623023530649 ], "wc_reply_authors_avg": [ 821.6666666666666, 139.46883363517296 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 2.6666666666666665, 0.4714045207910317 ], "replies_avg": [ 13, 0 ], 
"authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 5, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11602331846743195669&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 0, "aff_unique_index": "0;0;0", "aff_unique_norm": "Chinese Academy of Sciences", "aff_unique_dep": "Institute of Automation", "aff_unique_url": "http://www.ia.cas.cn", "aff_unique_abbr": "CAS", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "China" }, { "title": "SPTNet: An Efficient Alternative Framework for Generalized Category Discovery with Spatial Prompt Tuning", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19515", "id": "3QLkwU40EE", "author_site": "Hongjun Wang, Sagar Vaze, Kai Han", "tldr": "", "abstract": "Generalized Category Discovery (GCD) aims to classify unlabelled images from both \u2018seen\u2019 and \u2018unseen\u2019 classes by transferring knowledge from a set of labelled \u2018seen\u2019 class images. A key theme in existing GCD approaches is adapting large-scale pre-trained models for the GCD task. An alternate perspective, however, is to adapt the data representation itself for better alignment with the pre-trained model. As such, in this paper, we introduce a two-stage adaptation approach termed SPTNet, which iteratively optimizes model parameters (i.e., model-finetuning) and data parameters (i.e., prompt learning). Furthermore, we propose a novel spatial prompt tuning method (SPT) which considers the spatial property of image data, enabling the method to better focus on object parts, which can transfer between seen and unseen classes. We thoroughly evaluate our SPTNet on standard benchmarks and demonstrate that our method outperforms existing GCD methods. Notably, we find our method achieves an average accuracy of 61.4% on the SSB, surpassing prior state-of-the-art methods by approximately 10%. The improvement is particularly remarkable as our method yields extra parameters amounting to only 0.117% of those in the backbone architecture. 
Project page: https://visual-ai.github.io/sptnet.", "keywords": "Generalized Category Discovery;Novel Category Discovery", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Hongjun Wang;Sagar Vaze;Kai Han", "authorids": "~Hongjun_Wang2;~Sagar_Vaze1;~Kai_Han1", "gender": "M;M;M", "homepage": "https://whj363636.github.io/;https://sgvaze.github.io/;http://www.kaihan.org/", "dblp": "65/3627-5;226/4705;51/4757-1.html", "google_scholar": "DNi-nB0AAAAJ;lvuOknUAAAAJ;tG8S_vMAAAAJ", "orcid": ";0000-0003-2920-9345;0000-0002-7995-9999", "linkedin": ";sagar-vaze-2356ab171/;kaihancs/", "or_profile": "~Hongjun_Wang2;~Sagar_Vaze1;~Kai_Han1", "aff": "NVIDIA;University of Oxford;The University of Hong Kong", "aff_domain": "nvidia.com;ox.ac.uk;hku.hk", "position": "Intern;PhD student;Assistant Professor", "bibtex": "@inproceedings{\nwang2024sptnet,\ntitle={{SPTN}et: An Efficient Alternative Framework for Generalized Category Discovery with Spatial Prompt Tuning},\nauthor={Hongjun Wang and Sagar Vaze and Kai Han},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=3QLkwU40EE}\n}", "github": "", "project": "", "reviewers": "Pson;bfKG;E8qj", "pdf_size": 25689441, "rating": "6;6;8", "confidence": "4;2;5", "soundness": "2;3;3", "contribution": "4;3;4", "presentation": "3;4;3", "wc_summary": "69;63;109", "wc_strengths": "53;84;49", "wc_weaknesses": "123;174;456", "wc_questions": "53;9;223", "wc_review": "298;330;837", "wc_reply_reviewers": "0;0;126", "wc_reply_authors": "467;347;1264", "reply_reviewers": "0;0;1", "reply_authors": "1;1;2", "rating_avg": [ 6.666666666666667, 0.9428090415820634 ], "confidence_avg": [ 3.6666666666666665, 1.247219128924647 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 3.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 3.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 80.33333333333333, 20.417857108151406 ], "wc_strengths_avg": [ 62.0, 15.641824275533422 ], "wc_weaknesses_avg": [ 251.0, 146.4445287472359 ], "wc_questions_avg": [ 95.0, 92.2749514584899 ], "wc_review_avg": [ 488.3333333333333, 246.8904390390379 ], "wc_reply_reviewers_avg": [ 42.0, 59.39696961966999 ], "wc_reply_authors_avg": [ 692.6666666666666, 406.95317775991 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 1.3333333333333333, 0.4714045207910317 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.7559289460184545, "gs_citation": 23, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=9353576079773046885&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=3QLkwU40EE", "pdf": "https://openreview.net/pdf?id=3QLkwU40EE", "email": "nvidia.com;ox.ac.uk;hku.hk", "author_num": 3, "aff_unique_index": "0;1;2", "aff_unique_norm": "NVIDIA;University of Oxford;University of Hong Kong", "aff_unique_dep": "NVIDIA Corporation;;", "aff_unique_url": "https://www.nvidia.com;https://www.ox.ac.uk;https://www.hku.hk", "aff_unique_abbr": "NVIDIA;Oxford;HKU", "aff_campus_unique_index": "1", "aff_campus_unique": ";Hong Kong SAR", "aff_country_unique_index": "0;1;2", "aff_country_unique": "United States;United Kingdom;China" }, { "id": "3QR230r11w", "title": "Multi-Fidelity Active Learning with GFlowNets", "track": "main", "status": "Reject", "tldr": "", "abstract": "In the last 
decades, the capacity to generate large amounts of data in science and engineering applications has been growing steadily. Meanwhile, the progress in machine learning has turned it into a suitable tool to process and utilise the available data. Nonetheless, many relevant scientific and engineering problems present challenges where current machine learning methods cannot yet efficiently leverage the available data and resources. For example, in scientific discovery, we are often faced with the problem of exploring very large, structured and high-dimensional spaces, and where querying a high fidelity, black-box objective function is very expensive. Progress in machine learning methods that can efficiently tackle such problems would help accelerate currently crucial areas such as drug and materials discovery. In this paper, we propose a multi-fidelity active learning algorithm with GFlowNets as a sampler, to efficiently discover diverse, high-scoring candidates where multiple approximations of the black-box function are available at lower fidelity and cost. Our evaluation on molecular discovery tasks shows that multi-fidelity active learning with GFlowNets can discover high-scoring candidates at a fraction of the budget of its single-fidelity counterpart while maintaining diversity, unlike RL-based alternatives. These results open new avenues for multi-fidelity active learning to accelerate scientific discovery and engineering design.", "keywords": "gflownets;multi-fidelity;active learning;bayesian optimization;scientific discovery;biological sequence design;molecular modelling;material discovery", "primary_area": "generative models", "supplementary_material": "/attachment/cff757e41ad228294bccf9aef376ad7d7c04aa49.zip", "author": "Alex Hern\u00e1ndez-Garc\u00eda;Nikita Saxena;Moksh Jain;Cheng-Hao Liu;Yoshua Bengio", "authorids": "~Alex_Hern\u00e1ndez-Garc\u00eda1;~Nikita_Saxena1;~Moksh_Jain1;~Cheng-Hao_Liu1;~Yoshua_Bengio1", "gender": ";M;M;M;F", "homepage": "https://alexhernandezgarcia.github.io;https://mj10.github.io;https://pchliu.github.io/;http://yoshuabengio.org;https://nikita-0209.github.io/", "dblp": "213/8573;249/9368;;56/953;", "google_scholar": "f8vQCOAAAAAJ;TD07G_wAAAAJ;iVJGx0cAAAAJ;kukA0LcAAAAJ;https://scholar.google.co.in/citations?user=DkroIXMAAAAJ", "orcid": ";;0000-0001-7923-6806;;", "linkedin": ";;chenghao-peter-liu/;yoshuabengio/?originalSubdomain=ca;nikita-saxena", "or_profile": "~Alex_Hern\u00e1ndez-Garc\u00eda1;~Moksh_Jain1;~Cheng-Hao_Liu1;~Yoshua_Bengio1;~Nikita_Saxena2", "aff": "Universit\u00e9 de Montr\u00e9al;Universit\u00e9 de Montr\u00e9al;Montreal Institute for Learning Algorithms, University of Montreal, Universit\u00e9 de Montr\u00e9al;University of Montreal;Google", "aff_domain": "umontreal.ca;umontreal.ca;mila.umontreal.ca;umontreal.ca;google.com", "position": "Postdoc;PhD student;PhD student intern;Full Professor;Researcher", "bibtex": "@misc{\nhern{\\'a}ndez-garc{\\'\\i}a2024multifidelity,\ntitle={Multi-Fidelity Active Learning with {GF}lowNets},\nauthor={Alex Hern{\\'a}ndez-Garc{\\'\\i}a and Nikita Saxena and Moksh Jain and Cheng-Hao Liu and Yoshua Bengio},\nyear={2024},\nurl={https://openreview.net/forum?id=3QR230r11w}\n}", "github": "", "project": "", "reviewers": "EtrP;Cu6t;TJ42;5Rpa", "site": "https://openreview.net/forum?id=3QR230r11w", "pdf_size": 818909, "rating": "3;5;6;8", "confidence": "4;4;4;3", "soundness": "2;2;3;3", "contribution": "1;2;3;4", "presentation": "2;2;3;4", "wc_summary": "33;67;77;202", "wc_strengths": "218;17;55;228",
"wc_weaknesses": "701;265;87;95", "wc_questions": "202;105;26;48", "wc_review": "1154;454;245;573", "wc_reply_reviewers": "335;849;26;0", "wc_reply_authors": "2849;3026;714;382", "reply_reviewers": "1;3;2;0", "reply_authors": "5;5;2;1", "rating_avg": [ 5.5, 1.8027756377319946 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.5, 1.118033988749895 ], "presentation_avg": [ 2.75, 0.82915619758885 ], "wc_summary_avg": [ 94.75, 64.0327064866073 ], "wc_strengths_avg": [ 129.5, 94.52645132448377 ], "wc_weaknesses_avg": [ 287.0, 249.37120924437127 ], "wc_questions_avg": [ 95.25, 68.04180700128414 ], "wc_review_avg": [ 606.5, 337.2006079472574 ], "wc_reply_reviewers_avg": [ 302.5, 341.9345697644507 ], "wc_reply_authors_avg": [ 1742.75, 1202.132142278876 ], "reply_reviewers_avg": [ 1.5, 1.118033988749895 ], "reply_authors_avg": [ 3.25, 1.7853571071357126 ], "replies_avg": [ 25, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.8006407690254357, "gs_citation": 14, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14990110088713039119&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "aff_unique_index": "0;0;1;1;2", "aff_unique_norm": "Universit\u00e9 de Montr\u00e9al;University of Montreal;Google", "aff_unique_dep": ";Montreal Institute for Learning Algorithms;Google", "aff_unique_url": "https://www.umontreal.ca;https://www.mila.quebec;https://www.google.com", "aff_unique_abbr": "UdeM;MILA;Google", "aff_campus_unique_index": "1;2", "aff_campus_unique": ";Montreal;Mountain View", "aff_country_unique_index": "0;0;0;0;1", "aff_country_unique": "Canada;United States" }, { "title": "Universal Backdoor Attacks", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19514", "id": "3QkzYBSWqL", "author_site": "Benjamin Schneider, Nils Lukas, Florian Kerschbaum", "tldr": "", "abstract": "Web-scraped datasets are vulnerable to data poisoning, which can be used for backdooring deep image classifiers during training. Since training on large datasets is expensive, a model is trained once and reused many times. Unlike adversarial examples, backdoor attacks often target specific classes rather than any class learned by the model. One might expect that targeting many classes through a na\u00efve composition of attacks vastly increases the number of poison samples. We show this is not necessarily true and more efficient, \n _universal_ data poisoning attacks exist that allow controlling misclassifications from any source class into any target class with a slight increase in poison samples. Our idea is to generate triggers with salient characteristics that the model can learn. The triggers we craft exploit a phenomenon we call _inter-class poison transferability_, where learning a trigger from one class makes the model more vulnerable to learning triggers for other classes. 
We demonstrate the effectiveness and robustness of our universal backdoor attacks by controlling models with up to 6,000 classes while poisoning only 0.15% of the training dataset.", "keywords": "Backdoor;Data poisoning;Integrity;Image Classification", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "Benjamin Schneider;Nils Lukas;Florian Kerschbaum", "authorids": "~Benjamin_Schneider1;~Nils_Lukas1;~Florian_Kerschbaum1", "gender": "M;M;", "homepage": "https://github.com/Ben-Schneider-code;https://nilslukas.github.io;", "dblp": "55/9497;;", "google_scholar": ";https://scholar.google.com/citations?hl=de;", "orcid": ";;", "linkedin": ";;", "or_profile": "~Benjamin_Schneider1;~Nils_Lukas1;~Florian_Kerschbaum1", "aff": "University of Waterloo;University of Waterloo;", "aff_domain": "uwaterloo.ca;uwaterloo.ca;", "position": "MS student;PhD student;", "bibtex": "@inproceedings{\nschneider2024universal,\ntitle={Universal Backdoor Attacks},\nauthor={Benjamin Schneider and Nils Lukas and Florian Kerschbaum},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=3QkzYBSWqL}\n}", "github": "", "project": "", "reviewers": "Xx2A;czTr;EfVD;H32b", "pdf_size": 556822, "rating": "5;5;6;6", "confidence": "3;3;4;4", "soundness": "3;2;2;4", "contribution": "2;2;3;3", "presentation": "2;3;2;4", "wc_summary": "56;54;206;92", "wc_strengths": "36;13;34;40", "wc_weaknesses": "239;20;155;386", "wc_questions": "78;223;59;49", "wc_review": "409;310;454;567", "wc_reply_reviewers": "0;0;157;44", "wc_reply_authors": "1231;1151;778;1659", "reply_reviewers": "0;0;1;1", "reply_authors": "2;3;2;3", "rating_avg": [ 5.5, 0.5 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.75, 0.82915619758885 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.75, 0.82915619758885 ], "wc_summary_avg": [ 102.0, 61.91930232165088 ], "wc_strengths_avg": [ 30.75, 10.473180032826706 ], "wc_weaknesses_avg": [ 200.0, 132.79871987334818 ], "wc_questions_avg": [ 102.25, 70.48891756865046 ], "wc_review_avg": [ 435.0, 92.31197105467957 ], "wc_reply_reviewers_avg": [ 50.25, 64.19647575996676 ], "wc_reply_authors_avg": [ 1204.75, 313.06419070216253 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 2.5, 0.5 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 1.0, "gs_citation": 5, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10538171199816605357&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=3QkzYBSWqL", "pdf": "https://openreview.net/pdf?id=3QkzYBSWqL", "email": "uwaterloo.ca;uwaterloo.ca;", "author_num": 3, "aff_unique_index": "0;0", "aff_unique_norm": "University of Waterloo", "aff_unique_dep": "", "aff_unique_url": "https://uwaterloo.ca", "aff_unique_abbr": "UW", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "Canada" }, { "title": "Grokking as a First Order Phase Transition in Two Layer Networks", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19513", "id": "3ROGsTX3IR", "author_site": "Noa Rubin, Inbar Seroussi, Zohar Ringel", "tldr": "", "abstract": "A key property of deep neural networks (DNNs) is their ability to learn new features during training. This intriguing aspect of deep learning stands out most clearly in recently reported Grokking phenomena. 
While mainly reflected as a sudden increase in test accuracy, Grokking is also believed to be a beyond lazy-learning/Gaussian Process (GP) phenomenon involving feature learning. Here we apply a recent development in the theory of feature learning, the adaptive kernel approach, to two teacher-student models with cubic-polynomial and modular addition teachers. We provide analytical predictions on feature learning and Grokking properties of these models and demonstrate a mapping between Grokking and the theory of phase transitions. We show that after Grokking, the state of the DNN is analogous to the mixed phase following a first-order phase transition. In this mixed phase, the DNN generates useful internal representations of the teacher that are sharply distinct from those before the transition.", "keywords": "Grokking;deep neural networks;Gaussian Process;phase transitions", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Noa Rubin;Inbar Seroussi;Zohar Ringel", "authorids": "~Noa_Rubin1;~Inbar_Seroussi1;~Zohar_Ringel1", "gender": "F;F;M", "homepage": "https://phys.huji.ac.il/people/noa-rubin;https://sites.google.com/view/inbar-seroussi/home;http://old.phys.huji.ac.il/~zohar.ringel/", "dblp": ";;", "google_scholar": ";https://scholar.google.co.il/citations?user=t_Qe0CMAAAAJ;https://scholar.google.co.il/citations?user=8-8VIDgAAAAJ", "orcid": ";;", "linkedin": ";;", "or_profile": "~Noa_Rubin1;~Inbar_Seroussi1;~Zohar_Ringel1", "aff": "Hebrew University of Jerusalem;Tel Aviv University;Hebrew University of Jerusalem, Israel", "aff_domain": "huji.ac.il;tau.ac.il;huji.ac.il", "position": "MS student;Assistant Professor;Associate Professor", "bibtex": "@inproceedings{\nrubin2024grokking,\ntitle={Grokking as a First Order Phase Transition in Two Layer Networks},\nauthor={Noa Rubin and Inbar Seroussi and Zohar Ringel},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=3ROGsTX3IR}\n}", "github": "", "project": "", "reviewers": "t2DF;iD3W;64Ja;PXdZ;MgBg", "pdf_size": 23077248, "rating": "3;6;6;6;8", "confidence": "3;3;4;4;4", "soundness": "2;3;2;3;3", "contribution": "2;2;3;2;4", "presentation": "1;3;4;3;2", "wc_summary": "68;75;57;55;273", "wc_strengths": "18;7;51;57;79", "wc_weaknesses": "286;89;187;185;184", "wc_questions": "28;3;164;193;494", "wc_review": "400;174;459;490;1030", "wc_reply_reviewers": "0;103;138;42;121", "wc_reply_authors": "1018;531;1229;1099;1313", "reply_reviewers": "0;1;1;1;1", "reply_authors": "2;2;3;3;3", "rating_avg": [ 5.8, 1.6 ], "confidence_avg": [ 3.6, 0.4898979485566356 ], "soundness_avg": [ 2.6, 0.4898979485566356 ], "contribution_avg": [ 2.6, 0.8 ], "presentation_avg": [ 2.6, 1.019803902718557 ], "wc_summary_avg": [ 105.6, 84.0180932894814 ], "wc_strengths_avg": [ 42.4, 26.363611285254528 ], "wc_weaknesses_avg": [ 186.2, 62.313401447842665 ], "wc_questions_avg": [ 176.4, 175.15090636362692 ], "wc_review_avg": [ 510.6, 282.2747597643119 ], "wc_reply_reviewers_avg": [ 80.8, 51.79729722678588 ], "wc_reply_authors_avg": [ 1038.0, 273.2310377684058 ], "reply_reviewers_avg": [ 0.8, 0.4000000000000001 ], "reply_authors_avg": [ 2.6, 0.4898979485566356 ], "replies_avg": [ 26, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.6634034720037775, "gs_citation": 12, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=3441025740091630117&as_sdt=400005&sciodt=0,14&hl=en", "gs_version_total": 3, "openreview": 
"https://openreview.net/forum?id=3ROGsTX3IR", "pdf": "https://openreview.net/pdf?id=3ROGsTX3IR", "email": "huji.ac.il;tau.ac.il;huji.ac.il", "author_num": 3, "aff_unique_index": "0;1;0", "aff_unique_norm": "Hebrew University of Jerusalem;Tel Aviv University", "aff_unique_dep": ";", "aff_unique_url": "https://www.huji.ac.il;https://www.tau.ac.il", "aff_unique_abbr": "HUJI;TAU", "aff_campus_unique_index": "0", "aff_campus_unique": "Jerusalem;", "aff_country_unique_index": "0;0;0", "aff_country_unique": "Israel" }, { "id": "3RfGSbXUt8", "title": "Option Boosting", "track": "main", "status": "Reject", "tldr": "", "abstract": "We introduce a novel approach to enhance stability and knowledge transfer in multi-task hierarchical reinforcement learning, specifically within the options framework. Modern Hierarchical Reinforcement Learning (HRL) algorithms can be prone to instability, due to the multilevel nature of the optimization process. To improve stability, we draw inspiration from boosting methods in supervised learning and propose a method which progressively introduces new options, while older options are kept fixed. In order to encourage generalization, each option policy has limited expressiveness. In order to improve knowledge transfer, we introduce the \\textit{Option Library}, a mechanism to share options across a population of agents. Our approach improves learning stability and allows agents to leverage knowledge from simple tasks in order to explore and perform more complex tasks. We evaluate our algorithm in MiniGrid and CraftingWorld, two pixel-based 2D grid-world environments designed for goal-oriented tasks, which allows compositional solutions.", "keywords": "Hierarchical Reinforcement Learning;Multi-Task Reinforcement Learning", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Manuel Del Verme;Doina Precup", "authorids": "~Manuel_Del_Verme1;~Doina_Precup1", "gender": ";F", "homepage": ";http://cs.mcgill.ca/~dprecup/", "dblp": ";p/DoinaPrecup", "google_scholar": "JcOwyS0AAAAJ;https://scholar.google.com.tw/citations?user=j54VcVEAAAAJ", "orcid": ";", "linkedin": ";", "or_profile": "~Manuel_Del_Verme1;~Doina_Precup1", "aff": "Montreal Institute for Learning Algorithms, University of Montreal, University of Montreal;McGill University", "aff_domain": "mila.umontreal.ca;mcgill.ca", "position": "PhD student;Associate Professor", "bibtex": "@misc{\nverme2024option,\ntitle={Option Boosting},\nauthor={Manuel Del Verme and Doina Precup},\nyear={2024},\nurl={https://openreview.net/forum?id=3RfGSbXUt8}\n}", "github": "", "project": "", "reviewers": "Sp3D;Jjah;ZULE", "site": "https://openreview.net/forum?id=3RfGSbXUt8", "pdf_size": 413492, "rating": "3;3;5", "confidence": "4;4;3", "soundness": "2;3;2", "contribution": "2;2;2", "presentation": "1;2;3", "wc_summary": "55;61;101", "wc_strengths": "35;52;64", "wc_weaknesses": "133;199;53", "wc_questions": "92;111;46", "wc_review": "315;423;264", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 3.6666666666666665, 0.9428090415820634 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.0, 0.816496580927726 ], "wc_summary_avg": [ 72.33333333333333, 20.417857108151406 ], "wc_strengths_avg": [ 50.333333333333336, 11.897712198383164 ], "wc_weaknesses_avg": [ 128.33333333333334, 59.69552374806301 ], 
"wc_questions_avg": [ 83.0, 27.28858125052797 ], "wc_review_avg": [ 334.0, 66.2872536767062 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -1.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:5qxNTHtR17AJ:scholar.google.com/&scioq=Option+Boosting&hl=en&as_sdt=0,23", "gs_version_total": 0, "aff_unique_index": "0;1", "aff_unique_norm": "University of Montreal;McGill University", "aff_unique_dep": "Montreal Institute for Learning Algorithms;", "aff_unique_url": "https://www.umontreal.ca;https://www.mcgill.ca", "aff_unique_abbr": "UM;McGill", "aff_campus_unique_index": "0", "aff_campus_unique": "Montreal;", "aff_country_unique_index": "0;0", "aff_country_unique": "Canada" }, { "title": "Generalization error of spectral algorithms", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19512", "id": "3SJE1WLB4M", "author_site": "Maksim Velikanov, Maxim Panov, Dmitry Yarotsky", "tldr": "", "abstract": "The asymptotically precise estimation of the generalization of kernel methods has recently received attention due to the parallels between neural networks and their associated kernels. However, prior works derive such estimates for training by kernel ridge regression (KRR), whereas neural networks are typically trained with gradient descent (GD). In the present work, we consider the training of kernels with a family of \\emph{spectral algorithms} specified by profile $h(\\lambda)$, and including KRR and GD as special cases. Then, we derive the generalization error as a functional of learning profile $h(\\lambda)$ for two data models: high-dimensional Gaussian and low-dimensional translation-invariant model. \nUnder power-law assumptions on the spectrum of the kernel and target, we use our framework to (i) give full loss asymptotics for both noisy and noiseless observations (ii) show that the loss localizes on certain spectral scales, giving a new perspective on the KRR saturation phenomenon (iii) conjecture, and demonstrate for the considered data models, the universality of the loss w.r.t. 
non-spectral details of the problem, but only in case of noisy observation.", "keywords": "gradient descent;kernel ridge regression;optimal algorithm;generalization;asymptotic error rates;power-laws", "primary_area": "learning theory", "supplementary_material": "", "author": "Maksim Velikanov;Maxim Panov;Dmitry Yarotsky", "authorids": "~Maksim_Velikanov1;~Maxim_Panov1;~Dmitry_Yarotsky1", "gender": "M;M;M", "homepage": ";;http://yarotsky.info", "dblp": "292/3286;30/10085;132/4661", "google_scholar": "OrWWVcUAAAAJ;https://scholar.google.ru/citations?user=BqDhGJQAAAAJ;https://scholar.google.ru/citations?user=wNSSr_gAAAAJ", "orcid": ";;", "linkedin": ";;", "or_profile": "~Maksim_Velikanov1;~Maxim_Panov1;~Dmitry_Yarotsky1", "aff": "\u00c9cole Polytechnique;Institute for Information Transmission Problems;Skolkovo Institute of Science and Technology", "aff_domain": "polytechnique.fr;iitp.ru;skoltech.ru", "position": "PhD student;Researcher;Full Professor", "bibtex": "@inproceedings{\nvelikanov2024generalization,\ntitle={Generalization error of spectral algorithms},\nauthor={Maksim Velikanov and Maxim Panov and Dmitry Yarotsky},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=3SJE1WLB4M}\n}", "github": "", "project": "", "reviewers": "wTWc;jkPS;v7ue", "pdf_size": 737467, "rating": "8;8;8", "confidence": "3;3;2", "soundness": "3;4;3", "contribution": "3;4;3", "presentation": "3;3;3", "wc_summary": "88;97;26", "wc_strengths": "55;90;22", "wc_weaknesses": "135;51;32", "wc_questions": "207;27;17", "wc_review": "485;265;97", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "1091;286;117", "reply_reviewers": "0;0;0", "reply_authors": "2;1;1", "rating_avg": [ 8.0, 0.0 ], "confidence_avg": [ 2.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 3.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 3.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 70.33333333333333, 31.562988170042175 ], "wc_strengths_avg": [ 55.666666666666664, 27.764885897278397 ], "wc_weaknesses_avg": [ 72.66666666666667, 44.7536466546458 ], "wc_questions_avg": [ 83.66666666666667, 87.3053390247253 ], "wc_review_avg": [ 282.3333333333333, 158.87381435871959 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 498.0, 424.9525463703761 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.3333333333333333, 0.4714045207910317 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:ONrYOG02T8AJ:scholar.google.com/&scioq=Generalization+error+of+spectral+algorithms&hl=en&as_sdt=0,5", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=3SJE1WLB4M", "pdf": "https://openreview.net/pdf?id=3SJE1WLB4M", "email": "polytechnique.fr;iitp.ru;skoltech.ru", "author_num": 3, "aff_unique_index": "0;1;2", "aff_unique_norm": "Ecole Polytechnique;Institute for Information Transmission Problems;Skolkovo Institute of Science and Technology", "aff_unique_dep": ";;", "aff_unique_url": "https://www.polytechnique.edu;http://www.iitp.ru;https://www.skoltech.ru", "aff_unique_abbr": "X;;Skoltech", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;1", "aff_country_unique": "France;Russian Federation" }, { "id": "3SqnZXg24T", "title": "RetinexGAN Enables More Robust Low-Light Image Enhancement Via Retinex Decomposition Based Unsupervised 
Illumination Brightening", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Most existing image enhancement techniques rely heavily on strict supervision of paired images. Moreover, unsupervised enhancement methods also face challenges in achieving a balance between model performance and efficiency when handling real-world low-light images in unknown complex scenarios. Herein, we present a novel low-light image enhancement scheme termed \\textbf{RetinexGAN} that can leverage the supervision of a limited number of low-light/normal image pairs to realize an accurate Retinex decomposition, and based on this, achieve brightening the illumination of unpaired images to reduce dependence on paired datasets and improve generalization ability. The decomposition network is learned with some newly established constraints for complete decoupling between reflectance and illumination. For the first time, we introduce the feature pyramid network (FPN) to adjust the illumination maps of other low-light images without any supervision. Under this flexible framework, a wide range of backbones can be employed to work with illumination map generator, to navigate the balance between performance and efficiency. In addition, a novel attention mechanism is integrated into the FPN for giving the adaptability towards application scenes with different environment like underwater image enhancement (UIE) and dark face detection. Extensive experiments demonstrate that our proposed scheme has a more robust performance with high efficiency facing various images from different low-light environments over state-of-the-art methods.", "keywords": "low-light image enhancement;Retinex decomposition;feature pyramid network (FPN);attention mechanism;unsupervised illumination brightening", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Ruiqi Mao;Rongxin Cui", "authorids": "~Ruiqi_Mao1;~Rongxin_Cui1", "gender": "M;M", "homepage": "https://github.com/Ruiqi-Mao;", "dblp": ";05/7736.html", "google_scholar": ";https://scholar.google.com/citations?hl=en", "orcid": ";0000-0002-8006-3620", "linkedin": ";", "or_profile": "~Ruiqi_Mao1;~Rongxin_Cui1", "aff": "Northwest Polytechnical University Xi'an;Northwestern Polytechnical University Xi'an", "aff_domain": "nwpu.edu.cn;nwpu.edu.cn", "position": "PhD student;Full Professor", "bibtex": "@misc{\nmao2024retinexgan,\ntitle={Retinex{GAN} Enables More Robust Low-Light Image Enhancement Via Retinex Decomposition Based Unsupervised Illumination Brightening},\nauthor={Ruiqi Mao and Rongxin Cui},\nyear={2024},\nurl={https://openreview.net/forum?id=3SqnZXg24T}\n}", "github": "", "project": "", "reviewers": "tFmg;p4zt;TqR9;6g5x", "site": "https://openreview.net/forum?id=3SqnZXg24T", "pdf_size": 30220609, "rating": "1;3;3;3", "confidence": "5;4;5;5", "soundness": "1;3;2;2", "contribution": "1;2;1;2", "presentation": "2;3;2;2", "wc_summary": "59;33;54;63", "wc_strengths": "30;23;22;36", "wc_weaknesses": "353;68;127;202", "wc_questions": "4;4;24;10", "wc_review": "446;128;227;311", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "705;349;514;551", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 2.5, 0.8660254037844386 ], "confidence_avg": [ 4.75, 0.4330127018922193 ], "soundness_avg": [ 2.0, 0.7071067811865476 ], "contribution_avg": [ 1.5, 0.5 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 52.25, 11.562331079847178 ], "wc_strengths_avg": [ 
27.75, 5.673402858955108 ], "wc_weaknesses_avg": [ 187.5, 106.70168695948533 ], "wc_questions_avg": [ 10.5, 8.170067319184096 ], "wc_review_avg": [ 278.0, 116.63404305776251 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 529.75, 126.57285451470233 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 8, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.3333333333333333, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:WEGobSqFmSAJ:scholar.google.com/&scioq=RetinexGAN+Enables+More+Robust+Low-Light+Image+Enhancement+Via+Retinex+Decomposition+Based+Unsupervised+Illumination+Brightening&hl=en&as_sdt=0,7", "gs_version_total": 0, "aff_unique_index": "0;1", "aff_unique_norm": "Northwest Polytechnical University;Northwestern Polytechnical University", "aff_unique_dep": ";", "aff_unique_url": "http://www.nwpu.edu.cn;http://www.nwpu.edu.cn", "aff_unique_abbr": "NWPU;NWPU", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Xi'an", "aff_country_unique_index": "0;0", "aff_country_unique": "China" }, { "id": "3TAhlGaMKD", "title": "Last One Standing: A Comparative Analysis of Security and Privacy of Soft Prompt Tuning, LoRA, and In-Context Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "Large Language Models (LLMs) are powerful tools for natural language processing, enabling novel applications and user experiences. However, to achieve optimal performance, LLMs often require adaptation with private data, which poses privacy and security challenges. Several techniques have been proposed to adapt LLMs with private data, such as Low-Rank Adaptation (LoRA), Soft Prompt Tuning (SPT), and In-Context Learning (ICL), but their comparative privacy and security properties have not been systematically investigated. In this work, we fill this gap by evaluating the robustness of LoRA, SPT, and ICL against three types of well-established attacks: membership inference, which exposes data leakage (privacy); backdoor, which injects malicious behavior (security); and model stealing, which can violate intellectual property (privacy and security). 
Our results show that there is no silver bullet for privacy and security in LLM adaptation and each technique has different strengths and weaknesses.", "keywords": "Large Language Models;Privacy;Security;Model Stealing Attack;Membership Inference Attack;Backdoor Attack;Low-Rank Adaptation;Soft Prompt Tuning;In-Context Learning", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "Rui Wen;Tianhao Wang;Michael Backes;Yang Zhang;Ahmed Salem", "authorids": "~Rui_Wen3;~Tianhao_Wang3;~Michael_Backes3;~Yang_Zhang15;~Ahmed_Salem2", "gender": "M;M;;M;", "homepage": "https://ruiwen-ai.github.io/;https://tianhao.wang;;https://yangzhangalmo.github.io/;", "dblp": "63/10765-2;https://dblp.uni-trier.de/pid/145/3288-1.html;;06/6785-16;", "google_scholar": "https://scholar.google.com/citations?hl=en;TkgyXGwAAAAJ;;Xeb2888AAAAJ;", "orcid": "0009-0009-0691-7569;;;0000-0003-3612-7348;", "linkedin": ";;;;", "or_profile": "~Rui_Wen3;~Tianhao_Wang3;~Michael_Backes3;~Yang_Zhang15;~Ahmed_Salem2", "aff": "CISPA Helmholtz Center for Information Security;University of Virginia, Charlottesville;;CISPA Helmholtz Center for Information Security;", "aff_domain": "cispa.de;virginia.edu;;cispa.de;", "position": "PhD student;Assistant Professor;;Full Professor;", "bibtex": "@misc{\nwen2024last,\ntitle={Last One Standing: A Comparative Analysis of Security and Privacy of Soft Prompt Tuning, Lo{RA}, and In-Context Learning},\nauthor={Rui Wen and Tianhao Wang and Michael Backes and Yang Zhang and Ahmed Salem},\nyear={2024},\nurl={https://openreview.net/forum?id=3TAhlGaMKD}\n}", "github": "", "project": "", "reviewers": "FB1d;J1hc;JTKU;RTpz", "site": "https://openreview.net/forum?id=3TAhlGaMKD", "pdf_size": 759382, "rating": "1;5;5;8", "confidence": "4;3;3;4", "soundness": "1;3;3;3", "contribution": "1;2;2;3", "presentation": "3;4;3;3", "wc_summary": "47;49;16;113", "wc_strengths": "56;45;27;60", "wc_weaknesses": "210;98;83;140", "wc_questions": "18;174;1;118", "wc_review": "331;366;127;431", "wc_reply_reviewers": "0;18;0;87", "wc_reply_authors": "704;876;255;562", "reply_reviewers": "0;1;0;2", "reply_authors": "2;2;2;3", "rating_avg": [ 4.75, 2.48746859276655 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.5, 0.8660254037844386 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 56.25, 35.280128968018246 ], "wc_strengths_avg": [ 47.0, 12.786711852544421 ], "wc_weaknesses_avg": [ 132.75, 49.25126901918366 ], "wc_questions_avg": [ 77.75, 71.3175118747142 ], "wc_review_avg": [ 313.75, 113.63400679374111 ], "wc_reply_reviewers_avg": [ 26.25, 35.83556194620087 ], "wc_reply_authors_avg": [ 599.25, 227.73819947474774 ], "reply_reviewers_avg": [ 0.75, 0.82915619758885 ], "reply_authors_avg": [ 2.25, 0.4330127018922193 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.10050378152592121, "gs_citation": 10, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=18014859622824349825&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "aff_unique_index": "0;1;0", "aff_unique_norm": "CISPA Helmholtz Center for Information Security;University of Virginia", "aff_unique_dep": ";", "aff_unique_url": "https://www.cispa.de/;https://www.virginia.edu", "aff_unique_abbr": "CISPA;UVA", "aff_campus_unique_index": "1", "aff_campus_unique": ";Charlottesville", "aff_country_unique_index": "0;1;0", "aff_country_unique": "Germany;United States" }, { "title": "BTR: Binary 
Token Representations for Efficient Retrieval Augmented Language Models", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19511", "id": "3TO3TtnOFl", "author_site": "Qingqing Cao, Sewon Min, Yizhong Wang, Hannaneh Hajishirzi", "tldr": "", "abstract": "Retrieval augmentation addresses many critical problems in large language models such as hallucination, staleness, and privacy leaks.\nHowever, running retrieval-augmented language models (LMs) is slow and difficult to scale due to processing large amounts of retrieved text. \nWe introduce binary token representations (BTR), which use 1-bit vectors to precompute every token in passages, significantly reducing computation during inference. \nDespite the potential loss of accuracy, our new calibration techniques and training objectives restore performance. Combined with offline and runtime compression, this only requires 127GB of disk space for encoding 3 billion tokens in Wikipedia.\nOur experiments show that on five knowledge-intensive NLP tasks, BTR accelerates state-of-the-art inference by up to 4x and reduces storage by over 100x while maintaining over 95% task performance. Our code is publicly available at https://github.com/csarron/BTR.", "keywords": "language models;question answering;binary representations;retrieval-augmented language models", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Qingqing Cao;Sewon Min;Yizhong Wang;Hannaneh Hajishirzi", "authorids": "~Qingqing_Cao1;~Sewon_Min1;~Yizhong_Wang2;~Hannaneh_Hajishirzi1", "gender": "M;F;M;F", "homepage": "https://awk.ai/;https://www.sewonmin.com;https://yizhong-wang.com;https://homes.cs.washington.edu/~hannaneh/", "dblp": ";203/9401;79/3601;52/1296", "google_scholar": "vLpPyUUAAAAJ;https://scholar.google.ca/citations?user=jU4IZs4AAAAJ;y5zpqdAAAAAJ;LOV6_WIAAAAJ", "orcid": "0000-0002-8564-9241;;;", "linkedin": "qqcao;;;", "or_profile": "~Qingqing_Cao1;~Sewon_Min1;~Yizhong_Wang2;~Hannaneh_Hajishirzi1", "aff": "University of Washington, Seattle;Department of Computer Science, University of Washington;Department of Computer Science, University of Washington;University of Washington", "aff_domain": "uw.edu;cs.washington.edu;cs.washington.edu;uw.edu", "position": "Postdoc;PhD student;PhD student;Associate Professor", "bibtex": "@inproceedings{\ncao2024btr,\ntitle={{BTR}: Binary Token Representations for Efficient Retrieval Augmented Language Models},\nauthor={Qingqing Cao and Sewon Min and Yizhong Wang and Hannaneh Hajishirzi},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=3TO3TtnOFl}\n}", "github": "", "project": "", "reviewers": "PDbq;U3RY;X7Hc;KKL3", "pdf_size": 597161, "rating": "6;6;6;8", "confidence": "4;3;3;4", "soundness": "3;2;3;3", "contribution": "3;3;3;4", "presentation": "4;3;3;3", "wc_summary": "83;93;55;225", "wc_strengths": "118;87;76;75", "wc_weaknesses": "100;171;98;323", "wc_questions": "124;96;34;53", "wc_review": "425;447;263;676", "wc_reply_reviewers": "91;173;0;122", "wc_reply_authors": "670;532;567;789", "reply_reviewers": "1;1;0;1", "reply_authors": "2;1;1;1", "rating_avg": [ 6.5, 0.8660254037844386 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 3.25, 0.4330127018922193 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 114.0, 65.58200972827838 ], "wc_strengths_avg": [ 
89.0, 17.392527130926087 ], "wc_weaknesses_avg": [ 173.0, 91.45764046814242 ], "wc_questions_avg": [ 76.75, 35.336772631353874 ], "wc_review_avg": [ 452.75, 147.1807986797191 ], "wc_reply_reviewers_avg": [ 96.5, 62.93846200853656 ], "wc_reply_authors_avg": [ 639.5, 100.11618250812403 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.5773502691896257, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14156270123239045267&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=3TO3TtnOFl", "pdf": "https://openreview.net/pdf?id=3TO3TtnOFl", "email": "uw.edu;cs.washington.edu;cs.washington.edu;uw.edu", "author_num": 4, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "University of Washington", "aff_unique_dep": "", "aff_unique_url": "https://www.washington.edu", "aff_unique_abbr": "UW", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Seattle;", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "title": "Learning Planning Abstractions from Language", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19510", "id": "3UWuFoksGb", "author_site": "Weiyu Liu, Geng Chen, Joy Hsu, Jiayuan Mao, Jiajun Wu", "tldr": "", "abstract": "This paper presents a framework for learning state and action abstractions in sequential decision-making domains. Our framework, planning abstraction from language (PARL), utilizes language-annotated demonstrations to automatically discover a symbolic and abstract action space and induce a latent state abstraction based on it. PARL consists of three stages: 1) recovering object-level and action concepts, 2) learning state abstractions, abstract action feasibility, and transition models, and 3) applying low-level policies for abstract actions. During inference, given the task description, PARL first makes abstract action plans using the latent transition and feasibility functions, then refines the high-level plan using low-level policies. 
PARL generalizes across scenarios involving novel object instances and environments, unseen concept compositions, and tasks that require longer planning horizons than settings it is trained on.", "keywords": "Planning and Learning;Learning Abstractions;Compositional Generalization;Robotic Manipulation", "primary_area": "applications to robotics, autonomy, planning", "supplementary_material": "", "author": "Weiyu Liu;Geng Chen;Joy Hsu;Jiayuan Mao;Jiajun Wu", "authorids": "~Weiyu_Liu1;~Geng_Chen3;~Joy_Hsu2;~Jiayuan_Mao1;~Jiajun_Wu1", "gender": "M;M;F;F;M", "homepage": "http://weiyuliu.com/;https://jc043.github.io/;https://web.stanford.edu/~joycj/;http://jiayuanm.com;https://jiajunwu.com", "dblp": "133/0311.html;;258/5012;200/8283;117/4768", "google_scholar": "PHi0YEQAAAAJ;;Zr7RJT4AAAAJ;-xaOIZIAAAAJ;2efgcS0AAAAJ", "orcid": ";;;0000-0003-4798-3748;0000-0002-4176-343X", "linkedin": ";;;;jiajunwu/", "or_profile": "~Weiyu_Liu1;~Geng_Chen3;~Joy_Hsu2;~Jiayuan_Mao1;~Jiajun_Wu1", "aff": "Stanford University;University of California, San Diego;Stanford University;Massachusetts Institute of Technology;Stanford University", "aff_domain": "stanford.edu;ucsd.edu;stanford.edu;mit.edu;stanford.edu", "position": "Postdoc;MS student;PhD student;PhD student;Assistant Professor", "bibtex": "@inproceedings{\nliu2024learning,\ntitle={Learning Planning Abstractions from Language},\nauthor={Weiyu Liu and Geng Chen and Joy Hsu and Jiayuan Mao and Jiajun Wu},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=3UWuFoksGb}\n}", "github": "", "project": "", "reviewers": "Q2SJ;B6My;NUXY;V9Cw", "pdf_size": 1089365, "rating": "3;5;6;8", "confidence": "3;3;4;3", "soundness": "2;2;3;3", "contribution": "2;2;2;3", "presentation": "2;3;3;3", "wc_summary": "197;209;66;51", "wc_strengths": "103;74;28;107", "wc_weaknesses": "67;486;249;31", "wc_questions": "409;150;70;2", "wc_review": "776;919;413;191", "wc_reply_reviewers": "32;33;96;14", "wc_reply_authors": "1995;644;1573;168", "reply_reviewers": "1;1;2;1", "reply_authors": "4;1;5;1", "rating_avg": [ 5.5, 1.8027756377319946 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 130.75, 72.56850212041034 ], "wc_strengths_avg": [ 78.0, 31.551545128567 ], "wc_weaknesses_avg": [ 208.25, 180.39869040544613 ], "wc_questions_avg": [ 157.75, 154.22771313872224 ], "wc_review_avg": [ 574.75, 288.2866412097515 ], "wc_reply_reviewers_avg": [ 43.75, 31.09963826156182 ], "wc_reply_authors_avg": [ 1095.0, 724.778241947149 ], "reply_reviewers_avg": [ 1.25, 0.4330127018922193 ], "reply_authors_avg": [ 2.75, 1.7853571071357126 ], "replies_avg": [ 23, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.16012815380508713, "gs_citation": 4, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=15050195618124764063&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=3UWuFoksGb", "pdf": "https://openreview.net/pdf?id=3UWuFoksGb", "email": "stanford.edu;ucsd.edu;stanford.edu;mit.edu;stanford.edu", "author_num": 5, "aff_unique_index": "0;1;0;2;0", "aff_unique_norm": "Stanford University;University of California, San Diego;Massachusetts Institute of Technology", "aff_unique_dep": ";;", "aff_unique_url": "https://www.stanford.edu;https://www.ucsd.edu;https://web.mit.edu", "aff_unique_abbr": "Stanford;UCSD;MIT", 
"aff_campus_unique_index": "0;1;0;0", "aff_campus_unique": "Stanford;San Diego;", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "United States" }, { "title": "Fusion Is Not Enough: Single Modal Attacks on Fusion Models for 3D Object Detection", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19509", "id": "3VD4PNEt5q", "author_site": "Zhiyuan Cheng, Hongjun Choi, Shiwei Feng, James Liang, Guanhong Tao, Dongfang Liu, Michael Zuzak, Xiangyu Zhang", "tldr": "", "abstract": "Multi-sensor fusion (MSF) is widely used in autonomous vehicles (AVs) for perception, particularly for 3D object detection with camera and LiDAR sensors. The purpose of fusion is to capitalize on the advantages of each modality while minimizing its weaknesses. Advanced deep neural network (DNN)-based fusion techniques have demonstrated the exceptional and industry-leading performance. Due to the redundant information in multiple modalities, MSF is also recognized as a general defence strategy against adversarial attacks. \nIn this paper, we attack fusion models from the camera modality that is considered to be of lesser importance in fusion but is more affordable for attackers. We argue that the weakest link of fusion models depends on their most vulnerable modality and propose an attack framework that targets advanced camera-LiDAR fusion-based 3D object detection models through camera-only adversarial attacks. \nOur approach employs a two-stage optimization-based strategy that first thoroughly evaluates vulnerable image areas under adversarial attacks, and then applies dedicated attack strategies for different fusion models to generate deployable patches. The evaluations with six advanced camera-LiDAR fusion models and one camera-only model indicate that our attacks successfully compromise all of them. Our approach can either decrease the mean average precision (mAP) of detection performance from 0.824 to 0.353 or degrade the detection score of a target object from 0.728 to 0.156, demonstrating the efficacy of our proposed attack framework. 
Code is available.", "keywords": "Adversarial Attacks;3D Object Detection;Autonomous Driving", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/2bd5ecf53634e87ceeecc8fd1736137e4820d36d.zip", "author": "Zhiyuan Cheng;Hongjun Choi;Shiwei Feng;James Chenhao Liang;Guanhong Tao;Dongfang Liu;Michael Zuzak;Xiangyu Zhang", "authorids": "~Zhiyuan_Cheng2;~Hongjun_Choi3;~Shiwei_Feng1;~James_Chenhao_Liang1;~Guanhong_Tao1;~Dongfang_Liu1;~Michael_Zuzak1;~Xiangyu_Zhang3", "gender": "M;;M;M;;;Not Specified;M", "homepage": "https://bob-cheng.github.io;https://hongjun9.github.io/;https://www.cs.purdue.edu/homes/feng292/;https://jamesliang819.github.io/;;https://www.rit.edu/directory/dxleec-dongfang-liu;https://mzuzak.github.io/;https://www.cs.purdue.edu/homes/xyzhang", "dblp": "324/1963;;138/9141-2;323/3403;;;;", "google_scholar": "dVchB-gAAAAJ;;https://scholar.google.com/citations?hl=en;cR8m4CcAAAAJ;;uICY0vEAAAAJ;dESHYYcAAAAJ;PXbu1wIAAAAJ", "orcid": "0000-0001-7280-6079;;0000-0001-6959-4327;;;;;", "linkedin": "bobchengzy/;;swfeng98/;;;;michael-zuzak/;", "or_profile": "~Zhiyuan_Cheng2;~Hongjun_Choi3;~Shiwei_Feng1;~James_Chenhao_Liang1;~Guanhong_Tao1;~Dongfang_Liu1;~Michael_Zuzak1;~Xiangyu_Zhang3", "aff": "Purdue University;Daegu Gyeongbuk Institute of Science and Technology;Purdue University;Rochester Institute of Technology;;Rochester Institute of Technology;Rochester Institute of Technology;Purdue University", "aff_domain": "purdue.edu;dgist.ac.kr;cs.purdue.edu;rit.edu;;rit.edu;rit.edu;cs.purdue.edu", "position": "PhD student;Assistant Professor;PhD student;PhD student;;Assistant Professor;Assistant Professor;Full Professor", "bibtex": "@inproceedings{\ncheng2024fusion,\ntitle={Fusion Is Not Enough: Single Modal Attacks on Fusion Models for 3D Object Detection},\nauthor={Zhiyuan Cheng and Hongjun Choi and Shiwei Feng and James Chenhao Liang and Guanhong Tao and Dongfang Liu and Michael Zuzak and Xiangyu Zhang},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=3VD4PNEt5q}\n}", "github": "", "project": "", "reviewers": "qqbx;DXNR;QA2X;nx8r", "pdf_size": 12839495, "rating": "5;6;6;8", "confidence": "4;3;4;4", "soundness": "2;3;3;3", "contribution": "3;2;3;3", "presentation": "3;2;4;3", "wc_summary": "65;50;75;31", "wc_strengths": "44;52;152;36", "wc_weaknesses": "422;145;190;124", "wc_questions": "142;59;191;12", "wc_review": "673;306;608;203", "wc_reply_reviewers": "73;390;0;93", "wc_reply_authors": "2262;1963;1134;867", "reply_reviewers": "1;4;0;2", "reply_authors": "4;7;2;3", "rating_avg": [ 6.25, 1.0897247358851685 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 55.25, 16.588776326179094 ], "wc_strengths_avg": [ 71.0, 47.10626285325551 ], "wc_weaknesses_avg": [ 220.25, 118.89570009045744 ], "wc_questions_avg": [ 101.0, 69.76030389842063 ], "wc_review_avg": [ 447.5, 197.7454171403221 ], "wc_reply_reviewers_avg": [ 139.0, 148.9916105020682 ], "wc_reply_authors_avg": [ 1556.5, 573.7789208397255 ], "reply_reviewers_avg": [ 1.75, 1.479019945774904 ], "reply_authors_avg": [ 4.0, 1.8708286933869707 ], "replies_avg": [ 31, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": 0.13245323570650439, "gs_citation": 28, "gs_cited_by_link": 
"https://scholar.google.com/scholar?cites=8293660199150583941&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=3VD4PNEt5q", "pdf": "https://openreview.net/pdf?id=3VD4PNEt5q", "email": "purdue.edu;dgist.ac.kr;cs.purdue.edu;rit.edu;;rit.edu;rit.edu;cs.purdue.edu", "author_num": 8, "aff_unique_index": "0;1;0;2;2;2;0", "aff_unique_norm": "Purdue University;Daegu Gyeongbuk Institute of Science and Technology;Rochester Institute of Technology", "aff_unique_dep": ";;", "aff_unique_url": "https://www.purdue.edu;https://www.dgist.ac.kr;https://www.rit.edu", "aff_unique_abbr": "Purdue;DGIST;RIT", "aff_campus_unique_index": "1", "aff_campus_unique": ";Daegu", "aff_country_unique_index": "0;1;0;0;0;0;0", "aff_country_unique": "United States;South Korea" }, { "title": "LEMON: Lossless model expansion", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19508", "id": "3Vw7DQqq7U", "author_site": "Yite Wang, Jiahao Su, Hanlin Lu, Cong Xie, Tianyi Liu, Jianbo Yuan, Haibin Lin, Ruoyu Sun, Hongxia Yang", "tldr": "", "abstract": "Scaling of deep neural networks, especially Transformers, is pivotal for their surging performance and has further led to the emergence of sophisticated reasoning capabilities in foundation models.\nSuch scaling generally requires training large models from scratch with random initialization, failing to leverage the knowledge acquired by their smaller counterparts, which are already resource-intensive to obtain.\nTo tackle this inefficiency, we present $\\textbf{L}$ossl$\\textbf{E}$ss $\\textbf{MO}$del Expansio$\\textbf{N}$ (LEMON), a recipe \nto initialize scaled models using the weights of their smaller but pre-trained counterparts. This is followed by model training with an optimized learning rate scheduler tailored explicitly for the scaled models, substantially reducing the training time compared to training from scratch.\nNotably, LEMON is versatile, ensuring compatibility with various network structures, including models like Vision Transformers and BERT.\nOur empirical results demonstrate that LEMON reduces computational costs by 56.7\\% for Vision Transformers and 33.2\\% for BERT when compared to training from scratch.", "keywords": "model growth;efficient deep learning;continual learning", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Yite Wang;Jiahao Su;Hanlin Lu;Cong Xie;Tianyi Liu;Jianbo Yuan;Haibin Lin;Ruoyu Sun;Hongxia Yang", "authorids": "~Yite_Wang1;~Jiahao_Su1;~Hanlin_Lu1;~Cong_Xie1;~Tianyi_Liu2;~Jianbo_Yuan1;~Haibin_Lin1;~Ruoyu_Sun1;~Hongxia_Yang2", "gender": "M;M;M;M;M;M;;;F", "homepage": "https://yitewang.github.io/;;;https://congxie1108.github.io/;https://sites.google.com/view/tianyiliu/home;;;https://ruoyus.github.io/;https://www4.comp.polyu.edu.hk/~hongxyang/", "dblp": "317/0407;;31/7172;;;134/6790;;30/9879-1;", "google_scholar": "wEGgxUIAAAAJ;z4AEqYkAAAAJ;https://scholar.google.at/citations?user=UbWokRoAAAAJ;pIPJUJMAAAAJ;;https://scholar.google.com/citations?hl=en;;PsfzbCMAAAAJ;iJlC5mMAAAAJ", "orcid": ";;;;;;;;", "linkedin": "yite-wang-261057140/;jiahaosu-umd/;;;;;;;", "or_profile": "~Yite_Wang1;~Jiahao_Su1;~Hanlin_Lu1;~Cong_Xie1;~Tianyi_Liu2;~Jianbo_Yuan1;~Haibin_Lin1;~Ruoyu_Sun1;~Hongxia_Yang2", "aff": "University of Illinois, Urbana Champaign;Amazon;ByteDance;ByteDance Inc.;Amazon;Bytedance;;The Chinese University of Hong Kong;ByteDance Inc.", "aff_domain": 
"illinois.edu;amazon.com;bytedance.com;bytedance.com;amazon.com;bytedance.com;;cuhk.edu.cn;bytedance.com", "position": "PhD student;Researcher;Researcher;Researcher;Researcher;Researcher;;Associate Professor;Principal Researcher", "bibtex": "@inproceedings{\nwang2024lemon,\ntitle={{LEMON}: Lossless model expansion},\nauthor={Yite Wang and Jiahao Su and Hanlin Lu and Cong Xie and Tianyi Liu and Jianbo Yuan and Haibin Lin and Ruoyu Sun and Hongxia Yang},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=3Vw7DQqq7U}\n}", "github": "", "project": "", "reviewers": "JSXE;u5r2;XnGd;pAyq", "pdf_size": 898077, "rating": "6;6;8;8", "confidence": "4;4;4;3", "soundness": "3;3;3;3", "contribution": "3;2;3;3", "presentation": "3;3;4;3", "wc_summary": "185;96;62;119", "wc_strengths": "136;55;77;132", "wc_weaknesses": "125;221;56;155", "wc_questions": "42;6;92;7", "wc_review": "488;378;287;413", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "568;927;652;579", "reply_reviewers": "0;0;0;0", "reply_authors": "1;2;1;1", "rating_avg": [ 7.0, 1.0 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 115.5, 44.95831402532795 ], "wc_strengths_avg": [ 100.0, 34.90701935141412 ], "wc_weaknesses_avg": [ 139.25, 59.29744935492588 ], "wc_questions_avg": [ 36.75, 35.03837182290296 ], "wc_review_avg": [ 391.5, 72.2443769438148 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 681.5, 145.36935715617648 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 9, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 19, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=16616827554209479908&as_sdt=20000005&sciodt=0,21&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=3Vw7DQqq7U", "pdf": "https://openreview.net/pdf?id=3Vw7DQqq7U", "email": "illinois.edu;amazon.com;bytedance.com;bytedance.com;amazon.com;bytedance.com;;cuhk.edu.cn;bytedance.com", "author_num": 9, "aff_unique_index": "0;1;2;2;1;2;3;2", "aff_unique_norm": "University of Illinois Urbana-Champaign;Amazon;ByteDance;Chinese University of Hong Kong", "aff_unique_dep": ";Amazon.com, Inc.;;", "aff_unique_url": "https://illinois.edu;https://www.amazon.com;https://www.bytedance.com;https://www.cuhk.edu.hk", "aff_unique_abbr": "UIUC;Amazon;ByteDance;CUHK", "aff_campus_unique_index": "0;2", "aff_campus_unique": "Urbana-Champaign;;Hong Kong SAR", "aff_country_unique_index": "0;0;1;1;0;1;1;1", "aff_country_unique": "United States;China" }, { "id": "3WB5hT27zf", "title": "Partial Optimal Transport for Open-set Semi-supervised Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "Semi-supervised learning (SSL) is a machine learning paradigm that leverages both labeled and unlabeled data to improve the performance of learning tasks. However, SSL methods make an assumption that the label spaces of labeled and unlabeled data are identical, which may not hold in open-world applications, where the unlabeled data may contain novel categories that were not present in the labeled training data, essentially outliers. This paper tackles open-set semi-supervised learning (OSSL), where detecting these outliers, or out-of-distribution (OOD) data, is critical. 
In particular, we model the OOD detection problem in OSSL as a partial optimal transport (POT) problem. With the theory of POT, we devise a mass score function (MSF) to measure the likelihood of a sample being an outlier during training. Then, a novel OOD loss is proposed, which allows to adapt the off-the-shelf SSL methods with POT into OSSL settings in an end-to-end training manner.\nFurthermore, we conduct extensive experiments on multiple datasets and OSSL configurations, demonstrating that our method consistently achieves superior or competitive results compared to existing approaches.", "keywords": "Open-set problem;Optimal transport;Semi-supervised learning;Out-of-distribution detection", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Yilong Ren;Chuanwen Feng;Xike Xie;S Kevin Zhou", "authorids": "~Yilong_Ren1;~Chuanwen_Feng1;~Xike_Xie1;~S_Kevin_Zhou1", "gender": "M;M;M;M", "homepage": "https://github.com/ryl0427;https://optstats.github.io;http://staff.ustc.edu.cn/~xkxie;", "dblp": ";;64/1308;57/98", "google_scholar": ";;;8eNm2GMAAAAJ", "orcid": ";;;0000-0002-6881-4444", "linkedin": ";;;s-kevin-zhou-231a094b/", "or_profile": "~Yilong_Ren1;~Chuanwen_Feng1;~Xike_Xie1;~S_Kevin_Zhou1", "aff": "University of Science and Technology of China;;University of Science and Technology of China;University of Science and Technology of China", "aff_domain": "ustc.edu.cn;;ustc.edu.cn;ustc.edu.cn", "position": "MS student;;Research Professor;Full Professor", "bibtex": "@misc{\nren2024partial,\ntitle={Partial Optimal Transport for Open-set Semi-supervised Learning},\nauthor={Yilong Ren and Chuanwen Feng and Xike Xie and S Kevin Zhou},\nyear={2024},\nurl={https://openreview.net/forum?id=3WB5hT27zf}\n}", "github": "", "project": "", "reviewers": "2Syu;RKEQ;uAiP", "site": "https://openreview.net/forum?id=3WB5hT27zf", "pdf_size": 369667, "rating": "5;5;6", "confidence": "4;4;3", "soundness": "3;3;4", "contribution": "2;2;4", "presentation": "3;3;2", "wc_summary": "86;52;46", "wc_strengths": "56;40;30", "wc_weaknesses": "381;268;200", "wc_questions": "90;6;99", "wc_review": "613;366;375", "wc_reply_reviewers": "157;10;13", "wc_reply_authors": "912;807;286", "reply_reviewers": "1;1;1", "reply_authors": "3;2;1", "rating_avg": [ 5.333333333333333, 0.4714045207910317 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 3.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 0.9428090415820634 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 61.333333333333336, 17.613126418163876 ], "wc_strengths_avg": [ 42.0, 10.708252269472673 ], "wc_weaknesses_avg": [ 283.0, 74.65029582437478 ], "wc_questions_avg": [ 65.0, 41.88078318274385 ], "wc_review_avg": [ 451.3333333333333, 114.37462811111368 ], "wc_reply_reviewers_avg": [ 60.0, 68.60029154456998 ], "wc_reply_authors_avg": [ 668.3333333333334, 273.72776419079025 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 2.0, 0.816496580927726 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.9999999999999997, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:0HmSht6QT7kJ:scholar.google.com/&scioq=Partial+Optimal+Transport+for+Open-set+Semi-supervised+Learning&hl=en&as_sdt=0,23", "gs_version_total": 0, "aff_unique_index": "0;0;0", "aff_unique_norm": "University of Science and Technology of China", 
"aff_unique_dep": "", "aff_unique_url": "http://www.ustc.edu.cn", "aff_unique_abbr": "USTC", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "China" }, { "id": "3WDFykPhM4", "title": "Generalized Supervised Contrastive Learning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "With the recent promising results of contrastive learning in the self-supervised learning paradigm, supervised contrastive learning has successfully extended these contrastive approaches to supervised contexts, outperforming cross-entropy on various datasets. However, supervised contrastive learning inherently employs label information in a binary form--either positive or negative--using a one-hot target vector. This structure struggles to adapt to methods that exploit label information as a probability distribution, such as CutMix and knowledge distillation. In this paper, we introduce a generalized supervised contrastive loss, which measures cross-entropy between label similarity and latent similarity. This concept enhances the capabilities of supervised contrastive loss by fully utilizing the label distribution and enabling the adaptation of various existing techniques for training modern neural networks. Leveraging this generalized supervised contrastive loss, we construct a tailored framework: the Generalized Supervised Contrastive Learning (GenSCL). Compared to existing contrastive learning frameworks, GenSCL incorporates additional enhancements, including advanced image-based regularization techniques and an arbitrary teacher classifier. When applied to ResNet50 with the Momentum Contrast technique, GenSCL achieves a top-1 accuracy of 77.3% on ImageNet, a 4.1% relative improvement over traditional supervised contrastive learning. Moreover, our method establishes new state-of-the-art accuracies of 98.2% and 87.0% on CIFAR10 and CIFAR100 respectively when applied to ResNet50, marking the highest reported figures for this architecture.", "keywords": "Contrastive Learning;Knowledge Distillation;Representation Learning;Image-Based Regularization;Label Smoothing", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Jaewon Kim;Hyeok Jong Lee;Jooyoung Chang;Sang Min Park", "authorids": "~Jaewon_Kim2;~Hyeok_Jong_Lee1;~Jooyoung_Chang3;~Sang_Min_Park2", "gender": "M;;M;M", "homepage": "https://kiimmm.github.io/;https://hyeok-jong.github.io/;http://biomed.snu.ac.kr/main/tmpl/sub_main.php?m_cd=8&m_id=0103&sp=2&wr_id=73;https://scholar.google.com/citations?user=_Y2v3BMAAAAJ", "dblp": "00/4936;;67/4835;258/4663", "google_scholar": ";;Km1BklMAAAAJ;_Y2v3BMAAAAJ", "orcid": ";;;0000-0002-8586-0645", "linkedin": "jaewon-kim-16ba651b6/;;;jooyoungchang", "or_profile": "~Jaewon_Kim2;~Hyeok_Jong_Lee1;~Sang_Min_Park2;~Jooyoung_Chang2", "aff": "Seoul National University Graduate School;Seoul National University Graduate School;;XAIMED Co. 
Ltd.", "aff_domain": "snu.ac.kr;snu.ac.kr;;ixaimed.com", "position": "PhD student;MS student;;Researcher", "bibtex": "@misc{\nkim2024generalized,\ntitle={Generalized Supervised Contrastive Learning},\nauthor={Jaewon Kim and Hyeok Jong Lee and Jooyoung Chang and Sang Min Park},\nyear={2024},\nurl={https://openreview.net/forum?id=3WDFykPhM4}\n}", "github": "", "project": "", "reviewers": "", "site": "https://openreview.net/forum?id=3WDFykPhM4", "pdf_size": 0, "rating": "", "confidence": "", "soundness": "", "contribution": "", "presentation": "", "wc_summary": "", "wc_strengths": "", "wc_weaknesses": "", "wc_questions": "", "wc_review": "", "wc_reply_reviewers": "", "wc_reply_authors": "", "reply_reviewers": "", "reply_authors": "", "rating_avg": [ 0, 0 ], "confidence_avg": [ 0, 0 ], "soundness_avg": [ 0, 0 ], "contribution_avg": [ 0, 0 ], "presentation_avg": [ 0, 0 ], "wc_summary_avg": [ 0, 0 ], "wc_strengths_avg": [ 0, 0 ], "wc_weaknesses_avg": [ 0, 0 ], "wc_questions_avg": [ 0, 0 ], "wc_review_avg": [ 0, 0 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 0, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0, "gs_citation": 5, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=1366932886400978211&as_sdt=5,47&sciodt=0,47&hl=en", "gs_version_total": 3, "aff_unique_index": "0;0;1", "aff_unique_norm": "Seoul National University;XAIMED Co. Ltd.", "aff_unique_dep": "Graduate School;", "aff_unique_url": "https://www.snu.ac.kr;", "aff_unique_abbr": "SNU;", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "South Korea;" }, { "title": "Continual Learning in the Presence of Spurious Correlations: Analyses and a Simple Baseline", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19507", "id": "3Y7r6xueJJ", "author_site": "Donggyu Lee, Sangwon Jung, Taesup Moon", "tldr": "", "abstract": "Most continual learning (CL) algorithms have focused on tackling the stability-plasticity dilemma, that is, the challenge of preventing the forgetting of past tasks while learning new ones. However, we argue that they have overlooked the impact of knowledge transfer when the training dataset of a certain task is biased \u2014 namely, when the dataset contains some spurious correlations that can overly influence the prediction rule of a model. In that case, how would the dataset bias of a certain task affect the prediction rules of a CL model for future or past tasks? In this work, we carefully design systematic experiments using three benchmark datasets to answer the question from our empirical findings. Specifically, we first show through two-task CL experiments that standard CL methods, which are oblivious of the dataset bias, can transfer bias from one task to another, both forward and backward. Moreover, we find out this transfer is exacerbated depending on whether the CL methods focus on stability or plasticity. We then present that the bias is also transferred and even accumulates in longer task sequences. 
Finally, we offer a standardized experimental setup and a simple, yet strong plug-in baseline method, dubbed as group-class Balanced Greedy Sampling (BGS), which are utilized for the development of more advanced bias-aware CL methods.", "keywords": "continual learning;bias;spurious correlation", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "", "author": "Donggyu Lee;Sangwon Jung;Taesup Moon", "authorids": "~Donggyu_Lee1;~Sangwon_Jung1;~Taesup_Moon1", "gender": "M;M;", "homepage": "https://sites.google.com/view/dqlee/%ED%99%88;https://successful-humor-4db.notion.site/Sangwon-Jung-70109a49767a470092a6ee0d02c78313;https://mindlab-snu.github.io/people/pi/", "dblp": "142/3306;236/3698;05/4084", "google_scholar": "7syHfVAAAAAJ;WdC_a5IAAAAJ;lQlioBoAAAAJ", "orcid": ";;0000-0002-9257-6503", "linkedin": ";;", "or_profile": "~Donggyu_Lee1;~Sangwon_Jung1;~Taesup_Moon1", "aff": "Sungkyunkwan University;Seoul National University;Seoul National University", "aff_domain": "skku.edu;snu.ac.kr;snu.ac.kr", "position": "PhD student;PhD student;Associate Professor", "bibtex": "@inproceedings{\nlee2024continual,\ntitle={Continual Learning in the Presence of Spurious Correlations: Analyses and a Simple Baseline},\nauthor={Donggyu Lee and Sangwon Jung and Taesup Moon},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=3Y7r6xueJJ}\n}", "github": "", "project": "", "reviewers": "C1FY;A8St;UUYC;6w81", "pdf_size": 3530484, "rating": "5;6;6;8", "confidence": "3;3;4;4", "soundness": "1;3;3;3", "contribution": "2;3;3;3", "presentation": "3;3;3;3", "wc_summary": "90;62;95;106", "wc_strengths": "1;73;154;88", "wc_weaknesses": "183;190;229;189", "wc_questions": "5;77;48;97", "wc_review": "279;402;526;480", "wc_reply_reviewers": "0;20;113;26", "wc_reply_authors": "574;1019;756;1056", "reply_reviewers": "0;1;1;1", "reply_authors": "2;4;2;3", "rating_avg": [ 6.25, 1.0897247358851685 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.5, 0.8660254037844386 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 88.25, 16.223054582907622 ], "wc_strengths_avg": [ 79.0, 54.37370688117557 ], "wc_weaknesses_avg": [ 197.75, 18.239723133863627 ], "wc_questions_avg": [ 56.75, 34.585943676586304 ], "wc_review_avg": [ 421.75, 93.57984558653642 ], "wc_reply_reviewers_avg": [ 39.75, 43.37265843823733 ], "wc_reply_authors_avg": [ 851.25, 197.48591721943112 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 2.75, 0.82915619758885 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.6882472016116854, "gs_citation": 5, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=3613202752424766689&as_sdt=80000005&sciodt=0,23&hl=en", "gs_version_total": 0, "openreview": "https://openreview.net/forum?id=3Y7r6xueJJ", "pdf": "https://openreview.net/pdf?id=3Y7r6xueJJ", "email": "skku.edu;snu.ac.kr;snu.ac.kr", "author_num": 3, "aff_unique_index": "0;1;1", "aff_unique_norm": "Sungkyunkwan University;Seoul National University", "aff_unique_dep": ";", "aff_unique_url": "https://www.skku.edu;https://www.snu.ac.kr", "aff_unique_abbr": "SKKU;SNU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "South Korea" }, { "title": "PoSE: Efficient Context Window Extension of LLMs via Positional Skip-wise Training", "status": "Poster", "track": 
"main", "site": "https://iclr.cc/virtual/2024/poster/19506", "id": "3Z1gxuAQrA", "author_site": "Dawei Zhu, Nan Yang, Liang Wang, Yifan Song, Wenhao Wu, Furu Wei, Sujian Li", "tldr": "", "abstract": "Large Language Models (LLMs) are trained with a pre-defined context length, restricting their use in scenarios requiring long inputs. Previous efforts for adapting LLMs to a longer length usually requires fine-tuning with this target length (Full-length fine-tuning), suffering intensive training cost. To decouple train length from target length for efficient context window extension, we propose Positional Skip-wisE (PoSE) training that smartly simulates long inputs using a fixed context window. This is achieved by first dividing the original context window into several chunks, then designing distinct skipping bias terms to manipulate the position indices of each chunk. These bias terms and the lengths of each chunk are altered for every training example, allowing the model to adapt to all positions within target length. Experimental results show that PoSE greatly reduces memory and time overhead compared with Full-length fine-tuning, with minimal impact on performance. Leveraging this advantage, we have successfully extended the LLaMA model to 128k tokens using a 2k training context window. Furthermore, we empirically confirm that PoSE is compatible with all RoPE-based LLMs and position interpolation strategies. Notably, our method can potentially support infinite length, limited only by memory usage in inference. With ongoing progress for efficient inference, we believe PoSE can further scale the context window beyond 128k.", "keywords": "context window extension;efficiency;positional skip-wise training", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Dawei Zhu;Nan Yang;Liang Wang;Yifan Song;Wenhao Wu;Furu Wei;Sujian Li", "authorids": "~Dawei_Zhu2;~Nan_Yang5;~Liang_Wang2;~Yifan_Song2;~Wenhao_Wu7;~Furu_Wei1;~Sujian_Li1", "gender": ";;M;M;M;M;F", "homepage": ";;https://github.com/intfloat;https://yifan-song793.github.io/;;https://www.microsoft.com/en-us/research/people/fuwei/;https://pku-tangent.github.io/", "dblp": ";https://dblp.uni-trier.de/pers/hd/y/Yang_0002:Nan;56/4499;;;72/5870;05/4288", "google_scholar": "oD2HPaYAAAAJ;InAQ3o0AAAAJ;NfJbKJ4AAAAJ;;LZFvCrwAAAAJ;G-V1VpwAAAAJ;https://scholar.google.com.tw/citations?user=RvBDhSwAAAAJ", "orcid": ";;0000-0003-4664-7136;;;;", "linkedin": ";;;;;;", "or_profile": "~Dawei_Zhu2;~Nan_Yang5;~Liang_Wang2;~Yifan_Song2;~Wenhao_Wu7;~Furu_Wei1;~Sujian_Li1", "aff": "Peking University;Microsoft Research Asia;Microsoft Research;Peking University;Peking University;Microsoft Research;Peking University", "aff_domain": "pku.edu.cn;microsoft.com;microsoft.com;pku.edu.cn;pku.edu.cn;microsoft.com;pku.edu.cn", "position": "PhD student;Researcher;Researcher;PhD student;PhD student;Distinguished Scientist;Associate Professor", "bibtex": "@inproceedings{\nzhu2024pose,\ntitle={Po{SE}: Efficient Context Window Extension of {LLM}s via Positional Skip-wise Training},\nauthor={Dawei Zhu and Nan Yang and Liang Wang and Yifan Song and Wenhao Wu and Furu Wei and Sujian Li},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=3Z1gxuAQrA}\n}", "github": "", "project": "", "reviewers": "NXZX;VfnN;T2GT;UVnU", "pdf_size": 496870, "rating": "6;6;6;6", "confidence": "3;4;4;5", "soundness": "2;3;3;4", 
"contribution": "2;3;3;3", "presentation": "2;3;3;3", "wc_summary": "35;174;71;45", "wc_strengths": "27;91;59;84", "wc_weaknesses": "67;131;121;113", "wc_questions": "5;178;18;4", "wc_review": "134;574;269;246", "wc_reply_reviewers": "29;18;0;15", "wc_reply_authors": "320;938;955;416", "reply_reviewers": "1;1;0;1", "reply_authors": "1;2;2;1", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 81.25, 55.137895317104736 ], "wc_strengths_avg": [ 65.25, 25.083610186733488 ], "wc_weaknesses_avg": [ 108.0, 24.515301344262525 ], "wc_questions_avg": [ 51.25, 73.38724344189527 ], "wc_review_avg": [ 305.75, 163.0772439673911 ], "wc_reply_reviewers_avg": [ 15.5, 10.35615758860399 ], "wc_reply_authors_avg": [ 657.25, 291.2965628015545 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 75, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=4361802516457215180&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=3Z1gxuAQrA", "pdf": "https://openreview.net/pdf?id=3Z1gxuAQrA", "email": "pku.edu.cn;microsoft.com;microsoft.com;pku.edu.cn;pku.edu.cn;microsoft.com;pku.edu.cn", "author_num": 7, "aff_unique_index": "0;1;1;0;0;1;0", "aff_unique_norm": "Peking University;Microsoft", "aff_unique_dep": ";Research", "aff_unique_url": "http://www.pku.edu.cn;https://www.microsoft.com/en-us/research/group/asia", "aff_unique_abbr": "Peking U;MSR Asia", "aff_campus_unique_index": "1", "aff_campus_unique": ";Asia", "aff_country_unique_index": "0;0;1;0;0;1;0", "aff_country_unique": "China;United States" }, { "id": "3ZDEwhAlCO", "title": "ILPO-NET: convolution network for the recognition of arbitrary volumetric patterns", "track": "main", "status": "Reject", "tldr": "", "abstract": "Modern spatial data analysis is built on the effective recognition of spatial patterns and learning their hierarchy. Applications to real-world volumetric data require techniques that ensure invariance not only to shifts but also to pattern rotations. While traditional methods can readily achieve translational invariance, rotational invariance possesses multiple challenges and remains an active area of research.\nHere, we present ILPO-Net (Invariant to Local Patterns Orientation Network), a novel approach to handling arbitrarily shaped patterns with the convolutional operation inherently invariant to local spatial pattern orientations. Our architecture seamlessly integrates the new convolution operator and, when benchmarked on diverse volumetric datasets such as MedMNIST and CATH, demonstrates superior performance over the baselines with significantly reduced parameter counts\u2014up to 1000 times fewer in the case of MedMNIST. 
Beyond these demonstrations, ILPO-Net's rotational invariance paves the way for other applications across multiple disciplines.", "keywords": "Volumetric data;3DCNN;pattern recognition;rotational invariance;SO(3) invariance;SE(3) invariance", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/89e246cac8b5cbcf4173f5ec0bc45a7adb4016e6.zip", "author": "Dmitrii Zhemchuzhnikov;Sergei Grudinin", "authorids": "~Dmitrii_Zhemchuzhnikov1;~Sergei_Grudinin1", "gender": "M;M", "homepage": ";https://grulab.imag.fr/", "dblp": ";", "google_scholar": "hf04h7IAAAAJ;8-TQzFIAAAAJ", "orcid": ";0000-0002-1903-7220", "linkedin": ";", "or_profile": "~Dmitrii_Zhemchuzhnikov1;~Sergei_Grudinin1", "aff": "Universit\u00e9 Grenoble Alpes;CNRS", "aff_domain": "univ-grenoble-alpes.fr;cnrs.fr", "position": "PhD student;Principal Researcher", "bibtex": "@misc{\nzhemchuzhnikov2024ilponet,\ntitle={{ILPO}-{NET}: convolution network for the recognition of arbitrary volumetric patterns},\nauthor={Dmitrii Zhemchuzhnikov and Sergei Grudinin},\nyear={2024},\nurl={https://openreview.net/forum?id=3ZDEwhAlCO}\n}", "github": "", "project": "", "reviewers": "ckuL;KeGD;PtnA;sNRn", "site": "https://openreview.net/forum?id=3ZDEwhAlCO", "pdf_size": 8867013, "rating": "3;5;5;5", "confidence": "3;3;2;4", "soundness": "3;3;2;2", "contribution": "1;3;2;3", "presentation": "2;3;2;2", "wc_summary": "115;49;61;51", "wc_strengths": "47;75;51;39", "wc_weaknesses": "359;53;60;275", "wc_questions": "140;96;4;65", "wc_review": "661;273;176;430", "wc_reply_reviewers": "0;10;0;0", "wc_reply_authors": "1158;478;133;957", "reply_reviewers": "0;1;0;0", "reply_authors": "3;2;1;2", "rating_avg": [ 4.5, 0.8660254037844386 ], "confidence_avg": [ 3.0, 0.7071067811865476 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.25, 0.82915619758885 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 69.0, 26.94438717061496 ], "wc_strengths_avg": [ 53.0, 13.416407864998739 ], "wc_weaknesses_avg": [ 186.75, 133.61582054532315 ], "wc_questions_avg": [ 76.25, 49.499368682842814 ], "wc_review_avg": [ 385.0, 183.3207571444107 ], "wc_reply_reviewers_avg": [ 2.5, 4.330127018922194 ], "wc_reply_authors_avg": [ 681.5, 401.62700357421187 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 2.0, 0.7071067811865476 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:JLQ4nKfx_2QJ:scholar.google.com/&scioq=ILPO-NET:+convolution+network+for+the+recognition+of+arbitrary+volumetric+patterns&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1", "aff_unique_norm": "Universit\u00e9 Grenoble Alpes;Centre National de la Recherche Scientifique", "aff_unique_dep": ";", "aff_unique_url": "https://www.univ-grenoble-alpes.fr;https://www.cnrs.fr", "aff_unique_abbr": "UGA;CNRS", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "France" }, { "id": "3ZWdgOvmAA", "title": "LumiNet: The Bright Side of Perceptual Knowledge Distillation", "track": "main", "status": "Reject", "tldr": "", "abstract": "In knowledge distillation research, feature-based methods have dominated due to their ability to effectively tap into extensive teacher models. In contrast, logit-based approaches are considered to be less adept at extracting hidden 'dark knowledge' from teachers. 
To bridge this gap, we present LumiNet, a novel knowledge-transfer algorithm designed to enhance logit-based distillation. We introduce a perception matrix that aims to recalibrate logits through adjustments based on the model's representation capability. By meticulously analyzing intra-class dynamics, LumiNet reconstructs more granular inter-class relationships, enabling the student model to learn a richer breadth of knowledge. Both teacher and student models are mapped onto this refined matrix, with the student's goal being to minimize representational discrepancies. Rigorous testing on benchmark datasets (CIFAR-100, ImageNet, and MSCOCO) attests to LumiNet's efficacy, revealing its competitive edge over leading feature-based methods. Moreover, in exploring the realm of transfer learning, we assess how effectively the student model, trained using our method, adapts to downstream tasks. Notably, when applied to Tiny ImageNet, the transferred features exhibit remarkable performance, further underscoring LumiNet's versatility and robustness in diverse settings. With LumiNet, we hope to steer the research discourse towards a renewed interest in the latent capabilities of logit-based knowledge distillation.", "keywords": "Knowledge Distillation;Model Compression;Transfer Learning;Computer Vision", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "/attachment/cd7faf2661b6984e380d9fe3d317671e7cd02ec6.pdf", "author": "Md. Ismail Hossain;M M Lutfe Elahi;Sameera Ramasinghe;Ali Cheraghian;Fuad Rahman;Nabeel Mohammed;Shafin Rahman", "authorids": "~Md._Ismail_Hossain1;~M_M_Lutfe_Elahi1;~Sameera_Ramasinghe1;~Ali_Cheraghian2;~Fuad_Rahman1;~Nabeel_Mohammed1;~Shafin_Rahman1", "gender": "M;;M;M;M;M;M", "homepage": "https://sites.google.com/view/ismailhossain31415;;;https://alichr.github.io/;;http://ece.northsouth.edu/people/dr-nabeel-mohammed/;https://sites.google.com/site/rshafin", "dblp": "28/10457;;181/4514;;11/478;127/2798;95/10398", "google_scholar": "8f7b5YIAAAAJ;;https://scholar.google.com.au/citations?user=-j0m9aMAAAAJ;QT0EXIkAAAAJ;D0riK2QAAAAJ;https://scholar.google.com.au/citations?hl=en;Pe8C-SUAAAAJ", "orcid": ";;;;0000-0002-8670-7124;0000-0002-7661-3570;0000-0001-7169-0318", "linkedin": "md-ismail-hossain-771423167/;;;ali-cheraghian-006aa26b/;https://www.linkedin.com/pub/fuad-rahman/1/30/6ba;;rshafin/", "or_profile": "~Md._Ismail_Hossain1;~M_M_Lutfe_Elahi1;~Sameera_Ramasinghe1;~Ali_Cheraghian2;~Fuad_Rahman1;~Nabeel_Mohammed1;~Shafin_Rahman1", "aff": "North South University;;Amazon;CSIRO;University of Arizona;North South University;North South University", "aff_domain": "northsouth.edu;;amazon.com;data61.csiro.au;arizona.edu;northsouth.edu;northsouth.edu", "position": "Researcher;;Researcher;Researcher;Adjunct Professor;Associate Professor;Assistant Professor", "bibtex": "@misc{\nhossain2024luminet,\ntitle={LumiNet: The Bright Side of Perceptual Knowledge Distillation},\nauthor={Md. 
Ismail Hossain and M M Lutfe Elahi and Sameera Ramasinghe and Ali Cheraghian and Fuad Rahman and Nabeel Mohammed and Shafin Rahman},\nyear={2024},\nurl={https://openreview.net/forum?id=3ZWdgOvmAA}\n}", "github": "", "project": "", "reviewers": "8pKb;tkRa;7mGH;3qnL", "site": "https://openreview.net/forum?id=3ZWdgOvmAA", "pdf_size": 2931974, "rating": "5;5;5;5", "confidence": "3;5;3;5", "soundness": "2;2;2;2", "contribution": "2;2;2;2", "presentation": "3;2;2;2", "wc_summary": "60;53;27;52", "wc_strengths": "21;21;39;32", "wc_weaknesses": "50;87;185;75", "wc_questions": "16;11;243;2", "wc_review": "147;172;494;161", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "627;597;1131;624", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;2;1", "rating_avg": [ 5.0, 0.0 ], "confidence_avg": [ 4.0, 1.0 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 48.0, 12.509996003196804 ], "wc_strengths_avg": [ 28.25, 7.660776723022281 ], "wc_weaknesses_avg": [ 99.25, 51.275603360662664 ], "wc_questions_avg": [ 68.0, 101.16076314461057 ], "wc_review_avg": [ 243.5, 144.89737747799302 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 744.75, 223.30738344264392 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11737768826256174744&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 2, "aff_unique_index": "0;1;2;3;0;0", "aff_unique_norm": "North South University;Amazon;Commonwealth Scientific and Industrial Research Organisation;University of Arizona", "aff_unique_dep": ";Amazon.com, Inc.;;", "aff_unique_url": "https://www.northsouth.edu/;https://www.amazon.com;https://www.csiro.au;https://www.arizona.edu", "aff_unique_abbr": "NSU;Amazon;CSIRO;UA", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;2;1;0;0", "aff_country_unique": "Bangladesh;United States;Australia" }, { "id": "3Zm6wR5Mvc", "title": "LangNav: Language as a Perceptual Representation for Navigation", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "We explore the use of language as a perceptual representation for vision-and-language navigation. Our approach uses off-the-shelf vision systems (for image captioning and object detection) to convert an agent's egocentric panoramic view at each time step into natural language descriptions. We then finetune a pretrained language model to select an action, based on the current view and the trajectory history, that would best fulfill the navigation instructions. In contrast to the standard setup which adapts a pretrained language model to work directly with continuous visual features from pretrained vision models, our approach instead uses (discrete) language as the perceptual representation. We explore two use cases of our language-based navigation ours approach on the R2R vision-and-language navigation benchmark: generating synthetic trajectories from a prompted large language model (GPT-4) with which to finetune a smaller language model; and sim-to-real transfer where we transfer a policy learned on a simulated environment (ALFRED) to a real-world environment (R2R). 
Our approach is found to improve upon strong baselines that rely on visual features in settings where only a few gold trajectories (10-100) are available, demonstrating the potential of using language as a perceptual representation for learning navigation agents.", "keywords": "Language Models;Vision-and-Language Navigation;Learn from Synthetic Data;Sim-to-Real", "primary_area": "applications to robotics, autonomy, planning", "supplementary_material": "/attachment/e323f53fccd0c1df76c4e891a3b9910cdd58dc9d.pdf", "author": "Bowen Pan;Rameswar Panda;SouYoung Jin;Rogerio Feris;Aude Oliva;Phillip Isola;Yoon Kim", "authorids": "~Bowen_Pan2;~Rameswar_Panda1;~SouYoung_Jin2;~Rogerio_Feris1;~Aude_Oliva1;~Phillip_Isola1;~Yoon_Kim1", "gender": "M;M;F;M;;M;", "homepage": "http://people.csail.mit.edu/bpan/;https://rpand002.github.io/;http://souyoungjin.com;http://rogerioferis.com;;http://web.mit.edu/phillipi/;https://people.csail.mit.edu/yoonkim/", "dblp": "188/1139;126/0986;225/4723;;;36/9988;", "google_scholar": "x9Tpbq8AAAAJ;_ySuu6gAAAAJ;_B-_CzYAAAAJ;xt3XLjcAAAAJ;;ROILf3EAAAAJ;n_ts4eYAAAAJ", "orcid": ";;;;;0000-0002-1411-6704;", "linkedin": ";;;;;phillip-isola-a9955b20/;", "or_profile": "~Bowen_Pan2;~Rameswar_Panda1;~SouYoung_Jin2;~Rogerio_Feris1;~Aude_Oliva1;~Phillip_Isola1;~Yoon_Kim1", "aff": "Massachusetts Institute of Technology;MIT-IBM Watson AI Lab;Dartmouth College;International Business Machines;;Massachusetts Institute of Technology;Massachusetts Institute of Technology", "aff_domain": "mit.edu;ibm.com;dartmouth.edu;ibm.com;;mit.edu;mit.edu", "position": "PhD student;Research Scientist;Assistant Professor;Research Manager;;Associate Professor;Assistant Professor", "bibtex": "@misc{\npan2024langnav,\ntitle={LangNav: Language as a Perceptual Representation for Navigation},\nauthor={Bowen Pan and Rameswar Panda and SouYoung Jin and Rogerio Feris and Aude Oliva and Phillip Isola and Yoon Kim},\nyear={2024},\nurl={https://openreview.net/forum?id=3Zm6wR5Mvc}\n}", "github": "", "project": "", "reviewers": "z42V;PNyi;Sthf;MJeR;2DEF", "site": "https://openreview.net/forum?id=3Zm6wR5Mvc", "pdf_size": 2144034, "rating": "3;3;5;6;8", "confidence": "4;4;3;4;5", "soundness": "2;2;2;4;3", "contribution": "2;1;2;2;2", "presentation": "2;3;2;4;3", "wc_summary": "93;150;115;43;107", "wc_strengths": "78;31;71;65;185", "wc_weaknesses": "178;722;215;76;709", "wc_questions": "131;122;228;70;594", "wc_review": "480;1025;629;254;1595", "wc_reply_reviewers": "117;324;103;370;145", "wc_reply_authors": "1089;2154;1723;693;2811", "reply_reviewers": "1;1;1;1;1", "reply_authors": "3;5;4;2;6", "rating_avg": [ 5.0, 1.8973665961010275 ], "confidence_avg": [ 4.0, 0.6324555320336759 ], "soundness_avg": [ 2.6, 0.8 ], "contribution_avg": [ 1.8, 0.4000000000000001 ], "presentation_avg": [ 2.8, 0.7483314773547882 ], "wc_summary_avg": [ 101.6, 34.811492355255325 ], "wc_strengths_avg": [ 86.0, 52.069184744914146 ], "wc_weaknesses_avg": [ 380.0, 277.7228834647948 ], "wc_questions_avg": [ 229.0, 189.50461735799473 ], "wc_review_avg": [ 796.6, 471.6670859833236 ], "wc_reply_reviewers_avg": [ 211.8, 112.16309553502882 ], "wc_reply_authors_avg": [ 1694.0, 752.0845697127418 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 4.0, 1.4142135623730951 ], "replies_avg": [ 31, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": 0.5, "gs_citation": 19, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=15739144564300280860&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 6, "aff_unique_index": "0;0;1;2;0;0", 
"aff_unique_norm": "Massachusetts Institute of Technology;Dartmouth College;International Business Machines Corporation", "aff_unique_dep": ";;", "aff_unique_url": "https://web.mit.edu;https://www.dartmouth.edu;https://www.ibm.com", "aff_unique_abbr": "MIT;Dartmouth;IBM", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "United States" }, { "title": "Evaluating Language Model Agency Through Negotiations", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19505", "id": "3ZqKxMHcAg", "author_site": "Tim R. Davidson, Veniamin Veselovsky, Michal Kosinski, Robert West", "tldr": "", "abstract": "We introduce an approach to evaluate language model (LM) agency using negotiation games. This approach better reflects real-world use cases and addresses some of the shortcomings of alternative LM benchmarks. Negotiation games enable us to study multi-turn, and cross-model interactions, modulate complexity, and side-step accidental evaluation data leakage. We use our approach to test six widely used and publicly accessible LMs, evaluating performance and alignment in both self-play and cross-play settings. Noteworthy findings include: (i) only closed-source models tested here were able to complete these tasks; (ii) cooperative bargaining games proved to be most challenging to the models; and (iii) even the most powerful models sometimes \"lose\" to weaker opponents.", "keywords": "language model evaluation;dynamic evaluation;alignment;cooperative AI;agency;evolving benchmarks;multi-agent interactions", "primary_area": "datasets and benchmarks", "supplementary_material": "", "author": "Tim Ruben Davidson;Veniamin Veselovsky;Michal Kosinski;Robert West", "authorids": "~Tim_Ruben_Davidson1;~Veniamin_Veselovsky1;~Michal_Kosinski1;~Robert_West1", "gender": ";M;Non-Binary;M", "homepage": ";https://vminvsky.com/;https://www.michalkosinski.com;https://dlab.epfl.ch/people/west/", "dblp": ";;03/10818;20/7441-1", "google_scholar": ";hFPL6gwAAAAJ;01-XV0YAAAAJ;ZiFn598AAAAJ", "orcid": ";;0000-0003-2936-4775;", "linkedin": ";;kosinskimichal/;", "or_profile": "~Tim_Ruben_Davidson1;~Veniamin_Veselovsky1;~Michal_Kosinski1;~Robert_West1", "aff": ";Department of Computer Science, Princeton University;Stanford University;EPFL - EPF Lausanne", "aff_domain": ";cs.princeton.edu;stanford.edu;epfl.ch", "position": ";PhD student;Associate Professor;Assistant Professor", "bibtex": "@inproceedings{\ndavidson2024evaluating,\ntitle={Evaluating Language Model Agency Through Negotiations},\nauthor={Tim Ruben Davidson and Veniamin Veselovsky and Michal Kosinski and Robert West},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=3ZqKxMHcAg}\n}", "github": "", "project": "", "reviewers": "pM8H;ZZpj;yVDW", "pdf_size": 1040448, "rating": "3;5;8", "confidence": "2;4;4", "soundness": "2;2;3", "contribution": "2;2;3", "presentation": "3;2;4", "wc_summary": "97;56;75", "wc_strengths": "32;13;63", "wc_weaknesses": "429;10;75", "wc_questions": "143;215;45", "wc_review": "701;294;258", "wc_reply_reviewers": "0;0;11", "wc_reply_authors": "2140;1454;504", "reply_reviewers": "0;0;1", "reply_authors": "3;2;1", "rating_avg": [ 5.333333333333333, 2.0548046676563256 ], "confidence_avg": [ 3.3333333333333335, 0.9428090415820634 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 
3.0, 0.816496580927726 ], "wc_summary_avg": [ 76.0, 16.753109164172084 ], "wc_strengths_avg": [ 36.0, 20.607442021431645 ], "wc_weaknesses_avg": [ 171.33333333333334, 184.12012986694916 ], "wc_questions_avg": [ 134.33333333333334, 69.67224858020748 ], "wc_review_avg": [ 417.6666666666667, 200.8852629957929 ], "wc_reply_reviewers_avg": [ 3.6666666666666665, 5.185449728701348 ], "wc_reply_authors_avg": [ 1366.0, 670.78660292724 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 2.0, 0.816496580927726 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.8029550685469663, "gs_citation": 23, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11870300425326261130&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 7, "openreview": "https://openreview.net/forum?id=3ZqKxMHcAg", "pdf": "https://openreview.net/pdf?id=3ZqKxMHcAg", "email": ";cs.princeton.edu;stanford.edu;epfl.ch", "author_num": 4, "aff_unique_index": "0;1;2", "aff_unique_norm": "Princeton University;Stanford University;EPFL", "aff_unique_dep": "Department of Computer Science;;", "aff_unique_url": "https://www.princeton.edu;https://www.stanford.edu;https://www.epfl.ch", "aff_unique_abbr": "Princeton;Stanford;EPFL", "aff_campus_unique_index": "1;2", "aff_campus_unique": ";Stanford;Lausanne", "aff_country_unique_index": "0;0;1", "aff_country_unique": "United States;Switzerland" }, { "id": "3a505tMjGE", "title": "AVOID: Alleviating VAE's Overestimation in Unsupervised OOD Detection", "track": "main", "status": "Reject", "tldr": "", "abstract": "Deep generative models (DGMs) aim at characterizing the distribution of the training set by maximizing the marginal likelihood of inputs \nin an unsupervised manner, making them a promising option for unsupervised out-of-distribution (OOD) detection.\nHowever, recent works have reported that DGMs often assign higher likelihoods to OOD data than in-distribution (ID) data, i.e., **overestimation**, leading to their failures in OOD detection.\nAlthough several pioneer works have tried to analyze this phenomenon, and some VAE-based methods have also attempted to alleviate this issue by modifying their score functions for OOD detection, the root cause of the overestimation in VAE has never been revealed to our best knowledge.\nTo fill this gap, this paper will provide a thorough theoretical analysis on the overestimation issue of VAE, and reveal that this phenomenon arises from two aspects: 1) the improper design of prior distribution; 2) the gap of dataset entropy-mutual integration (sum of dataset entropy and mutual information terms) between ID and OOD datasets.\nBased on these findings, we propose a novel score function to **A**lleviate **V**AE's **O**verestimation **I**n unsupervised OOD **D**etection, named ``**AVOID**'', which contains two novel techniques, specifically post-hoc prior and dataset entropy-mutual calibration.\nExperimental results verify our theoretical analysis, demonstrating that the proposed method is effective in alleviating overestimation and improving unsupervised OOD detection performance.", "keywords": "Unsupervised Out-of-Distribution Detection;VAE", "primary_area": "probabilistic methods (Bayesian methods, variational inference, sampling, UQ, etc.)", "supplementary_material": "/attachment/5e71d3c32b265b8b2f53cffa81e9cd685502950f.zip", "author": "Yewen Li;Chaojie Wang;Xiaobo Xia;Hongxin Wei;Tongliang Liu;Bo An;Lei Feng;Xinrun Wang", "authorids": 
"~Yewen_Li1;~Chaojie_Wang1;~Xiaobo_Xia1;~Hongxin_Wei1;~Tongliang_Liu1;~Bo_An2;~Lei_Feng1;~Xinrun_Wang1", "gender": "M;M;M;M;M;M;M;M", "homepage": "https://scholar.google.com/citations?user=W5796yEAAAAJ&hl=zh-CN;https://chaojiewang94.github.io/;https://xiaoboxia.github.io/;https://hongxin001.github.io/;https://tongliang-liu.github.io/;https://personal.ntu.edu.sg/boan/;https://lfeng1995.github.io/;https://rainwangphy.github.io/", "dblp": "55/2231;134/9314-1;242/8072;150/6350;150/6667;42/6178-1.html;76/847-6;199/6413", "google_scholar": "W5796yEAAAAJ;https://scholar.google.com/citations?hl=en;jRsugY0AAAAJ;cABH034AAAAJ;https://scholar.google.com.au/citations?user=EiLdZ_YAAAAJ;PEEpuNwAAAAJ;https://scholar.google.com.sg/citations?user=KomQOFkAAAAJ;ROANfPUAAAAJ", "orcid": "0009-0008-0073-123X;;;;;0000-0002-7064-7438;0000-0003-2839-5799;", "linkedin": ";;;;;;;", "or_profile": "~Yewen_Li1;~Chaojie_Wang1;~Xiaobo_Xia1;~Hongxin_Wei1;~Tongliang_Liu1;~Bo_An2;~Lei_Feng1;~Xinrun_Wang1", "aff": "Nanyang Technological University;Skywork AI;The University of Sydney;Southern University of Science and Technology;Mohamed bin Zayed University of Artificial Intelligence;Nanyang Technological University;Singapore University of Technology and Design;Nanyang Technological University", "aff_domain": "ntu.edu.sg;kunlun-inc.com;sydney.edu.au;sustech.edu.cn;mbzuai.ac.ae;ntu.edu.sg;sutd.edu.sg;ntu.edu.sg", "position": "PhD student;Researcher;PhD student;Assistant Professor;Affiliated Associate Professor;Full Professor;Assistant Professor;Postdoc", "bibtex": "@misc{\nli2024avoid,\ntitle={{AVOID}: Alleviating {VAE}'s Overestimation in Unsupervised {OOD} Detection},\nauthor={Yewen Li and Chaojie Wang and Xiaobo Xia and Hongxin Wei and Tongliang Liu and Bo An and Lei Feng and Xinrun Wang},\nyear={2024},\nurl={https://openreview.net/forum?id=3a505tMjGE}\n}", "github": "", "project": "", "reviewers": "F6GH;jWXz;G5ek;ms1o", "site": "https://openreview.net/forum?id=3a505tMjGE", "pdf_size": 7588508, "rating": "6;6;6;6", "confidence": "4;4;4;4", "soundness": "3;3;2;3", "contribution": "3;3;3;3", "presentation": "3;3;4;3", "wc_summary": "99;159;278;106", "wc_strengths": "91;106;100;107", "wc_weaknesses": "764;212;506;212", "wc_questions": "196;110;271;62", "wc_review": "1150;587;1155;487", "wc_reply_reviewers": "307;0;215;0", "wc_reply_authors": "2054;650;1682;793", "reply_reviewers": "1;0;1;0", "reply_authors": "4;1;4;1", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 160.5, 71.69553682064178 ], "wc_strengths_avg": [ 101.0, 6.363961030678928 ], "wc_weaknesses_avg": [ 423.5, 230.3318258513139 ], "wc_questions_avg": [ 159.75, 80.18844991643122 ], "wc_review_avg": [ 844.75, 309.7792560840703 ], "wc_reply_reviewers_avg": [ 130.5, 134.49256485025484 ], "wc_reply_authors_avg": [ 1294.75, 590.3132113547858 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 2.5, 1.5 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:H902VqbwE_IJ:scholar.google.com/&scioq=AVOID:+Alleviating+VAE%27s+Overestimation+in+Unsupervised+OOD+Detection&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;1;2;3;4;0;5;0", "aff_unique_norm": "Nanyang Technological University;Skywork AI;University of Sydney;Southern University of Science and Technology;Mohamed bin 
Zayed University of Artificial Intelligence;Singapore University of Technology and Design", "aff_unique_dep": ";;;;;", "aff_unique_url": "https://www.ntu.edu.sg;https://www.skywork.ai;https://www.sydney.edu.au;https://www.sustech.edu.cn;https://mbzuai.ac.ae;https://www.sutd.edu.sg", "aff_unique_abbr": "NTU;Skywork AI;USYD;SUSTech;MBZUAI;SUTD", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;2;3;4;0;0;0", "aff_country_unique": "Singapore;United States;Australia;China;United Arab Emirates" }, { "id": "3aSbJhaVDi", "title": "Exploiting Open-World Data for Adaptive Continual Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "Continual learning (CL), which involves learning from sequential tasks without forgetting, is mainly explored in supervised learning settings where all data are labeled. However, high-quality labeled data may not be readily available at a large scale due to high labeling costs, making the application of existing CL methods in real-world scenarios challenging. In this paper, we delve into a more practical facet of CL: open-world continual learning, where the training data comes from the open-world dataset and is partially labeled and non-i.i.d. Building on the insight that task shifts in continual learning can be viewed as transitions from in-distribution (ID) data to out-of-distribution (OOD) data, we propose OpenACL, a method that explicitly leverages unlabeled OOD data to enhance continual learning. Specifically, OpenACL considers novel classes within OOD data as potential classes for upcoming tasks and mines the underlying pattern in unlabeled open-world data to empower the model's adaptability to upcoming tasks. Furthermore, learning from extensive unlabeled data also helps to tackle the issue of catastrophic forgetting. 
Extensive experiments validate the effectiveness of OpenACL and show the benefit of learning from open-world data.", "keywords": "Continual Learning;Incremental Learning;Semi-supervised Learning;Open-world", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "", "author": "Xuwei Tan;Tian Xie;Zhiqun Zuo;Xueru Zhang", "authorids": "~Xuwei_Tan1;~Tian_Xie4;~Zhiqun_Zuo1;~Xueru_Zhang2", "gender": "M;M;M;F", "homepage": "https://engineering.osu.edu/people/tan.1206;https://www.linkedin.com/in/tianxie1999/;https://github.com/zuozhiqun;https://xueruzhang.github.io/", "dblp": "308/6151;;258/4850;", "google_scholar": "IpTmmIYAAAAJ;;;PNBO_a4AAAAJ", "orcid": ";;;", "linkedin": ";tianxie1999/;;", "or_profile": "~Xuwei_Tan1;~Tian_Xie4;~Zhiqun_Zuo1;~Xueru_Zhang2", "aff": "Ohio State University, Columbus;Ohio State University, Columbus;Ohio State University, Columbus;Ohio State University", "aff_domain": "osu.edu;osu.edu;osu.edu;osu.edu", "position": "PhD student;PhD student;PhD student;Assistant Professor", "bibtex": "@misc{\ntan2024exploiting,\ntitle={Exploiting Open-World Data for Adaptive Continual Learning},\nauthor={Xuwei Tan and Tian Xie and Zhiqun Zuo and Xueru Zhang},\nyear={2024},\nurl={https://openreview.net/forum?id=3aSbJhaVDi}\n}", "github": "", "project": "", "reviewers": "58yd;9HZN;rvMJ;66AU", "site": "https://openreview.net/forum?id=3aSbJhaVDi", "pdf_size": 584142, "rating": "5;5;6;6", "confidence": "3;3;4;3", "soundness": "2;2;2;3", "contribution": "2;2;2;3", "presentation": "3;2;3;3", "wc_summary": "51;76;98;112", "wc_strengths": "59;51;38;99", "wc_weaknesses": "239;193;15;57", "wc_questions": "113;3;259;21", "wc_review": "462;323;410;289", "wc_reply_reviewers": "362;0;42;63", "wc_reply_authors": "2193;949;1335;260", "reply_reviewers": "2;0;1;2", "reply_authors": "6;3;4;3", "rating_avg": [ 5.5, 0.5 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 84.25, 23.09085316743407 ], "wc_strengths_avg": [ 61.75, 22.77471185328148 ], "wc_weaknesses_avg": [ 126.0, 92.65527507918802 ], "wc_questions_avg": [ 99.0, 101.36074190730847 ], "wc_review_avg": [ 371.0, 68.61122357165772 ], "wc_reply_reviewers_avg": [ 116.75, 143.40044455998034 ], "wc_reply_authors_avg": [ 1184.25, 698.1910107556528 ], "reply_reviewers_avg": [ 1.25, 0.82915619758885 ], "reply_authors_avg": [ 4.0, 1.224744871391589 ], "replies_avg": [ 28, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.5773502691896257, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:8lxZ6ZIiCwsJ:scholar.google.com/&scioq=Exploiting+Open-World+Data+for+Adaptive+Continual+Learning&hl=en&as_sdt=0,5", "gs_version_total": 2, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "Ohio State University", "aff_unique_dep": "", "aff_unique_url": "https://www.osu.edu", "aff_unique_abbr": "OSU", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Columbus;", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "title": "Why is SAM Robust to Label Noise?", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19504", "id": "3aZCPl3ZvR", "author_site": "Christina Baek, J Kolter, Aditi Raghunathan", "tldr": "", "abstract": "Sharpness-Aware Minimization (SAM) is most known for achieving state-of the-art performances on natural image and language tasks. 
However, its most pronounced improvements (of tens of percent) is rather in the presence of label noise. Understanding SAM's label noise robustness requires a departure from characterizing the robustness of minimas lying in ``flatter'' regions of the loss landscape. In particular, the peak performance under label noise occurs with early stopping, far before the loss converges. We decompose SAM's robustness into two effects: one induced by changes to the logit term and the other induced by changes to the network Jacobian. The first can be observed in linear logistic regression where SAM provably up-weights the gradient contribution from clean examples. Although this explicit up-weighting is also observable in neural networks, when we intervene and modify SAM to remove this effect, surprisingly, we see no visible degradation in performance. We infer that SAM's effect in deeper networks is instead explained entirely by the effect SAM has on the network Jacobian. We theoretically derive the implicit regularization induced by this Jacobian effect in two layer linear networks. Motivated by our analysis, we see that cheaper alternatives to SAM that explicitly induce these regularization effects largely recover the benefits in deep networks trained on real-world datasets.", "keywords": "generalization;sharpness;robustness;SAM", "primary_area": "optimization", "supplementary_material": "", "author": "Christina Baek;J Zico Kolter;Aditi Raghunathan", "authorids": "~Christina_Baek2;~J_Zico_Kolter1;~Aditi_Raghunathan1", "gender": ";F;M", "homepage": "https://kebaek.github.io;https://www.cs.cmu.edu/~aditirag/;http://www.zicokolter.com", "dblp": "202/7238;166/1409;67/2526", "google_scholar": ";Ch9iRwQAAAAJ;UXh1I6UAAAAJ", "orcid": ";;", "linkedin": ";;", "or_profile": "~Christina_Baek2;~Aditi_Raghunathan1;~Zico_Kolter1", "aff": "Carnegie Mellon University;Carnegie Mellon University;Carnegie Mellon University", "aff_domain": "cmu.edu;cmu.edu;cmu.edu", "position": "PhD student;Assistant Professor;Full Professor", "bibtex": "@inproceedings{\nbaek2024why,\ntitle={Why is {SAM} Robust to Label Noise?},\nauthor={Christina Baek and J Zico Kolter and Aditi Raghunathan},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=3aZCPl3ZvR}\n}", "github": "", "project": "", "reviewers": "Cbxh;WpDM;M3rX;ATLV", "pdf_size": 1203210, "rating": "6;6;6;6", "confidence": "4;4;3;3", "soundness": "3;3;2;3", "contribution": "2;3;2;3", "presentation": "2;3;3;3", "wc_summary": "117;120;69;116", "wc_strengths": "59;50;29;44", "wc_weaknesses": "24;33;52;651", "wc_questions": "29;43;116;6", "wc_review": "229;246;266;817", "wc_reply_reviewers": "22;15;25;25", "wc_reply_authors": "633;487;660;1318", "reply_reviewers": "1;1;1;1", "reply_authors": "2;2;2;3", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 105.5, 21.12463017427761 ], "wc_strengths_avg": [ 45.5, 10.920164833920778 ], "wc_weaknesses_avg": [ 190.0, 266.3503332079763 ], "wc_questions_avg": [ 48.5, 41.14911906711977 ], "wc_review_avg": [ 389.5, 247.16441896033498 ], "wc_reply_reviewers_avg": [ 21.75, 4.085033659592048 ], "wc_reply_authors_avg": [ 774.5, 320.6169833305778 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 2.25, 0.4330127018922193 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, 
"gs_citation": 15, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=16289533126675671960&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=3aZCPl3ZvR", "pdf": "https://openreview.net/pdf?id=3aZCPl3ZvR", "email": "cmu.edu;cmu.edu;cmu.edu", "author_num": 3, "aff_unique_index": "0;0;0", "aff_unique_norm": "Carnegie Mellon University", "aff_unique_dep": "", "aff_unique_url": "https://www.cmu.edu", "aff_unique_abbr": "CMU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "3b8CgMO5ix", "title": "Model guidance via explanations turns image classifiers into segmentation models", "track": "main", "status": "Reject", "tldr": "", "abstract": "Heatmaps generated on inputs of image classification networks via explainable AI methods like Grad-CAM and LRP have been observed to resemble segmentations of input images in many cases. Consequently, heatmaps have also been leveraged for achieving weakly supervised segmentation with image-level supervision.\nOn the other hand, losses can be imposed on differentiable heatmaps, which has been shown to serve for (1) improving heatmaps to be more human-interpretable, (2) regularization of networks towards better generalization, (3) training diverse ensembles of networks, and (4) for explicitly ignoring confounding input features. Due to the latter use case, the paradigm of imposing losses on heatmaps is often referred to as \"Right for the right reasons\". \nWe unify these two lines of research by investigating semi-supervised segmentation as a novel use case for the Right for the Right Reasons paradigm. \nFirst, we show formal parallels between differentiable heatmap architectures and standard encoder-decoder architectures for image segmentation. \nSecond, we show that such differentiable heatmap architectures yield competitive results when trained with standard segmentation losses. 
\nThird, we show that such architectures allow for training with weak supervision in the form of image-level labels and small numbers of pixel-level labels, outperforming comparable encoder-decoder models.", "keywords": "few-shot learning;semantic segmentation;interpretation", "primary_area": "visualization or interpretation of learned representations", "supplementary_material": "", "author": "Xiaoyan Yu;Jannik Franzen;Wojciech Samek;Marina MC H\u00f6hne;Dagmar Kainmueller", "authorids": "~Xiaoyan_Yu2;~Jannik_Franzen1;~Wojciech_Samek1;~Marina_MC_H\u00f6hne1;~Dagmar_Kainmueller2", "gender": "F;M;M;;F", "homepage": ";;http://iphome.hhi.de/samek/;;", "dblp": ";;79/9736;22/4586;167/3225", "google_scholar": ";;7aQwO08AAAAJ;mg0LpUwAAAAJ;https://scholar.google.de/citations?user=araOPxQAAAAJ", "orcid": "0000-0001-8196-663X;;;;", "linkedin": ";jannik-franzen-5931b121a;;;marina-marie-claire-h\u00f6hne-8949bb77/", "or_profile": "~Xiaoyan_Yu2;~Jannik_Franzen1;~Wojciech_Samek1;~Dagmar_Kainm\u00fcller1;~Marina_H\u00f6hne1", "aff": "Max Delbr\u00fcck Center for Molecular Medicine;Max Delbr\u00fcck Center for Molecular Medicine;Fraunhofer HHI;Max Delbr\u00fcck Center for Molecular Medicine;Universit\u00e4t Potsdam", "aff_domain": "mdc-berlin.de;mdc-berlin.de;hhi.fraunhofer.de;mdc-berlin.de;uni-potsdam.de", "position": "PhD student;PhD student;Assistant Professor;Group Leader;Full Professor", "bibtex": "@misc{\nyu2024model,\ntitle={Model guidance via explanations turns image classifiers into segmentation models},\nauthor={Xiaoyan Yu and Jannik Franzen and Wojciech Samek and Marina MC H{\\\"o}hne and Dagmar Kainmueller},\nyear={2024},\nurl={https://openreview.net/forum?id=3b8CgMO5ix}\n}", "github": "", "project": "", "reviewers": "K7Hs;nMm3;a33j;43DH", "site": "https://openreview.net/forum?id=3b8CgMO5ix", "pdf_size": 12292941, "rating": "3;5;6;8", "confidence": "4;4;4;4", "soundness": "2;3;2;4", "contribution": "2;2;2;3", "presentation": "1;1;1;3", "wc_summary": "12;29;60;77", "wc_strengths": "25;16;66;194", "wc_weaknesses": "78;62;59;91", "wc_questions": "6;1;259;91", "wc_review": "121;108;444;453", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "190;74;700;363", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;2;1", "rating_avg": [ 5.5, 1.8027756377319946 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.75, 0.82915619758885 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 1.5, 0.8660254037844386 ], "wc_summary_avg": [ 44.5, 25.46075411294803 ], "wc_strengths_avg": [ 75.25, 71.1033578672625 ], "wc_weaknesses_avg": [ 72.5, 12.893796958227627 ], "wc_questions_avg": [ 89.25, 104.32730946401331 ], "wc_review_avg": [ 281.5, 167.09353667931026 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 331.75, 236.17406186963038 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:Lz_rfX9EBVkJ:scholar.google.com/&scioq=Model+guidance+via+explanations+turns+image+classifiers+into+segmentation+models&hl=en&as_sdt=0,33", "gs_version_total": 5, "aff_unique_index": "0;0;1;0;2", "aff_unique_norm": "Max Delbr\u00fcck Center for Molecular Medicine;Fraunhofer Heinrich Hertz Institute;University of Potsdam", "aff_unique_dep": ";;", "aff_unique_url": "https://www.mdc-berlin.de;https://www.hhi.fraunhofer.de/;https://www.uni-potsdam.de", "aff_unique_abbr": "MDC;HHI;UP", 
"aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "Germany" }, { "id": "3bV46RKWVA", "title": "Diversity-Aware Agnostic Ensemble of Sharpness Minimizers", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "There has long been a variety of theoretical and empirical evidence supporting the success of ensemble learning. Deep ensembles in particular leverage training randomness and expressivity of individual neural networks to gain prediction diversity and ultimately a boost in generalization performance, robustness and uncertainty estimation. In respect of generalization ability, it is found that minimizers pursuing wider local minima result in models being more robust to shifts between training and testing sets. A natural research question arises out of these two approaches as to whether better generalization ability can be achieved if ensemble learning and loss sharpness minimization is integrated. Our work takes the lead in investigating this connection and proposes DASH - a learning algorithm that promotes diversity and flatness within deep ensembles. More concretely, DASH encourages base learners to move divergently towards low-loss regions of minimal sharpness. We provide a theoretical backbone for our method along with empirical evidence demonstrating an improvement in ensemble generalization ability.", "keywords": "SAM;Ensemble learning;Sharpness-Aware Minimization", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Anh Tuan Bui;Vy Vo;Tung Pham;He Zhao;Dinh Phung;Trung Le", "authorids": "~Anh_Tuan_Bui2;~Vy_Vo2;~Tung_Pham1;~He_Zhao1;~Dinh_Phung2;~Trung_Le2", "gender": "M;F;M;;;M", "homepage": "https://tuananhbui89.github.io/;https://isvy08.github.io/;;;;", "dblp": "120/0106;176/4660;38/10862-1;;;", "google_scholar": "jEjMZ7oAAAAJ;3CpFpFkAAAAJ;KcUuEKsAAAAJ;;;https://scholar.google.com/citations?hl=en", "orcid": ";;;;;", "linkedin": ";;;;;", "or_profile": "~Anh_Tuan_Bui2;~Vy_Vo2;~Tung_Pham1;~He_Zhao1;~Dinh_Phung2;~Trung_Le2", "aff": "Monash University;Monash University;VinAI Research;;;Monash University", "aff_domain": "monash.edu;monash.edu;vinai.io;;;monash.edu", "position": "Postdoc;PhD student;Researcher;;;Assistant Professor", "bibtex": "@misc{\nbui2024diversityaware,\ntitle={Diversity-Aware Agnostic Ensemble of Sharpness Minimizers},\nauthor={Anh Tuan Bui and Vy Vo and Tung Pham and He Zhao and Dinh Phung and Trung Le},\nyear={2024},\nurl={https://openreview.net/forum?id=3bV46RKWVA}\n}", "github": "", "project": "", "reviewers": "XYNF;XaPX;UbbB;xVVh", "site": "https://openreview.net/forum?id=3bV46RKWVA", "pdf_size": 2582464, "rating": "3;3;3;6", "confidence": "4;4;3;2", "soundness": "2;2;2;3", "contribution": "2;1;2;2", "presentation": "2;2;1;3", "wc_summary": "76;44;40;25", "wc_strengths": "59;18;45;66", "wc_weaknesses": "596;483;214;91", "wc_questions": "75;116;243;33", "wc_review": "806;661;542;215", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 3.75, 1.299038105676658 ], "confidence_avg": [ 3.25, 0.82915619758885 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 2.0, 0.7071067811865476 ], "wc_summary_avg": [ 46.25, 18.579222265746218 ], "wc_strengths_avg": [ 47.0, 18.371173070873837 ], "wc_weaknesses_avg": [ 346.0, 202.31040507101952 ], "wc_questions_avg": [ 116.75, 
78.57599824373852 ], "wc_review_avg": [ 556.0, 217.94609425268442 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.8703882797784892, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=13721089435499981022&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "aff_unique_index": "0;0;1;0", "aff_unique_norm": "Monash University;VinAI Research", "aff_unique_dep": ";", "aff_unique_url": "https://www.monash.edu;https://www.vinai.io/", "aff_unique_abbr": "Monash;VinAI", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;1;0", "aff_country_unique": "Australia;Vietnam" }, { "id": "3bmjHYX42n", "title": "Leveraging Human Revisions for Improving Text-to-Layout Models", "track": "main", "status": "Reject", "tldr": "", "abstract": "Learning from human feedback has shown success in aligning large, pretrained models with human values. However, prior works have mostly focused on using high-level labels, such as preferences between pairs of model outputs. On the other hand, many domains could benefit from more involved, detailed feedback, such as corrections, explanations, and reasoning of human users. Our work proposes using nuanced feedback through the form of human revisions for stronger alignment. In this paper, we ask expert designers to fix layouts generated from a generative layout model that is pretrained on a large-scale dataset of mobile screens. Then, we train a reward model based on how human designers revise these generated layouts. With the learned reward model, we optimize our model with reinforcement learning from human feedback (RLHF). 
Our method, Revision-Aware Reward Models (RARE), allows a generative model to produce more modern, designer-aligned layouts, showing the potential for utilizing human corrections and stronger forms of feedback in improving generative models.", "keywords": "human feedback;reinforcement learning;generative models;UI layouts", "primary_area": "generative models", "supplementary_material": "/attachment/a4e99ce13cf35663b57423d0acf0103f202a8dd6.pdf", "author": "Amber Xie;Chin-Yi Cheng;Forrest Huang;Yang Li", "authorids": "~Amber_Xie1;~Chin-Yi_Cheng1;~Forrest_Huang1;~Yang_Li2", "gender": ";M;M;M", "homepage": ";;https://forresthuang.com;http://yangl.org", "dblp": ";;224/0243;37/4190-58", "google_scholar": "https://scholar.google.com/citations?hl=en;https://scholar.google.com/citations?hl=en;IgHGybQAAAAJ;ZZdB48QAAAAJ", "orcid": ";;;", "linkedin": ";chinyi/;;yang-li-127a2a41/", "or_profile": "~Amber_Xie1;~Chin-Yi_Cheng1;~Forrest_Huang1;~Yang_Li2", "aff": ";Google;Apple;Google", "aff_domain": ";google.com;apple.com;google.com", "position": ";Researcher;Research Scientist;Research Scientist", "bibtex": "@misc{\nxie2024leveraging,\ntitle={Leveraging Human Revisions for Improving Text-to-Layout Models},\nauthor={Amber Xie and Chin-Yi Cheng and Forrest Huang and Yang Li},\nyear={2024},\nurl={https://openreview.net/forum?id=3bmjHYX42n}\n}", "github": "", "project": "", "reviewers": "d2Zb;otPj;RQ9B;Qjey", "site": "https://openreview.net/forum?id=3bmjHYX42n", "pdf_size": 1482729, "rating": "5;5;5;6", "confidence": "3;4;3;3", "soundness": "3;2;2;2", "contribution": "2;3;2;2", "presentation": "3;2;2;2", "wc_summary": "63;36;48;121", "wc_strengths": "37;19;38;161", "wc_weaknesses": "157;204;131;258", "wc_questions": "47;131;12;33", "wc_review": "304;390;229;573", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "534;901;547;870", "reply_reviewers": "0;0;0;0", "reply_authors": "1;2;1;2", "rating_avg": [ 5.25, 0.4330127018922193 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 67.0, 32.61134771824066 ], "wc_strengths_avg": [ 63.75, 56.65410399962213 ], "wc_weaknesses_avg": [ 187.5, 48.386465049639654 ], "wc_questions_avg": [ 55.75, 45.19610049550735 ], "wc_review_avg": [ 374.0, 128.24000935745443 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 713.0, 172.9089355701434 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.3333333333333333, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:jN_E4kKTPNQJ:scholar.google.com/&scioq=Leveraging+Human+Revisions+for+Improving+Text-to-Layout+Models&hl=en&as_sdt=0,47", "gs_version_total": 3, "aff_unique_index": "0;1;0", "aff_unique_norm": "Google;Apple", "aff_unique_dep": "Google;Apple Inc.", "aff_unique_url": "https://www.google.com;https://www.apple.com", "aff_unique_abbr": "Google;Apple", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Mountain View;", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "title": "Take a Step Back: Evoking Reasoning via Abstraction in Large Language Models", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19503", "id": "3bq3jsvcQ1", "author_site": "Huaixiu Steven Zheng, Swaroop Mishra, Xinyun Chen, Heng-Tze Cheng, Ed H. 
Chi, Quoc V Le, Denny Zhou", "tldr": "", "abstract": "We present STEP-BACK PROMPTING, a simple prompting technique that enables LLMs to do abstractions to derive high-level concepts and first principles from instances containing specific details. Using the concepts and principles to guide reasoning, LLMs significantly improve their abilities in following a correct reasoning path towards the solution. We conduct experiments of STEP-BACK PROMPTING with PaLM-2L, GPT-4 and Llama2-70B models, and observe substantial performance gains on various challenging reasoning-intensive tasks including STEM, Knowledge QA, and Multi-Hop Reasoning. For instance, STEP-BACK PROMPTING improves PaLM-2L performance on MMLU (Physics and Chemistry) by 7% and 11% respectively, TimeQA by 27%, and MuSiQue by 7%.", "keywords": "Prompting;Large Language Models;Reasoning;Abstraction", "primary_area": "generative models", "supplementary_material": "", "author": "Huaixiu Steven Zheng;Swaroop Mishra;Xinyun Chen;Heng-Tze Cheng;Ed H. Chi;Quoc V Le;Denny Zhou", "authorids": "~Huaixiu_Steven_Zheng1;~Swaroop_Mishra1;~Xinyun_Chen1;~Heng-Tze_Cheng1;~Ed_H._Chi1;~Quoc_V_Le1;~Denny_Zhou1", "gender": "M;M;;M;;M;F", "homepage": ";https://swarooprm.github.io/;https://www.linkedin.com/in/hengtze;;https://dennyzhou.github.io/;http://edchi.net;https://jungyhuk.github.io/", "dblp": "307/3201;249/2784;30/8739;29/6166;178/3277;13/310;", "google_scholar": "PyK4x4wAAAAJ;-7LK2SwAAAAJ;;;UwLsYw8AAAAJ;VuWl-KUAAAAJ;d4W1UT0AAAAJ", "orcid": ";;;;;0000-0003-3230-5338;", "linkedin": ";;;;;edchi/;", "or_profile": "~Huaixiu_Steven_Zheng1;~Swaroop_Mishra1;~Heng-Tze_Cheng1;~Quoc_V_Le1;~Dengyong_Zhou2;~Ed_Chi1;~Xinyun_Chen2", "aff": "Google;Google;;Google;Google DeepMind;Google;Google", "aff_domain": "google.com;google.com;;google.com;google.com;google.com;google.com", "position": "Software Engineer;Researcher;;Scientist;Research Scientist;Researcher;Researcher", "bibtex": "@inproceedings{\nzheng2024take,\ntitle={Take a Step Back: Evoking Reasoning via Abstraction in Large Language Models},\nauthor={Huaixiu Steven Zheng and Swaroop Mishra and Xinyun Chen and Heng-Tze Cheng and Ed H. 
Chi and Quoc V Le and Denny Zhou},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=3bq3jsvcQ1}\n}", "github": "", "project": "", "reviewers": "XiDg;FiKx;xaDx", "pdf_size": 870565, "rating": "8;8;8", "confidence": "4;3;3", "soundness": "3;4;4", "contribution": "3;4;3", "presentation": "3;3;3", "wc_summary": "81;58;90", "wc_strengths": "83;43;67", "wc_weaknesses": "312;116;153", "wc_questions": "133;124;6", "wc_review": "609;341;316", "wc_reply_reviewers": "325;57;35", "wc_reply_authors": "812;586;483", "reply_reviewers": "1;1;1", "reply_authors": "2;2;1", "rating_avg": [ 8.0, 0.0 ], "confidence_avg": [ 3.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 3.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 3.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 76.33333333333333, 13.474255287605157 ], "wc_strengths_avg": [ 64.33333333333333, 16.438437341250605 ], "wc_weaknesses_avg": [ 193.66666666666666, 85.02679316283518 ], "wc_questions_avg": [ 87.66666666666667, 57.86382481501048 ], "wc_review_avg": [ 422.0, 132.62227062852855 ], "wc_reply_reviewers_avg": [ 139.0, 131.82817099037166 ], "wc_reply_authors_avg": [ 627.0, 137.40693820425034 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 1.6666666666666667, 0.4714045207910317 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 157, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=3437259973551531575&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=3bq3jsvcQ1", "pdf": "https://openreview.net/pdf?id=3bq3jsvcQ1", "email": "google.com;google.com;;google.com;google.com;google.com;google.com", "author_num": 7, "aff_unique_index": "0;0;0;0;0;0", "aff_unique_norm": "Google", "aff_unique_dep": "Google", "aff_unique_url": "https://www.google.com", "aff_unique_abbr": "Google", "aff_campus_unique_index": "0;0;0;0;0", "aff_campus_unique": "Mountain View;", "aff_country_unique_index": "0;0;0;1;0;0", "aff_country_unique": "United States;United Kingdom" }, { "id": "3bqesUzZPH", "title": "FTA: Stealthy and Adaptive Backdoor Attack with Flexible Triggers on Federated Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "Current backdoor attacks against federated learning (FL) strongly rely on universal triggers or semantic patterns, which can be easily detected and filtered by certain defense mechanisms such as norm clipping, trigger inversion and etc.\nIn this work, we propose a novel generator-assisted backdoor attack, FTA, against FL defenses.\nIn this method, we build a generative trigger function that can learn to manipulate the benign samples with naturally imperceptible trigger patterns (stealthy) and simultaneously make poisoned samples include similar hidden features of the attacker-chosen label. \nMoreover, our trigger generator repeatedly produces triggers for each sample (flexibility) in each FL iteration (adaptivity), allowing it to adjust to changes of hidden features between global models of different rounds.\nInstead of using universal and predefined triggers of existing works, we break this wall by providing three desiderate (i.e., stealthy, flexibility and adaptivity), which helps our attack avoid the presence of backdoor-related hidden features or backdoor routing. 
\nExtensive experiments confirmed the effectiveness (above 98\\% attack success rate) and stealthiness of our attack compared to prior attacks on decentralized learning frameworks with eight well-studied defenses.", "keywords": "federated learning;backdoor attack;trigger generator;robustness", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/410e83506017bdee675d58b231c1a0687905b1ca.zip", "author": "Yanqi Qiao;Dazhuang Liu;Congwen Chen;Rui Wang;Kaitai Liang", "authorids": "~Yanqi_Qiao1;~Dazhuang_Liu1;~Congwen_Chen1;~Rui_Wang24;~Kaitai_Liang1", "gender": "M;;M;M;M", "homepage": "https://www.tudelft.nl/en/eemcs/the-faculty/departments/intelligent-systems/cybersecurityeemcs/people/yanqi-qiao;;;https://www.tudelft.nl/en/eemcs/the-faculty/departments/intelligent-systems/cybersecurityeemcs/people/rui-wang;https://sites.google.com/view/kaitailiang", "dblp": "322/9220;;314/0597;;", "google_scholar": ";;;https://scholar.google.com/citations?hl=en;", "orcid": ";;;;", "linkedin": ";;https://linkedin.com/in/congwen-chen-144750231;;", "or_profile": "~Yanqi_Qiao1;~Dazhuang_Liu1;~Congwen_Chen1;~Rui_Wang24;~Kaitai_Liang1", "aff": "Delft University of Technology;;;;Delft University of Technology", "aff_domain": "tudelft.nl;;;;tudelft.nl", "position": "PhD student;;;;Assistant Professor", "bibtex": "@misc{\nqiao2024fta,\ntitle={{FTA}: Stealthy and Adaptive Backdoor Attack with Flexible Triggers on Federated Learning},\nauthor={Yanqi Qiao and Dazhuang Liu and Congwen Chen and Rui Wang and Kaitai Liang},\nyear={2024},\nurl={https://openreview.net/forum?id=3bqesUzZPH}\n}", "github": "", "project": "", "reviewers": "cGsZ;gADe;nnMX", "site": "https://openreview.net/forum?id=3bqesUzZPH", "pdf_size": 10340369, "rating": "5;5;6", "confidence": "4;4;3", "soundness": "3;3;3", "contribution": "2;2;2", "presentation": "2;3;2", "wc_summary": "15;46;31", "wc_strengths": "37;31;16", "wc_weaknesses": "403;103;195", "wc_questions": "158;9;144", "wc_review": "613;189;386", "wc_reply_reviewers": "298;0;23", "wc_reply_authors": "1311;456;663", "reply_reviewers": "2;0;1", "reply_authors": "3;2;2", "rating_avg": [ 5.333333333333333, 0.4714045207910317 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 30.666666666666668, 12.657891697365017 ], "wc_strengths_avg": [ 28.0, 8.831760866327848 ], "wc_weaknesses_avg": [ 233.66666666666666, 125.48926470242606 ], "wc_questions_avg": [ 103.66666666666667, 67.18300049533033 ], "wc_review_avg": [ 396.0, 173.24164241505756 ], "wc_reply_reviewers_avg": [ 107.0, 135.38340617175604 ], "wc_reply_authors_avg": [ 810.0, 364.20049423360206 ], "reply_reviewers_avg": [ 1.0, 0.816496580927726 ], "reply_authors_avg": [ 2.3333333333333335, 0.4714045207910317 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.9999999999999997, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=15899732668944491480&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "aff_unique_index": "0;0", "aff_unique_norm": "Delft University of Technology", "aff_unique_dep": "", "aff_unique_url": "https://www.tudelft.nl", "aff_unique_abbr": "TU Delft", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "Netherlands" }, { "id": "3cE6NKYy8x", "title": "Towards Fair Graph Anomaly 
Detection: Problem, New Datasets, and Evaluation", "track": "main", "status": "Reject", "tldr": "", "abstract": "The Fair Graph Anomaly Detection (FairGAD) problem aims to accurately detect anomalous nodes in an input graph while ensuring fairness and avoiding biased predictions against individuals from sensitive subgroups such as gender or political leanings. Fairness in graphs is particularly crucial in anomaly detection areas such as misinformation detection, where decision outcomes can significantly affect individuals. Despite this need, existing works lack realistic datasets that encompass actual graph structures, anomaly labels, and sensitive attributes for research in FairGAD. To bridge this gap, we present two novel graph datasets constructed from the globally prominent social media platforms Reddit and Twitter. These datasets comprise 1.2 million and 400 thousand edges associated with 9 thousand and 47 thousand nodes, respectively, and leverage political leanings as sensitive attributes and misinformation spreaders as anomaly labels. We demonstrate that our FairGAD datasets significantly differ from the synthetic datasets used by the research community. These new datasets offer significant values for FairGAD by providing realistic data that captures the intricacies of social networks. Using our datasets, we investigate the performance-fairness trade-off in three existing GAD methods on five state-of-the-art fairness methods, which sheds light on their effectiveness and limitations in addressing the FairGAD problem.", "keywords": "graph anomaly detection;fairness;fair graph anomaly detection;benchmark datasets", "primary_area": "datasets and benchmarks", "supplementary_material": "", "author": "Neng Kai Nigel Neo;Yeon-Chang Lee;Yiqiao Jin;Sang-Wook Kim;Srijan Kumar", "authorids": "~Neng_Kai_Nigel_Neo1;~Yeon-Chang_Lee1;~Yiqiao_Jin1;~Sang-Wook_Kim1;~Srijan_Kumar1", "gender": ";;M;M;M", "homepage": ";https://sites.google.com/view/yclee/;https://ahren09.github.io/;https://bigdas.hanyang.ac.kr/;https://faculty.cc.gatech.edu/~srijan/", "dblp": ";167/5996;207/6631.html;64/5810;131/9628", "google_scholar": ";https://scholar.google.co.kr/citations?user=GzzNEJAAAAAJ;eY85qm4AAAAJ;https://scholar.google.co.kr/citations?user=ed2vz_oAAAAJ;kqfLNK8AAAAJ", "orcid": ";0000-0002-8769-0678;0000-0002-6974-5970;0000-0002-6345-9084;0000-0002-5796-3532", "linkedin": ";;ahren-jin/;;srijankr/", "or_profile": "~Neng_Kai_Nigel_Neo1;~Yeon-Chang_Lee1;~Yiqiao_Jin1;~Sang-Wook_Kim1;~Srijan_Kumar1", "aff": ";Ulsan National Institute of Science and Technology;Georgia Institute of Technology;Hanyang University;Georgia Institute of Technology", "aff_domain": ";unist.ac.kr;gatech.edu;hanyang.ac.kr;gatech.edu", "position": ";Assistant Professor;PhD student;Full Professor;Assistant Professor", "bibtex": "@misc{\nneo2024towards,\ntitle={Towards Fair Graph Anomaly Detection: Problem, New Datasets, and Evaluation},\nauthor={Neng Kai Nigel Neo and Yeon-Chang Lee and Yiqiao Jin and Sang-Wook Kim and Srijan Kumar},\nyear={2024},\nurl={https://openreview.net/forum?id=3cE6NKYy8x}\n}", "github": "", "project": "", "reviewers": "QKDb;9VrT;jyni;rPbE", "site": "https://openreview.net/forum?id=3cE6NKYy8x", "pdf_size": 1887519, "rating": "3;5;6;8", "confidence": "1;3;3;4", "soundness": "2;2;3;3", "contribution": "2;2;3;4", "presentation": "3;3;3;4", "wc_summary": "144;173;96;53", "wc_strengths": "20;76;62;68", "wc_weaknesses": "273;189;455;193", "wc_questions": "91;286;69;2", "wc_review": "528;724;682;316", "wc_reply_reviewers": 
"0;116;175;0", "wc_reply_authors": "1663;1555;2205;658", "reply_reviewers": "0;1;1;0", "reply_authors": "4;4;4;1", "rating_avg": [ 5.5, 1.8027756377319946 ], "confidence_avg": [ 2.75, 1.0897247358851685 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.75, 0.82915619758885 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 116.5, 45.828484592008934 ], "wc_strengths_avg": [ 56.5, 21.650635094610966 ], "wc_weaknesses_avg": [ 277.5, 107.8181339107666 ], "wc_questions_avg": [ 112.0, 105.67166129100082 ], "wc_review_avg": [ 562.5, 159.93357996368368 ], "wc_reply_reviewers_avg": [ 72.75, 75.68148716826329 ], "wc_reply_authors_avg": [ 1520.25, 555.4148787168021 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 3.25, 1.299038105676658 ], "replies_avg": [ 22, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.9544271444636667, "gs_citation": 6, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14943895517549817533&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 2, "aff_unique_index": "0;1;2;1", "aff_unique_norm": "Ulsan National Institute of Science and Technology;Georgia Institute of Technology;Hanyang University", "aff_unique_dep": ";;", "aff_unique_url": "https://www.unist.ac.kr;https://www.gatech.edu;https://www.hanyang.ac.kr", "aff_unique_abbr": "UNIST;Georgia Tech;HYU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;0;1", "aff_country_unique": "South Korea;United States" }, { "title": "Identifying Representations for Intervention Extrapolation", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19502", "id": "3cuJwmPxXj", "author_site": "Sorawit (James) Saengkyongam, Elan Rosenfeld, Pradeep K Ravikumar, Niklas Pfister, Jonas Peters", "tldr": "", "abstract": "The premise of identifiable and causal representation learning is to improve the current representation learning paradigm in terms of generalizability or robustness. Despite recent progress in questions of identifiability, more theoretical results demonstrating concrete advantages of these methods for downstream tasks are needed. In this paper, we consider the task of intervention extrapolation: predicting how interventions affect an outcome, even when those interventions are not observed at training time, and show that identifiable representations can provide an effective solution to this task even if the interventions affect the outcome non-linearly. Our setup includes an outcome variable $Y$, observed features $X$, which are generated as a non-linear transformation of latent features $Z$, and exogenous action variables $A$, which influence $Z$. The objective of intervention extrapolation is then to predict how interventions on $A$ that lie outside the training support of $A$ affect $Y$. Here, extrapolation becomes possible if the effect of $A$ on $Z$ is linear and the residual when regressing Z on A has full support. As $Z$ is latent, we combine the task of intervention extrapolation with identifiable representation learning, which we call $\\texttt{Rep4Ex}$: we aim to map the observed features $X$ into a subspace that allows for non-linear extrapolation in $A$. We show that the hidden representation is identifiable up to an affine transformation in $Z$-space, which, we prove, is sufficient for intervention extrapolation. The identifiability is characterized by a novel constraint describing the linearity assumption of $A$ on $Z$. 
Based on this insight, we propose a flexible method that enforces the linear invariance constraint and can be combined with any type of autoencoder. We validate our theoretical findings through a series of synthetic experiments and show that our approach can indeed succeed in predicting the effects of unseen interventions.", "keywords": "causality;extrapolation;exogenous variables;causal representation learning;identifiable representation learning;control functions;instrumental variables;invariance", "primary_area": "causal reasoning", "supplementary_material": "/attachment/ca0776cd9e91d0b874238a4bfb5ae74e4b210e3f.zip", "author": "Sorawit Saengkyongam;Elan Rosenfeld;Pradeep Kumar Ravikumar;Niklas Pfister;Jonas Peters", "authorids": "~Sorawit_Saengkyongam1;~Elan_Rosenfeld1;~Pradeep_Kumar_Ravikumar1;~Niklas_Pfister1;~Jonas_Peters2", "gender": ";M;M;;M", "homepage": "https://sorawitj.github.io/;;http://www.cs.cmu.edu/~pradeepr/;https://niklaspfister.github.io/;https://people.math.ethz.ch/~jopeters/", "dblp": ";236/4508;94/3594;222/3117;48/97", "google_scholar": "e3aDv1QAAAAJ;f0j0K8QAAAAJ;https://scholar.google.com.tw/citations?user=Q4DTPw4AAAAJ;u2G6pzcAAAAJ;https://scholar.google.de/citations?user=kBQ4VvEAAAAJ", "orcid": ";;;0000-0001-6203-9777;", "linkedin": ";;;;", "or_profile": "~Sorawit_Saengkyongam1;~Elan_Rosenfeld1;~Pradeep_Kumar_Ravikumar1;~Niklas_Pfister1;~Jonas_Peters2", "aff": "ETH Z\u00fcrich;Carnegie Mellon University;Carnegie Mellon University;University of Copenhagen;ETHZ - ETH Zurich", "aff_domain": "math.ethz.ch;andrew.cmu.edu;cmu.edu;ku.dk;ethz.ch", "position": "PhD student;PhD student;Full Professor;Associate Professor;Full Professor", "bibtex": "@inproceedings{\nsaengkyongam2024identifying,\ntitle={Identifying Representations for Intervention Extrapolation},\nauthor={Sorawit Saengkyongam and Elan Rosenfeld and Pradeep Kumar Ravikumar and Niklas Pfister and Jonas Peters},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=3cuJwmPxXj}\n}", "github": "", "project": "", "reviewers": "wfVE;dGv9;k2zA;iVVC", "pdf_size": 4071912, "rating": "8;8;8;8", "confidence": "4;4;4;4", "soundness": "4;3;3;3", "contribution": "4;3;3;4", "presentation": "4;4;3;3", "wc_summary": "268;107;135;86", "wc_strengths": "137;53;32;90", "wc_weaknesses": "375;64;487;65", "wc_questions": "231;196;63;98", "wc_review": "1011;420;717;339", "wc_reply_reviewers": "4;0;35;0", "wc_reply_authors": "1009;1025;1295;547", "reply_reviewers": "1;0;1;0", "reply_authors": "2;2;2;1", "rating_avg": [ 8.0, 0.0 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 3.5, 0.5 ], "presentation_avg": [ 3.5, 0.5 ], "wc_summary_avg": [ 149.0, 70.86959855960805 ], "wc_strengths_avg": [ 78.0, 39.89360851063739 ], "wc_weaknesses_avg": [ 247.75, 187.47983224869816 ], "wc_questions_avg": [ 147.0, 68.76408946535975 ], "wc_review_avg": [ 621.75, 265.15973959106236 ], "wc_reply_reviewers_avg": [ 9.75, 14.669270602180601 ], "wc_reply_authors_avg": [ 969.0, 268.8382413273826 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.75, 0.4330127018922193 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 18, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=13348287505911038180&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 7, "openreview": "https://openreview.net/forum?id=3cuJwmPxXj", "pdf": "https://openreview.net/pdf?id=3cuJwmPxXj", 
"email": "math.ethz.ch;andrew.cmu.edu;cmu.edu;ku.dk;ethz.ch", "author_num": 5, "aff_unique_index": "0;1;1;2;0", "aff_unique_norm": "ETH Zurich;Carnegie Mellon University;University of Copenhagen", "aff_unique_dep": ";;", "aff_unique_url": "https://www.ethz.ch;https://www.cmu.edu;https://www.ku.dk", "aff_unique_abbr": "ETHZ;CMU;UCPH", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;1;2;0", "aff_country_unique": "Switzerland;United States;Denmark" }, { "title": "Privately Aligning Language Models with Reinforcement Learning", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19501", "id": "3d0OmYTNui", "author_site": "Fan Wu, Huseyin Inan, Arturs Backurs, Varun Chandrasekaran, Janardhan Kulkarni, Robert Sim", "tldr": "", "abstract": "Positioned between pre-training and user deployment, aligning large language models (LLMs) through reinforcement learning (RL) has emerged as a prevailing strategy for training instruction following-models such as ChatGPT. In this work, we initiate the study of privacy-preserving alignment of LLMs through Differential Privacy (DP) in conjunction with RL. Following the influential work of Ziegler et al. (2020), we study two dominant paradigms: (i) alignment via RL without human in the loop (e.g., positive review generation) and (ii) alignment via RL from human feedback (RLHF) (e.g., summarization in a human-preferred way). We give a new DP framework to achieve alignment via RL, and prove its correctness. Our experimental results validate the effectiveness of our approach, offering competitive utility while ensuring strong privacy protections.", "keywords": "Large Language Models;RLHF;Alignment;Differential Privacy", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/8533995075a0f8cc73da220bc27a7b4b58895d3f.pdf", "author": "Fan Wu;Huseyin A Inan;Arturs Backurs;Varun Chandrasekaran;Janardhan Kulkarni;Robert Sim", "authorids": "~Fan_Wu6;~Huseyin_A_Inan1;~Arturs_Backurs1;~Varun_Chandrasekaran1;~Janardhan_Kulkarni2;~Robert_Sim1", "gender": "F;;M;M;M;", "homepage": ";http://www.mit.edu/~backurs/;http://pages.cs.wisc.edu/~chandrasekaran/;;;", "dblp": "07/6378-11;74/10669;;54/1978;47/1233;41/11141", "google_scholar": "qd8WzBMAAAAJ;UNHdIKoAAAAJ;Sl7nSOsAAAAJ;_fxnybwAAAAJ;uT8sPt8AAAAJ;BGN4egcAAAAJ", "orcid": ";;;;;", "linkedin": ";;;;simra/;", "or_profile": "~Fan_Wu6;~Arturs_Backurs1;~Varun_Chandrasekaran1;~Janardhan_Kulkarni2;~Robert_Sim1;~Huseyin_Atahan_Inan1", "aff": "University of Illinois, Urbana Champaign;Microsoft;University of Illinois Urbana-Champaign;Microsoft Research, Redmond;Microsoft;Microsoft", "aff_domain": "illinois.edu;microsoft.com;illinois.edu;microsoft.com;microsoft.com;microsoft.com", "position": "PhD student;Researcher;Assistant Professor;Researcher;Principal Researcher;Researcher", "bibtex": "@inproceedings{\nwu2024privately,\ntitle={Privately Aligning Language Models with Reinforcement Learning},\nauthor={Fan Wu and Huseyin A Inan and Arturs Backurs and Varun Chandrasekaran and Janardhan Kulkarni and Robert Sim},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=3d0OmYTNui}\n}", "github": "", "project": "", "reviewers": "JeaX;vWsq;A7MT", "pdf_size": 1164572, "rating": "6;6;8", "confidence": "2;3;3", "soundness": "3;3;3", "contribution": "2;3;3", "presentation": "3;3;4", "wc_summary": "37;49;33", "wc_strengths": "44;108;46", 
"wc_weaknesses": "132;157;74", "wc_questions": "4;41;28", "wc_review": "217;355;181", "wc_reply_reviewers": "17;82;0", "wc_reply_authors": "649;1003;619", "reply_reviewers": "1;1;0", "reply_authors": "1;3;1", "rating_avg": [ 6.666666666666667, 0.9428090415820634 ], "confidence_avg": [ 2.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 3.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 39.666666666666664, 6.79869268479038 ], "wc_strengths_avg": [ 66.0, 29.709706606876257 ], "wc_weaknesses_avg": [ 121.0, 34.76588366008646 ], "wc_questions_avg": [ 24.333333333333332, 15.326085243430198 ], "wc_review_avg": [ 251.0, 74.9933330370107 ], "wc_reply_reviewers_avg": [ 33.0, 35.33647784749729 ], "wc_reply_authors_avg": [ 757.0, 174.37889780589853 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 1.6666666666666667, 0.9428090415820634 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.49999999999999983, "gs_citation": 9, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10110203762954942936&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=3d0OmYTNui", "pdf": "https://openreview.net/pdf?id=3d0OmYTNui", "email": "illinois.edu;microsoft.com;illinois.edu;microsoft.com;microsoft.com;microsoft.com", "author_num": 6, "aff_unique_index": "0;1;0;1;1;1", "aff_unique_norm": "University of Illinois Urbana-Champaign;Microsoft", "aff_unique_dep": ";Microsoft Corporation", "aff_unique_url": "https://illinois.edu;https://www.microsoft.com", "aff_unique_abbr": "UIUC;Microsoft", "aff_campus_unique_index": "0;0;2", "aff_campus_unique": "Urbana-Champaign;;Redmond", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "United States" }, { "title": "Efficient-3Dim: Learning a Generalizable Single-image Novel-view Synthesizer in One Day", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19500", "id": "3eFMnZ3N4J", "author_site": "Yifan Jiang, Hao Tang, Jen-Hao Chang, Liangchen Song, Zhangyang Wang, Liangliang Cao", "tldr": "", "abstract": "The task of novel view synthesis aims to generate unseen perspectives of an object or scene from a limited set of input images. Nevertheless, synthesizing novel views from a single image remains a significant challenge. Previous approaches tackle this problem by adopting mesh prediction, multi-plane image construction, or more advanced techniques such as neural radiance fields. Recently, a pre-trained diffusion model that is specifically designed for 2D image synthesis has demonstrated its capability in producing photorealistic novel views, if sufficiently optimized with a 3D finetuning task. Despite greatly improved fidelity and generalizability, training such a powerful diffusion model requires a vast volume of training data and model parameters, resulting in a notoriously long time and high computational costs. To tackle this issue, we propose Efficient-3DiM, a highly efficient yet effective framework to learn a single-image novel-view synthesizer. Motivated by our in-depth analysis of the diffusion model inference process, we propose several pragmatic strategies to reduce training overhead to a manageable scale, including a crafted timestep sampling strategy, a superior 3D feature extractor, and an enhanced training scheme. 
When combined, our framework can reduce the total training time from 10 days to less than 1 day, significantly accelerating the training process on the same computational platform (an instance with 8 Nvidia A100 GPUs). Comprehensive experiments are conducted to demonstrate the efficiency and generalizability of our proposed method.", "keywords": "Novel View Synthesis;3D from Single Image;Efficient Training", "primary_area": "generative models", "supplementary_material": "", "author": "Yifan Jiang;Hao Tang;Jen-Hao Rick Chang;Liangchen Song;Zhangyang Wang;Liangliang Cao", "authorids": "~Yifan_Jiang2;~Hao_Tang16;~Jen-Hao_Rick_Chang1;~Liangchen_Song1;~Zhangyang_Wang1;~Liangliang_Cao1", "gender": "M;M;M;;M;M", "homepage": "https://yifanjiang19.github.io/;;https://rick-chang.github.io;;https://vita-group.github.io;http://llcao.net", "dblp": "81/7246-1;;169/4938;;119/4026;95/6915", "google_scholar": "PMeFEOIAAAAJ;xW-IxnwAAAAJ;F5Z9kN4AAAAJ;;pxFyKAIAAAAJ;S-hBSfIAAAAJ", "orcid": ";;;;;", "linkedin": ";;;;;liangliangcao/", "or_profile": "~Yifan_Jiang2;~Hao_Tang16;~Jen-Hao_Rick_Chang1;~Liangchen_Song1;~Zhangyang_Wang1;~Liangliang_Cao1", "aff": "University of Texas, Austin;Apple;Apple;;University of Texas at Austin;Apple", "aff_domain": "utexas.edu;apple.com;apple.com;;utexas.edu;apple.com", "position": "PhD student;Researcher;Researcher;;Associate Professor;Principal Researcher", "bibtex": "@inproceedings{\njiang2024efficientdim,\ntitle={Efficient-3Dim: Learning a Generalizable Single-image Novel-view Synthesizer in One Day},\nauthor={Yifan Jiang and Hao Tang and Jen-Hao Rick Chang and Liangchen Song and Zhangyang Wang and Liangliang Cao},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=3eFMnZ3N4J}\n}", "github": "", "project": "", "reviewers": "mro2;TYx2;FP6T;fp2s", "pdf_size": 15811605, "rating": "5;8;8;8", "confidence": "4;4;4;5", "soundness": "3;4;4;3", "contribution": "2;3;4;3", "presentation": "3;3;3;3", "wc_summary": "62;61;66;35", "wc_strengths": "69;121;107;153", "wc_weaknesses": "159;118;85;115", "wc_questions": "72;4;7;5", "wc_review": "362;304;265;308", "wc_reply_reviewers": "55;0;0;23", "wc_reply_authors": "581;403;339;442", "reply_reviewers": "1;0;0;1", "reply_authors": "2;1;1;2", "rating_avg": [ 7.25, 1.299038105676658 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 3.5, 0.5 ], "contribution_avg": [ 3.0, 0.7071067811865476 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 56.0, 12.267844146385297 ], "wc_strengths_avg": [ 112.5, 30.14548058996572 ], "wc_weaknesses_avg": [ 119.25, 26.328454189336675 ], "wc_questions_avg": [ 22.0, 28.88771365130858 ], "wc_review_avg": [ 309.75, 34.52806829233283 ], "wc_reply_reviewers_avg": [ 19.5, 22.544400635190993 ], "wc_reply_authors_avg": [ 441.25, 88.66897710022373 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.3333333333333333, "gs_citation": -1, "gs_cited_by_link": "", "gs_version_total": -1, "openreview": "https://openreview.net/forum?id=3eFMnZ3N4J", "pdf": "https://openreview.net/pdf?id=3eFMnZ3N4J", "email": "utexas.edu;apple.com;apple.com;;utexas.edu;apple.com", "author_num": 6, "aff_unique_index": "0;1;1;0;1", "aff_unique_norm": "University of Texas at Austin;Apple", "aff_unique_dep": ";Apple Inc.", "aff_unique_url": "https://www.utexas.edu;https://www.apple.com", "aff_unique_abbr": "UT Austin;Apple", "aff_campus_unique_index": 
"0;0", "aff_campus_unique": "Austin;", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "3edHHvu5GX", "title": "Adaptive Visual Scene Understanding: Incremental Scene Graph Generation", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Scene graph generation (SGG) involves analyzing images to extract meaningful information about objects and their relationships. Given the dynamic nature of the visual world, it becomes crucial for AI systems to detect new objects and establish their new relationships with existing objects. To address the lack of continual learning methodologies in SGG, we introduce the comprehensive Continual ScenE Graph Generation (CSEGG) dataset along with 3 learning scenarios and 8 evaluation metrics. Our research investigates the continual learning \nperformances of existing SGG methods on the retention of previous object entities and relationships as they learn new ones. Moreover, we also explore how continual object detection enhances generalization in classifying known relationships on unknown objects. We conduct extensive experiments benchmarking and analyzing the most recent transformer-based SGG methods in continual learning settings, and gain valuable insights into the CSEGG problem. We invite the research community to explore this emerging field of study.", "keywords": "Scene Graph Generation;Scene Understanding;Long-tailed Learning;Incremental Learning", "primary_area": "datasets and benchmarks", "supplementary_material": "/attachment/aa9d3fe778d16b45efbfb849e65985ec2a02b66c.zip", "author": "Naitik Khandelwal;Xiao Liu;Mengmi Zhang", "authorids": "~Naitik_Khandelwal1;~Xiao_Liu24;~Mengmi_Zhang1", "gender": "M;M;F", "homepage": ";;https://a0091624.wixsite.com/deepneurocognition-1", "dblp": ";;160/7116", "google_scholar": "7divVH4AAAAJ;;https://scholar.google.com.sg/citations?user=G2sVOhcAAAAJ", "orcid": ";;0000-0002-2694-7097", "linkedin": ";xiao-liu-34971b205/;", "or_profile": "~Naitik_Khandelwal1;~Xiao_Liu24;~Mengmi_Zhang1", "aff": "A*STAR;I2R, A*STAR;A*STAR", "aff_domain": "i2r.a-star.edu.sg;i2r.a-star.edu.sg;astar.edu.sg", "position": "Researcher;Researcher;Principal Researcher", "bibtex": "@misc{\nkhandelwal2024adaptive,\ntitle={Adaptive Visual Scene Understanding: Incremental Scene Graph Generation},\nauthor={Naitik Khandelwal and Xiao Liu and Mengmi Zhang},\nyear={2024},\nurl={https://openreview.net/forum?id=3edHHvu5GX}\n}", "github": "", "project": "", "reviewers": "FdjE;TSA3;SDSd;pXA5;LwTF", "site": "https://openreview.net/forum?id=3edHHvu5GX", "pdf_size": 38916967, "rating": "3;5;6;6;6", "confidence": "4;3;4;4;4", "soundness": "2;2;3;3;3", "contribution": "2;2;3;3;2", "presentation": "3;1;2;2;2", "wc_summary": "25;76;50;44;55", "wc_strengths": "18;45;71;39;91", "wc_weaknesses": "206;118;34;66;194", "wc_questions": "59;6;114;2;105", "wc_review": "308;245;269;151;445", "wc_reply_reviewers": "0;0;0;0;0", "wc_reply_authors": "1614;230;1014;582;2984", "reply_reviewers": "0;0;0;0;0", "reply_authors": "3;1;2;1;5", "rating_avg": [ 5.2, 1.16619037896906 ], "confidence_avg": [ 3.8, 0.39999999999999997 ], "soundness_avg": [ 2.6, 0.4898979485566356 ], "contribution_avg": [ 2.4, 0.4898979485566356 ], "presentation_avg": [ 2.0, 0.6324555320336759 ], "wc_summary_avg": [ 50.0, 16.504544828622205 ], "wc_strengths_avg": [ 52.8, 25.506077707087776 ], "wc_weaknesses_avg": [ 123.6, 68.0047057195309 ], "wc_questions_avg": [ 57.2, 47.29228266852849 ], "wc_review_avg": [ 283.6, 95.84487466734984 ], "wc_reply_reviewers_avg": 
[ 0, 0 ], "wc_reply_authors_avg": [ 1284.8, 967.0074249973471 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 2.4, 1.4966629547095764 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.08574929257125442, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:UcBCy0UyJ44J:scholar.google.com/&scioq=Adaptive+Visual+Scene+Understanding:+Incremental+Scene+Graph+Generation&hl=en&as_sdt=0,38", "gs_version_total": 5, "aff_unique_index": "0;1;0", "aff_unique_norm": "Agency for Science, Technology and Research;A*STAR", "aff_unique_dep": ";Institute for Infocomm Research", "aff_unique_url": "https://www.a-star.edu.sg;https://www.a-star.edu.sg", "aff_unique_abbr": "A*STAR;A*STAR", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "Singapore" }, { "title": "LEGO-Prover: Neural Theorem Proving with Growing Libraries", "status": "Oral", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19499", "id": "3f5PALef5B", "author_site": "Haiming Wang, Huajian Xin, Chuanyang Zheng, Zhengying Liu, Qingxing Cao, Yinya Huang, Jing Xiong, Han Shi, Enze Xie, Jian Yin, Zhenguo Li, Xiaodan Liang", "tldr": "", "abstract": "Despite the success of large language models (LLMs), the task of theorem proving still remains one of the hardest reasoning tasks that is far from being fully solved. Prior methods using language models have demonstrated promising results, but they still struggle to prove even middle school level theorems. One common limitation of these methods is that they assume a fixed theorem library during the whole theorem proving process. However, as we all know, creating new useful theorems or even new theories is not only helpful but crucial and necessary for advancing mathematics and proving harder and deeper results. In this work, we present LEGO-Prover, which employs a growing skill library containing verified lemmas as skills to augment the capability of LLMs used in theorem proving. By constructing the proof modularly, LEGO-Prover enables LLMs to utilize existing skills retrieved from the library and to create new skills during the proving process. These skills are further evolved (by prompting an LLM) to enrich the library on another scale. Modular and reusable skills are constantly added to the library to enable tackling increasingly intricate mathematical problems. Moreover, the learned library further bridges the gap between human proofs and formal proofs by making it easier to impute missing steps. LEGO-Prover advances the state-of-the-art pass rate on miniF2F-valid (48.0\\% to 57.0\\%) and miniF2F-test (45.5\\% to 50.0\\%). During the proving process, LEGO-Prover also generates over 20,000 skills (theorems/lemmas) and adds them to the growing library. 
Our ablation study indicates that these newly added skills are indeed helpful for proving theorems, resulting in a 4.9\\% improvement in success rate", "keywords": "Theorem proving;Large language model;Autoformalization", "primary_area": "neurosymbolic & hybrid AI systems (physics-informed, logic & formal reasoning, etc.)", "supplementary_material": "", "author": "Haiming Wang;Huajian Xin;Chuanyang Zheng;Zhengying Liu;Qingxing Cao;Yinya Huang;Jing Xiong;Han Shi;Enze Xie;Jian Yin;Zhenguo Li;Xiaodan Liang", "authorids": "~Haiming_Wang1;~Huajian_Xin1;~Chuanyang_Zheng3;~Zhengying_Liu2;~Qingxing_Cao1;~Yinya_Huang1;~Jing_Xiong4;~Han_Shi1;~Enze_Xie1;~Jian_Yin3;~Zhenguo_Li1;~Xiaodan_Liang2", "gender": "M;M;M;M;M;;M;M;M;M;F;M", "homepage": ";https://xinhuajian.wordpress.com/;https://chuanyang-zheng.github.io/;;;https://eleanor-h.github.io/;https://han-shi.github.io/;https://xieenze.github.io/;http://sai.sysu.edu.cn/teacher/teacher01/1385356.htm;http://www.ee.columbia.edu/~zgli/;https://www.sysu-hcp.net/;https://menik1126.github.io/", "dblp": "97/604;356/3551;;241/1782;149/7615;282/1562;;218/5441;95/578-1;23/6479;;", "google_scholar": "zDPqP6AAAAAJ;E5M9x8wAAAAJ;LWwh7K4AAAAJ;http:// DFme0joAAAAJ;flOBrd8AAAAJ;dWStaRIAAAAJ;https://scholar.google.com.hk/citations?user=Johp_14AAAAJ;42MVVPgAAAAJ;;XboZC1AAAAAJ;voxznZAAAAAJ;https://scholar.google.com.hk/citations?user=dFX1hXkAAAAJ", "orcid": ";;;;;0000-0002-0686-0832;;;;;;0000-0003-2986-6978", "linkedin": ";;;;;;;;;;;", "or_profile": "~Haiming_Wang1;~Huajian_Xin1;~Chuanyang_Zheng3;~Zhengying_Liu2;~Qingxing_Cao1;~Yinya_Huang1;~Han_Shi1;~Enze_Xie1;~Jian_Yin3;~Zhenguo_Li1;~Xiaodan_Liang2;~jing_xiong3", "aff": "SUN YAT-SEN UNIVERSITY;University of Edinburgh, University of Edinburgh;The Chinese University of Hong Kong;Huawei Technologies Ltd.;SUN YAT-SEN UNIVERSITY, Tsinghua University;City University of Hong Kong;Huawei Technologies Ltd.;Huawei Noah's Ark Lab;SUN YAT-SEN UNIVERSITY;Huawei Noah's Ark Lab;SUN YAT-SEN UNIVERSITY;Sun Yat-Sen University", "aff_domain": "sysu.edu.cn;ed.ac.uk;cse.cuhk.edu.hk;huawei.com;sysu.edu.cn;cityu.edu.hk;huawei.com;huawei.com;sysu.edu.cn;huawei.com;sysu.edu.cn;sysu.edu.cn", "position": "PhD student;PhD student;PhD student;Researcher;Postdoc;Postdoc;Principal Researcher;Researcher;Full Professor;Principal Researcher;Associate Professor;MS student", "bibtex": "@inproceedings{\nwang2024legoprover,\ntitle={{LEGO}-Prover: Neural Theorem Proving with Growing Libraries},\nauthor={Haiming Wang and Huajian Xin and Chuanyang Zheng and Zhengying Liu and Qingxing Cao and Yinya Huang and Jing Xiong and Han Shi and Enze Xie and Jian Yin and Zhenguo Li and Xiaodan Liang},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=3f5PALef5B}\n}", "github": "", "project": "", "reviewers": "SGTy;Nn2P;UPjC;oKSy", "pdf_size": 2951810, "rating": "6;8;8;8", "confidence": "4;3;4;3", "soundness": "3;3;3;3", "contribution": "3;4;4;3", "presentation": "3;2;3;3", "wc_summary": "92;97;73;519", "wc_strengths": "68;92;65;222", "wc_weaknesses": "106;236;31;1048", "wc_questions": "40;123;164;461", "wc_review": "306;548;333;2250", "wc_reply_reviewers": "21;106;24;582", "wc_reply_authors": "1532;1145;562;3177", "reply_reviewers": "1;2;1;1", "reply_authors": "5;5;2;7", "rating_avg": [ 7.5, 0.8660254037844386 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 3.5, 0.5 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 195.25, 
187.13147116399207 ], "wc_strengths_avg": [ 111.75, 64.50726703248247 ], "wc_weaknesses_avg": [ 355.25, 406.62843911856436 ], "wc_questions_avg": [ 197.0, 158.83167190456695 ], "wc_review_avg": [ 859.25, 808.4068823927713 ], "wc_reply_reviewers_avg": [ 183.25, 232.73093369812273 ], "wc_reply_authors_avg": [ 1604.0, 971.5912206272759 ], "reply_reviewers_avg": [ 1.25, 0.4330127018922193 ], "reply_authors_avg": [ 4.75, 1.7853571071357126 ], "replies_avg": [ 33, 0 ], "authors#_avg": [ 12, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 61, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=18067121762305972500&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 8, "openreview": "https://openreview.net/forum?id=3f5PALef5B", "pdf": "https://openreview.net/pdf?id=3f5PALef5B", "email": "sysu.edu.cn;ed.ac.uk;cse.cuhk.edu.hk;huawei.com;sysu.edu.cn;cityu.edu.hk;huawei.com;huawei.com;sysu.edu.cn;huawei.com;sysu.edu.cn;sysu.edu.cn", "author_num": 12, "aff_unique_index": "0;1;2;3;0;4;3;3;0;3;0;0", "aff_unique_norm": "Sun Yat-sen University;University of Edinburgh;Chinese University of Hong Kong;Huawei;City University of Hong Kong", "aff_unique_dep": ";;;Huawei Technologies;", "aff_unique_url": "http://www.sysu.edu.cn;https://www.ed.ac.uk;https://www.cuhk.edu.hk;https://www.huawei.com;https://www.cityu.edu.hk", "aff_unique_abbr": "SYSU;Edinburgh;CUHK;Huawei;CityU", "aff_campus_unique_index": "1;1", "aff_campus_unique": ";Hong Kong SAR", "aff_country_unique_index": "0;1;0;0;0;0;0;0;0;0;0;0", "aff_country_unique": "China;United Kingdom" }, { "title": "Detecting Machine-Generated Texts by Multi-Population Aware Optimization for Maximum Mean Discrepancy", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19498", "id": "3fEKavFsnv", "author_site": "Shuhai Zhang, Yiliao Song, Jiahao Yang, Yuanqing Li, Bo Han, Mingkui Tan", "tldr": "", "abstract": "Large language models (LLMs) such as ChatGPT have exhibited remarkable performance in generating human-like texts. However, machine-generated texts (MGTs) may carry critical risks, such as plagiarism issues and hallucination information. Therefore, it is very urgent and important to detect MGTs in many situations. Unfortunately, it is challenging to distinguish MGTs and human-written texts because the distributional discrepancy between them is often very subtle due to the remarkable performance of LLMS. In this paper, we seek to exploit \\textit{maximum mean discrepancy} (MMD) to address this issue in the sense that MMD can well identify distributional discrepancies. However, directly training a detector with MMD using diverse MGTs will incur a significantly increased variance of MMD since MGTs may contain \\textit{multiple text populations} due to various LLMs. This will severely impair MMD's ability to measure the difference between two samples. To tackle this, we propose a novel \\textit{multi-population} aware optimization method for MMD called MMD-MP, which can \\textit{avoid variance increases} and thus improve the stability to measure the distributional discrepancy. Relying on MMD-MP, we develop two methods for paragraph-based and sentence-based detection, respectively. 
Extensive experiments on various LLMs, \\eg, GPT2 and ChatGPT, show superior detection performance of our MMD-MP.", "keywords": "Large language models;Machine-generated text detection;Maximum mean discrepancy", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/502b3f4d4ad703826e0fac8873b805065226dfdb.pdf", "author": "Shuhai Zhang;Yiliao Song;Jiahao Yang;Yuanqing Li;Bo Han;Mingkui Tan", "authorids": "~Shuhai_Zhang1;~Yiliao_Song2;~Jiahao_Yang3;~Yuanqing_Li2;~Bo_Han1;~Mingkui_Tan2", "gender": "M;F;M;M;M;M", "homepage": "https://github.com/ZSHsh98;https://songyiliao.github.io/;https://github.com/TRISKEL10N;http://www2.scut.edu.cn/autonlaben/2015/0825/c5794a92900/page.htm;https://bhanml.github.io/;https://tanmingkui.github.io/", "dblp": "67/5655;186/7620;;51/2525.html;241/0472-3;49/2007", "google_scholar": "oNhLYoEAAAAJ;lKzKBHUAAAAJ;;https://scholar.google.com.sg/citations?user=wN3v1coAAAAJ;nTNjqHwAAAAJ;https://scholar.google.com.sg/citations?user=EVsoTGkAAAAJ", "orcid": "0000-0001-6877-3825;0000-0002-6633-2695;;;;0000-0001-8856-756X", "linkedin": ";;;;;", "or_profile": "~Shuhai_Zhang1;~Yiliao_Song2;~Jiahao_Yang3;~Yuanqing_Li2;~bo_han2;~Mingkui_Tan1", "aff": "South China University of Technology;Royal Melbourne Institute of Technology;South China University of Technology;South China University of Technology;MBZUAI;South China University of Technology", "aff_domain": "scut.edu.cn;rmit.edu.au;scut.edu.cn;scut.edu.cn;mbzuai.ac.ae;scut.edu.cn", "position": "PhD student;Postdoc;MS student;Full Professor;Researcher;Full Professor", "bibtex": "@inproceedings{\nzhang2024detecting,\ntitle={Detecting Machine-Generated Texts by Multi-Population Aware Optimization for Maximum Mean Discrepancy},\nauthor={Shuhai Zhang and Yiliao Song and Jiahao Yang and Yuanqing Li and Bo Han and Mingkui Tan},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=3fEKavFsnv}\n}", "github": "", "project": "", "reviewers": "4WLs;DBzA;bnWc;1AtS", "pdf_size": 1680464, "rating": "6;6;6;8", "confidence": "4;3;3;3", "soundness": "3;3;2;4", "contribution": "3;4;2;3", "presentation": "4;3;3;3", "wc_summary": "259;101;182;69", "wc_strengths": "176;104;35;50", "wc_weaknesses": "228;42;258;154", "wc_questions": "132;70;282;127", "wc_review": "795;317;757;400", "wc_reply_reviewers": "428;0;249;0", "wc_reply_authors": "1536;1062;3370;1142", "reply_reviewers": "1;0;1;0", "reply_authors": "5;3;7;3", "rating_avg": [ 6.5, 0.8660254037844386 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 3.0, 0.7071067811865476 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 152.75, 73.88631470035571 ], "wc_strengths_avg": [ 91.25, 55.251131210139036 ], "wc_weaknesses_avg": [ 170.5, 83.28715387141044 ], "wc_questions_avg": [ 152.75, 78.49641711568752 ], "wc_review_avg": [ 567.25, 211.2301765846916 ], "wc_reply_reviewers_avg": [ 169.25, 180.69501238274398 ], "wc_reply_authors_avg": [ 1777.5, 936.7735852381834 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 4.5, 1.6583123951777 ], "replies_avg": [ 27, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.3333333333333333, "gs_citation": 7, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=13517469906614096814&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=3fEKavFsnv", "pdf": 
"https://openreview.net/pdf?id=3fEKavFsnv", "email": "scut.edu.cn;rmit.edu.au;scut.edu.cn;scut.edu.cn;mbzuai.ac.ae;scut.edu.cn", "author_num": 6, "aff_unique_index": "0;1;0;0;2;0", "aff_unique_norm": "South China University of Technology;Royal Melbourne Institute of Technology;Mohamed bin Zayed University of Artificial Intelligence", "aff_unique_dep": ";;", "aff_unique_url": "https://www.scut.edu.cn;https://www.rmit.edu.au;https://www.mbzuai.ac.ae", "aff_unique_abbr": "SCUT;RMIT;MBZUAI", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;0;0;2;0", "aff_country_unique": "China;Australia;United Arab Emirates" }, { "id": "3fRbP8g2LT", "title": "Efficient Redundancy-Free Graph Networks: Higher Expressiveness and Less Over-Squashing", "track": "main", "status": "Reject", "tldr": "", "abstract": "Message Passing Neural Networks (MPNNs) effectively learn graph structures. However, their message passing mechanism introduces redundancy, limiting expressiveness, and causing over-squashing. Prior research has addressed the problem of redundancy but often at the cost of increased complexity. Improving expressiveness and addressing over-squashing remain major concerns in MPNN research with significant room for improvement. This study explores the nature of message passing redundancy and presents efficient solutions through two surrogate structures: Directed Line Graph (DLG) and Directed Acyclic Line Graph (DALG). The surogate structures introduce two corresponding models, Directed Line Graph Network (DLGN) and Efficient Redundancy-Free Graph Network (ERFGN). DLGN, utilizing DLGs, achieves redundancy-free message passing for graphs with a minimum cycle size of \\(L\\) when composed of $L$ layers. ERFGN, on the other hand, leverages DALGs to achieve fully redundancy-free message passing and possesses the expressiveness to distinguish arbitrary graphs under certain conditions. Furthermore, we enhance the expressiveness of ERFGN by incorporating cycle modeling and global attention, thereby achieving higher-order expressiveness. The efficiency and efficacy of these models in improving expressiveness and mitigating over-squashing are analysed theoretically. 
Empirical results on realistic datasets validate the proposed methods.", "keywords": "graph neural network;redundancy-free message passing;expressiveness;over-squashing", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Rongqin Chen;Yan Li;Leong Hou U;Ye Li", "authorids": "~Rongqin_Chen1;~Yan_Li23;~Leong_Hou_U2;~Ye_Li4", "gender": "M;;M;", "homepage": ";;https://www.fst.um.edu.mo/personal/ryanlhu/;", "dblp": ";;38/4996;", "google_scholar": ";;https://scholar.google.com/citations?hl=en;", "orcid": "0000-0002-8498-0346;;0000-0002-5135-5165;", "linkedin": ";;;", "or_profile": "~Rongqin_Chen1;~Yan_Li23;~Leong_Hou_U2;~Ye_Li4", "aff": "University of Macau;;University of macau;", "aff_domain": "um.edu.mo;;um.edu.mo;", "position": "PhD student;;Associate Professor;", "bibtex": "@misc{\nchen2024efficient,\ntitle={Efficient Redundancy-Free Graph Networks: Higher Expressiveness and Less Over-Squashing},\nauthor={Rongqin Chen and Yan Li and Leong Hou U and Ye Li},\nyear={2024},\nurl={https://openreview.net/forum?id=3fRbP8g2LT}\n}", "github": "", "project": "", "reviewers": "Gehp;vob1;WgZE;Dnf7", "site": "https://openreview.net/forum?id=3fRbP8g2LT", "pdf_size": 662905, "rating": "3;5;6;6", "confidence": "4;3;3;3", "soundness": "2;3;3;3", "contribution": "2;2;3;3", "presentation": "2;1;3;3", "wc_summary": "39;47;53;49", "wc_strengths": "33;48;112;15", "wc_weaknesses": "619;175;187;38", "wc_questions": "15;134;102;116", "wc_review": "706;404;454;218", "wc_reply_reviewers": "0;651;90;0", "wc_reply_authors": "1362;592;968;454", "reply_reviewers": "0;1;1;0", "reply_authors": "2;2;3;1", "rating_avg": [ 5.0, 1.224744871391589 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.25, 0.82915619758885 ], "wc_summary_avg": [ 47.0, 5.0990195135927845 ], "wc_strengths_avg": [ 52.0, 36.55817282086182 ], "wc_weaknesses_avg": [ 254.75, 218.29381003592383 ], "wc_questions_avg": [ 91.75, 45.740436158829965 ], "wc_review_avg": [ 445.5, 174.2204063822605 ], "wc_reply_reviewers_avg": [ 185.25, 271.3994979730066 ], "wc_reply_authors_avg": [ 844.0, 353.3072317403084 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 2.0, 0.7071067811865476 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.9428090415820632, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:m_Qs0_errloJ:scholar.google.com/&scioq=Efficient+Redundancy-Free+Graph+Networks:+Higher+Expressiveness+and+Less+Over-Squashing&hl=en&as_sdt=0,23", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "University of Macau", "aff_unique_dep": "", "aff_unique_url": "https://www.um.edu.mo", "aff_unique_abbr": "UM", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Macau SAR", "aff_country_unique_index": "0;0", "aff_country_unique": "China" }, { "id": "3husFxdHI1", "title": "Duality of Information Flow: Insights in Graphical Models and Neural Networks", "track": "main", "status": "Reject", "tldr": "", "abstract": "This research highlights the convergence of probabilistic graphical models and neural networks, shedding light on their inherent similarities and interactions. By interpreting Bayesian neural networks within the framework of Markov random fields, we uncovered deep connections between message passing and neural network propagation. 
Our exploration unveiled a striking equivalence between gradients in neural networks and posterior-prior differences in graphical models. Empirical evaluations across diverse scenarios and datasets showcased the efficacy and generalizability of our approach. This work introduces a novel perspective on Bayesian Neural Networks and probabilistic graphical models, offering insights that could pave the way for enhanced models and a deeper understanding of their relationship.", "keywords": "Bayesian neural network;Probabilistic graphical models;Message-passing algorithm;Langevin dynamics;Fokker-Planck dynamics", "primary_area": "probabilistic methods (Bayesian methods, variational inference, sampling, UQ, etc.)", "supplementary_material": "/attachment/c0f190b5d64a1116f7ebb66ca95e10746c21d5c3.zip", "author": "Wen Dong", "authorids": "~Wen_Dong1", "gender": "M", "homepage": "https://www.cse.buffalo.edu/~wendong/", "dblp": "84/3520-1", "google_scholar": "https://scholar.google.com.tw/citations?user=UBrg28IAAAAJ", "orcid": "", "linkedin": "", "or_profile": "~Wen_Dong1", "aff": "State University of New York, Buffalo", "aff_domain": "buffalo.edu", "position": "Assistant Professor", "bibtex": "@misc{\ndong2024duality,\ntitle={Duality of Information Flow: Insights in Graphical Models and Neural Networks},\nauthor={Wen Dong},\nyear={2024},\nurl={https://openreview.net/forum?id=3husFxdHI1}\n}", "github": "", "project": "", "reviewers": "2p2Z;kosy;Ac7q", "site": "https://openreview.net/forum?id=3husFxdHI1", "pdf_size": 664656, "rating": "3;5;6", "confidence": "3;3;2", "soundness": "2;3;3", "contribution": "2;3;3", "presentation": "2;2;2", "wc_summary": "48;65;70", "wc_strengths": "34;63;49", "wc_weaknesses": "68;190;115", "wc_questions": "255;167;8", "wc_review": "405;485;242", "wc_reply_reviewers": "0;0;36", "wc_reply_authors": "644;632;525", "reply_reviewers": "0;0;1", "reply_authors": "1;1;1", "rating_avg": [ 4.666666666666667, 1.247219128924647 ], "confidence_avg": [ 2.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.0, 0.0 ], "wc_summary_avg": [ 61.0, 9.41629792788369 ], "wc_strengths_avg": [ 48.666666666666664, 11.841546445554407 ], "wc_weaknesses_avg": [ 124.33333333333333, 50.24163833139025 ], "wc_questions_avg": [ 143.33333333333334, 102.21654573610977 ], "wc_review_avg": [ 377.3333333333333, 101.114896144051 ], "wc_reply_reviewers_avg": [ 12.0, 16.97056274847714 ], "wc_reply_authors_avg": [ 600.3333333333334, 53.493509471295255 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 10, 0 ], "authors#_avg": [ 1, 0 ], "corr_rating_confidence": -0.7559289460184545, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:-2VlTl7RZ0IJ:scholar.google.com/&scioq=Duality+of+Information+Flow:+Insights+in+Graphical+Models+and+Neural+Networks&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0", "aff_unique_norm": "State University of New York at Buffalo", "aff_unique_dep": "", "aff_unique_url": "https://www.buffalo.edu", "aff_unique_abbr": "SUNY Buffalo", "aff_campus_unique_index": "0", "aff_campus_unique": "Buffalo", "aff_country_unique_index": "0", "aff_country_unique": "United States" }, { "id": "3i7iNGxw6r", "title": "Where Does In-context Machine Translation Happen in Large Language Models?", "track": "main", "status": "Reject", "tldr": "", "abstract": 
"Self-supervised large language models have demonstrated the ability to perform Machine Translation (MT) via in-context learning, but little is known about where the model performs MT with respect to prompt instructions and demonstration examples.\nIn this work, we attempt to characterize the region in layer-wise attention heads where GPT models transition from in-context learners to translation models. Through a series of layer-wise context-masking experiments on GPTNeo2.7B and Bloom3B, we demonstrate evidence of a \"task recognition\" point where the translation task is encoded into the input representations and attention to context is no longer necessary. Our layer-wise fine-tuning experiments indicate that the most effective layers for MT fine-tuning are the layers critical to task recognition. Next, we examine redundancy in layers following task recognition, observing that masking these later layers does not hurt performance significantly. Finally, we train discrete attention head gates with $L_0$ regularisation and find evidence that the most pruneable heads occur after task recognition.", "keywords": "In-context Machine Translation;Interpretability", "primary_area": "visualization or interpretation of learned representations", "supplementary_material": "", "author": "Suzanna Sia;David Mueller;Kevin Duh", "authorids": "~Suzanna_Sia1;~David_Mueller1;~Kevin_Duh1", "gender": ";M;M", "homepage": ";https://www.damueller.com;https://cs.jhu.edu/~kevinduh/", "dblp": ";224/2296;58/3217", "google_scholar": ";TMv0Lw8AAAAJ;M3BSiiQAAAAJ", "orcid": ";;", "linkedin": ";;", "or_profile": "~Suzanna_Sia1;~David_Mueller1;~Kevin_Duh1", "aff": ";Johns Hopkins University;Johns Hopkins University", "aff_domain": ";jhu.edu;jhu.edu", "position": ";PhD student;Assistant Research Professor", "bibtex": "@misc{\nsia2024where,\ntitle={Where Does In-context Machine Translation Happen in Large Language Models?},\nauthor={Suzanna Sia and David Mueller and Kevin Duh},\nyear={2024},\nurl={https://openreview.net/forum?id=3i7iNGxw6r}\n}", "github": "", "project": "", "reviewers": "DzYR;tYJG;JM59;HfyK", "site": "https://openreview.net/forum?id=3i7iNGxw6r", "pdf_size": 1746934, "rating": "3;5;6;6", "confidence": "3;4;4;4", "soundness": "2;3;4;2", "contribution": "2;2;3;2", "presentation": "2;2;4;3", "wc_summary": "82;106;79;149", "wc_strengths": "34;42;48;68", "wc_weaknesses": "540;486;20;103", "wc_questions": "84;125;217;22", "wc_review": "740;759;364;342", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "480;677;173;415", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 5.0, 1.224744871391589 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.82915619758885 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.82915619758885 ], "wc_summary_avg": [ 104.0, 28.008927148321835 ], "wc_strengths_avg": [ 48.0, 12.569805089976535 ], "wc_weaknesses_avg": [ 287.25, 228.4484351007903 ], "wc_questions_avg": [ 112.0, 70.84842976382751 ], "wc_review_avg": [ 551.25, 198.51621470298088 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 436.25, 180.01857543042607 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.9428090415820632, "gs_citation": 0, "gs_cited_by_link": 
"https://scholar.google.com/scholar?q=related:mRnNXcCmdAMJ:scholar.google.com/&scioq=Where+Does+In-context+Machine+Translation+Happen+in+Large+Language+Models%3F&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "Johns Hopkins University", "aff_unique_dep": "", "aff_unique_url": "https://www.jhu.edu", "aff_unique_abbr": "JHU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "id": "3ijmMNaSJk", "title": "Towards Understanding Masked Distillation", "track": "main", "status": "Reject", "tldr": "", "abstract": "In the realm of self-supervised learning, Masked Image Modeling (MIM) serves as a \n viable approach for mitigating the dependency on large-scale annotated data, \n while demonstrating efficacy across a broad spectrum of downstream tasks. \n A recent variant of MIM known as Masked Distillation (MD) has \n emerged, which utilizes semantic features \n instead of low-level features as the supervision. Although prior work \n has demonstrated its effectiveness in various downstream tasks, the underlying mechanisms \n for its performance improvements remain unclear. Our investigation reveals that \n Masked Distillation mitigates multiple forms of overfitting present in the\n original models, including but not limited to attention homogenization \n and the representation folding of high layers. Further, we uncover that \n Masked Distillation introduces beneficial inductive biases stemming \n from MIM, which are believed to \n contribute positively to model performance. We also \n analyze the nuances of the model architecture design and decision-making tendencies \n in Masked Distillation, revealing inconsistencies with previous research findings.", "keywords": "representation learning;computer vision", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/6f998d60595f439efd7867f3369e32f1d081f12b.zip", "author": "Tuo Chen;Jie Gui", "authorids": "~Tuo_Chen1;~Jie_Gui1", "gender": ";M", "homepage": ";https://guijiejie.github.io/index.html", "dblp": "125/7619;45/794", "google_scholar": "https://scholar.google.com/citations?hl=en;f8oE8NgAAAAJ", "orcid": ";0000-0002-9450-1759", "linkedin": ";", "or_profile": "~Tuo_Chen1;~Jie_Gui1", "aff": "Southeast University;Southeast University", "aff_domain": "seu.edu.cn;seu.edu.cn", "position": "PhD student;Full Professor", "bibtex": "@misc{\nchen2024towards,\ntitle={Towards Understanding Masked Distillation},\nauthor={Tuo Chen and Jie Gui},\nyear={2024},\nurl={https://openreview.net/forum?id=3ijmMNaSJk}\n}", "github": "", "project": "", "reviewers": "65e1;2wDN;hmEG;xu9z", "site": "https://openreview.net/forum?id=3ijmMNaSJk", "pdf_size": 1248944, "rating": "1;3;3;5", "confidence": "3;4;5;4", "soundness": "1;3;1;2", "contribution": "1;2;1;2", "presentation": "1;3;3;3", "wc_summary": "75;52;56;97", "wc_strengths": "23;44;9;39", "wc_weaknesses": "183;59;123;127", "wc_questions": "14;28;392;109", "wc_review": "295;183;580;372", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 3.0, 1.4142135623730951 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 1.75, 0.82915619758885 ], "contribution_avg": [ 1.5, 0.5 ], "presentation_avg": [ 2.5, 0.8660254037844386 ], "wc_summary_avg": [ 70.0, 17.84656829757475 ], "wc_strengths_avg": [ 28.75, 13.790848414800301 ], 
"wc_weaknesses_avg": [ 123.0, 43.9089968002003 ], "wc_questions_avg": [ 135.75, 152.32592523927107 ], "wc_review_avg": [ 357.5, 144.97672226947333 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 6, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.5, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:dPtV1gG3T9gJ:scholar.google.com/&scioq=Towards+Understanding+Masked+Distillation&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "Southeast University", "aff_unique_dep": "", "aff_unique_url": "https://www.seu.edu.cn/", "aff_unique_abbr": "SEU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "China" }, { "id": "3j5bsiwRv6", "title": "Sparse Refinement for Efficient High-Resolution Semantic Segmentation", "track": "main", "status": "Reject", "tldr": "", "abstract": "Semantic segmentation empowers numerous real-world applications, such as autonomous driving and augmented/mixed reality. These applications often operate on high-resolution images (e.g., 8 megapixels) to capture the fine details. However, this comes at the cost of considerable computational complexity, hindering the deployment in latency-sensitive scenarios. In this paper, we introduce SparseRefine, a novel approach that enhances dense low-resolution predictions with sparse high-resolution refinements. Based on coarse low-resolution outputs, SparseRefine first uses an entropy selector to identify a sparse set of pixels with the least confidence. It then employs a sparse feature extractor to efficiently generate the refinements for those pixels of interest. Finally, it leverages a gated ensembler to apply these sparse refinements to the initial coarse predictions. SparseRefine can be seamlessly integrated into any existing semantic segmentation model, regardless of CNN- or ViT-based. SparseRefine achieves significant speedup: 1.5 to 3.9 times when applied to HRNet-W48, SegFormer-B5, Mask2Former-T/L and SegNeXt-L on Cityscapes, with negligible to no loss of accuracy. We will release the code to reproduce our results. 
We hope that our \"dense+sparse\" paradigm could inspire future research on efficient high-resolution visual computing.", "keywords": "Efficient machine learning;Semantic segmentation;Sparsity;Efficient model design;Model compression and acceleration", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/13b5d296154331dfc9827e106ba8e5fc10072d2f.pdf", "author": "Zhijian Liu;Zhuoyang Zhang;Shang Yang;Haotian Tang;Chenfeng Xu;Kurt Keutzer;Song Han", "authorids": "~Zhijian_Liu1;~Zhuoyang_Zhang1;~Shang_Yang1;~Haotian_Tang1;~Chenfeng_Xu1;~Kurt_Keutzer1;~Song_Han5", "gender": "M;M;M;M;M;M;", "homepage": "https://zhijianliu.com;https://hanlab.mit.edu/team/zhuoyang-zhang;;http://kentang.net;;https://people.eecs.berkeley.edu/~keutzer/;", "dblp": ";;79/9960;245/0058;65/1881;k/KurtKeutzer.html;", "google_scholar": "mwzYYPgAAAAJ;Q1csT-8AAAAJ;https://scholar.google.com.hk/citations?user=p71ikL4AAAAJ;WxL13BAAAAAJ;RpqvaTUAAAAJ;ID9QePIAAAAJ;", "orcid": ";;;;0000-0002-4941-6985;0000-0003-3868-8501;", "linkedin": "zhijianliu/;zhuoyang-zhang/;;;;kurtkeutzer/;", "or_profile": "~Zhijian_Liu1;~Zhuoyang_Zhang1;~Shang_Yang1;~Haotian_Tang1;~Chenfeng_Xu1;~Kurt_Keutzer1;~Song_Han5", "aff": "Massachusetts Institute of Technology;IIIS, Tsinghua University;Massachusetts Institute of Technology;NVIDIA;University of California, Berkeley;University of California, Berkeley;", "aff_domain": "mit.edu;mails.tsinghua.edu.cn;mit.edu;nvidia.com;berkeley.edu;berkeley.edu;", "position": "PhD student;Undergrad student;PhD student;Intern;PhD student;Full Professor;", "bibtex": "@misc{\nliu2024sparse,\ntitle={Sparse Refinement for Efficient High-Resolution Semantic Segmentation},\nauthor={Zhijian Liu and Zhuoyang Zhang and Shang Yang and Haotian Tang and Chenfeng Xu and Kurt Keutzer and Song Han},\nyear={2024},\nurl={https://openreview.net/forum?id=3j5bsiwRv6}\n}", "github": "", "project": "", "reviewers": "Jr1p;7yKn;c8GE;pDrt", "site": "https://openreview.net/forum?id=3j5bsiwRv6", "pdf_size": 26083187, "rating": "5;5;6;6", "confidence": "5;4;4;4", "soundness": "3;3;3;4", "contribution": "3;2;3;3", "presentation": "4;3;3;4", "wc_summary": "65;55;93;68", "wc_strengths": "72;46;87;124", "wc_weaknesses": "120;97;52;58", "wc_questions": "64;45;114;31", "wc_review": "321;243;346;281", "wc_reply_reviewers": "101;0;30;133", "wc_reply_authors": "613;661;708;766", "reply_reviewers": "1;0;1;1", "reply_authors": "3;3;2;2", "rating_avg": [ 5.5, 0.5 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.5, 0.5 ], "wc_summary_avg": [ 70.25, 13.988834833537782 ], "wc_strengths_avg": [ 82.25, 28.216794644324857 ], "wc_weaknesses_avg": [ 81.75, 28.039035290109393 ], "wc_questions_avg": [ 63.5, 31.42053468672995 ], "wc_review_avg": [ 297.75, 39.20060586266493 ], "wc_reply_reviewers_avg": [ 66.0, 53.30572201931046 ], "wc_reply_authors_avg": [ 687.0, 56.64362276549762 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 2.5, 0.5 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=3823173143449573058&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 6, "aff_unique_index": "0;1;0;2;3;3", "aff_unique_norm": "Massachusetts Institute of Technology;Tsinghua University;NVIDIA;University of California, 
Berkeley", "aff_unique_dep": ";Institute for Interdisciplinary Information Sciences;NVIDIA Corporation;", "aff_unique_url": "https://web.mit.edu;https://www.tsinghua.edu.cn;https://www.nvidia.com;https://www.berkeley.edu", "aff_unique_abbr": "MIT;THU;NVIDIA;UC Berkeley", "aff_campus_unique_index": "1;1", "aff_campus_unique": ";Berkeley", "aff_country_unique_index": "0;1;0;0;0;0", "aff_country_unique": "United States;China" }, { "id": "3jXCF5dNpC", "title": "Re-Reading Improves Reasoning in Language Models", "track": "main", "status": "Reject", "tldr": "", "abstract": "Reasoning presents a significant and challenging issue for Large Language Models (LLMs). The predominant focus of research has revolved around developing diverse prompting strategies to guide and structure the reasoning processes of LLMs. However, these approaches based on decoder-only causal language models often operate the input question in a single forward pass, potentially missing the rich, back-and-forth interactions inherent in human reasoning. Scant attention has been paid to a critical dimension, i.e., the input question itself embedded within the prompts. In response, we introduce a seemingly straightforward yet remarkably effective prompting strategy\u2014Re2, which involves re-reading the question. Drawing inspiration from human learning and problem-solving, re-reading entails revisiting the question information embedded within input prompts. This approach aligns seamlessly with the cognitive principle of reinforcement, enabling LLMs to understand the input in a ''bidirectional'' manner, extract deeper insights, and ultimately enhance their reasoning capabilities across various tasks. Experiments conducted on a series of reasoning benchmarks serve to underscore the effectiveness {and generality} of our method. 
Moreover, our findings demonstrate that our approach seamlessly integrates with various language models, {thought-eliciting} prompting methods, and ensemble techniques, further underscoring its versatility and compatibility in the realm of LLMs.", "keywords": "Large Language Model;Reasoning", "primary_area": "generative models", "supplementary_material": "", "author": "Xiaohan Xu;Chongyang Tao;Tao Shen;Can Xu;Hongbo Xu;Guodong Long;Jian-Guang Lou", "authorids": "~Xiaohan_Xu1;~Chongyang_Tao1;~Tao_Shen1;~Can_Xu2;~Hongbo_Xu3;~Guodong_Long2;~Jian-Guang_Lou1", "gender": "M;M;M;M;M;M;M", "homepage": ";;;https://people.ucas.ac.cn/~xuhongbo;https://www.uts.edu.au/staff/guodong.long;https://www.microsoft.com/en-us/research/people/jlou/;https://tebmer.github.io", "dblp": ";95/4097-1;;https://dblp.org/search?q=Hongbo+Xu+Tingwen+Liu;34/10089;37/1917;268/5155", "google_scholar": "x_cOKuwAAAAJ;https://scholar.google.com.au/citations?user=SegyX9AAAAAJ;5aiE_NcAAAAJ;;https://scholar.google.com.au/citations?user=Pl8m7hMAAAAJ;alDxINIAAAAJ;iKf_N9oAAAAJ", "orcid": ";;0000-0002-1949-5715;0000-0002-0258-7840;0000-0003-3740-9515;;", "linkedin": ";;;;;;", "or_profile": "~Chongyang_Tao1;~Tao_Shen1;~Can_Xu2;~Hongbo_Xu3;~Guodong_Long2;~Jian-Guang_Lou1;~Shawn_Xu1", "aff": "Microsoft;University of Technology Sydney;Microsoft;Institute of Information Engineering;University of Technology Sydney;Microsoft Research Asia;University of Chinese Academy of Sciences", "aff_domain": "microsoft.com;uts.edu.au;microsoft.com;iie.ac.cn;uts.edu.au;microsoft.com;ucas.ac.cn", "position": "Researcher;Postdoc;Researcher;Full Professor;Associate Professor;Principal Researcher;MS student", "bibtex": "@misc{\nxu2024rereading,\ntitle={Re-Reading Improves Reasoning in Language Models},\nauthor={Xiaohan Xu and Chongyang Tao and Tao Shen and Can Xu and Hongbo Xu and Guodong Long and Jian-Guang Lou},\nyear={2024},\nurl={https://openreview.net/forum?id=3jXCF5dNpC}\n}", "github": "", "project": "", "reviewers": "hwHe;KNMq;ZszC", "site": "https://openreview.net/forum?id=3jXCF5dNpC", "pdf_size": 750659, "rating": "5;5;8", "confidence": "3;3;5", "soundness": "2;3;3", "contribution": "2;2;3", "presentation": "3;4;4", "wc_summary": "87;33;62", "wc_strengths": "65;32;59", "wc_weaknesses": "131;81;95", "wc_questions": "63;51;139", "wc_review": "346;197;355", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "1230;995;1405", "reply_reviewers": "0;0;0", "reply_authors": "2;2;2", "rating_avg": [ 6.0, 1.4142135623730951 ], "confidence_avg": [ 3.6666666666666665, 0.9428090415820634 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 3.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 60.666666666666664, 22.065558884580486 ], "wc_strengths_avg": [ 52.0, 14.352700094407323 ], "wc_weaknesses_avg": [ 102.33333333333333, 21.06075866524175 ], "wc_questions_avg": [ 84.33333333333333, 38.96437118987322 ], "wc_review_avg": [ 299.3333333333333, 72.45381670799377 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 1210.0, 167.97817318528817 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 2.0, 0.0 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": 1.0, "gs_citation": 34, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=1557878389521115921&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 0, "aff_unique_index": "0;1;0;2;1;0;3", "aff_unique_norm": "Microsoft;University of Technology Sydney;Institute 
of Information Engineering;University of Chinese Academy of Sciences", "aff_unique_dep": "Microsoft Corporation;;;", "aff_unique_url": "https://www.microsoft.com;https://www.uts.edu.au;;http://www.ucas.ac.cn", "aff_unique_abbr": "Microsoft;UTS;;UCAS", "aff_campus_unique_index": "1", "aff_campus_unique": ";Asia", "aff_country_unique_index": "0;1;0;1;3;3", "aff_country_unique": "United States;Australia;;China" }, { "id": "3k6raldhEd", "title": "A Best-of-Both-Worlds Algorithm for MDPs with Long-Term Constraints", "track": "main", "status": "Reject", "tldr": "", "abstract": "We study online learning in episodic constrained Markov decision processes (CMDPs), where the goal of the learner is to collect as much reward as possible over the episodes, while guaranteeing that some long-term constraints are satisfied during the learning process. Rewards and constraints can be selected either stochastically or adversarially, and the transition function is not known to the learner.\nWhile online learning in classical (unconstrained) MDPs has received considerable attention over the last years, the setting of CMDPs is still largely unexplored. This is surprising, since in real-world applications, such as, e.g., autonomous driving, automated bidding, and recommender systems, there are usually additional constraints and specifications that an agent has to obey during the learning process.\nIn this paper, we provide the first best-of-both-worlds algorithm for CMDPs with long-term constraints. Our algorithm is capable of handling settings in which rewards and constraints are selected either stochastically or adversarially, without requiring any knowledge of the underling process. Moreover, our algorithm matches state-of-the-art regret and constraint violation bounds for settings in which constraints are selected stochastically, while it is the first to provide guarantees in the case in which they are chosen adversarially.", "keywords": "constrained;mdp;cmdp;markov decision process;online learning", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/6515e92a28fc64fd0d7b648872e9108da27be243.zip", "author": "Francesco Emanuele Stradi;Jacopo Germano;Gianmarco Genalti;Matteo Castiglioni;Alberto Marchesi;Nicola Gatti", "authorids": "~Francesco_Emanuele_Stradi1;~Jacopo_Germano1;~Gianmarco_Genalti1;~Matteo_Castiglioni1;~Alberto_Marchesi1;~Nicola_Gatti1", "gender": "M;M;Not Specified;;M;M", "homepage": "https://francescoemanuelestradi.github.io;https://www.deib.polimi.it/eng/people/details/1132094;;https://castiglionimatteo.github.io;https://albymarke.github.io;https://www4.ceda.polimi.it/manifesti/manifesti/controller/ricerche/RicercaPerDocentiPublic.do?k_doc=75785&lang=EN&EVN_PRODOTTI=evento&__pj0=0&__pj1=d918ee8916afbd0005f5c0bc3c0ff350", "dblp": "345/9650;;;225/7720;204/1718;g/NicolaGatti", "google_scholar": "JYdi_FMAAAAJ;;b4UMI8kAAAAJ;https://scholar.google.it/citations?user=NPE3HAYAAAAJ;vXDtCzoAAAAJ;https://scholar.google.com.tw/citations?user=j-HrYREAAAAJ", "orcid": ";;;0000-0002-1070-6766;;0000-0001-7349-3932", "linkedin": "francesco-emanuele-stradi-bb35b0222/;;gianmarco-genalti-26328a1a4/;;;nicola-gatti-1284b21", "or_profile": "~Francesco_Emanuele_Stradi1;~Jacopo_Germano1;~Gianmarco_Genalti1;~Matteo_Castiglioni1;~Alberto_Marchesi1;~Nicola_Gatti1", "aff": "Polytechnic Institute of Milan;Polytechnic Institute of Milan;Polytechnic Institute of Milan;Politecnico di Milano;Politecnico di Milano;Polytechnic Institute of Milan", "aff_domain": 
"polimi.it;polimi.it;polimi.it;polimi.it;polimi.it;polimi.it", "position": "PhD student;PhD student;PhD student;Assistant Professor;Assistant Professor;Full Professor", "bibtex": "@misc{\nstradi2024a,\ntitle={A Best-of-Both-Worlds Algorithm for {MDP}s with Long-Term Constraints},\nauthor={Francesco Emanuele Stradi and Jacopo Germano and Gianmarco Genalti and Matteo Castiglioni and Alberto Marchesi and Nicola Gatti},\nyear={2024},\nurl={https://openreview.net/forum?id=3k6raldhEd}\n}", "github": "", "project": "", "reviewers": "KHRX;Txce;r196;bJQa", "site": "https://openreview.net/forum?id=3k6raldhEd", "pdf_size": 401706, "rating": "3;5;6;6", "confidence": "5;3;3;3", "soundness": "3;3;3;3", "contribution": "2;2;3;3", "presentation": "3;3;3;3", "wc_summary": "71;76;79;79", "wc_strengths": "52;53;60;55", "wc_weaknesses": "184;50;8;114", "wc_questions": "71;33;34;25", "wc_review": "378;212;181;273", "wc_reply_reviewers": "206;75;0;0", "wc_reply_authors": "2575;913;302;639", "reply_reviewers": "1;1;0;0", "reply_authors": "5;2;1;1", "rating_avg": [ 5.0, 1.224744871391589 ], "confidence_avg": [ 3.5, 0.8660254037844386 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 76.25, 3.2691742076555053 ], "wc_strengths_avg": [ 55.0, 3.082207001484488 ], "wc_weaknesses_avg": [ 89.0, 66.58077800686922 ], "wc_questions_avg": [ 40.75, 17.80975856096876 ], "wc_review_avg": [ 261.0, 75.22300180131074 ], "wc_reply_reviewers_avg": [ 70.25, 84.14385004265017 ], "wc_reply_authors_avg": [ 1107.25, 874.6011591005354 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 2.25, 1.6393596310755 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.9428090415820632, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:Kpb1njGELlkJ:scholar.google.com/&scioq=A+Best-of-Both-Worlds+Algorithm+for+MDPs+with+Long-Term+Constraints&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;0;1;1;0", "aff_unique_norm": "Polytechnic Institute of Milan;Politecnico di Milano", "aff_unique_dep": ";", "aff_unique_url": "https://www.polimi.it/;https://www.polimi.it", "aff_unique_abbr": "Politecnico di Milano;Polimi", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "Italy" }, { "id": "3klVRLhK7w", "title": "Budgeted Online Continual Learning by Adaptive Layer Freezing and Frequency-based Sampling", "track": "main", "status": "Reject", "tldr": "", "abstract": "Majority of online continual learning (CL) places restrictions on the size of replay memory and a single-epoch training to ensure a prompt update of the model. However, the single-epoch training may imply a different amount of computations per CL algorithm, and additional storage for storing logit or model in addition to replay memory is largely ignored as a storage budget. Here, we used floating point operations (FLOPs) and total memory size in Byte as a metric for computational and memory budgets, respectively, to compare CL algorithms with the same total budget. Interestingly, we found that the new and advanced algorithms often perform worse than simple baselines under the same budget, implying that their value is less beneficial in real-world deployment. 
To improve the accuracy of online continual learners in the same budget, we propose an adaptive layer freezing and frequency-based memory retrieval for episodic memory usage for a storage- and computationally-efficient online CL algorithm. The proposed adaptive layer freezing does not update the layers for less informative batches to reduce computational cost with a negligible loss of accuracy. The proposed memory retrieval balances the training usage count of samples in episodic memory with a negligible computational and memory cost. In extensive empirical validations using CIFAR-10/100, CLEAR-10, and ImageNet-1K datasets, we demonstrate that the proposed method outperforms the state-of-the-art in the same total budget.", "keywords": "continual learning;constraint;layer freezing;efficient learning", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "", "author": "Minhyuk Seo;Hyunseo Koh;Jonghyun Choi", "authorids": "~Minhyuk_Seo1;~Hyunseo_Koh1;~Jonghyun_Choi1", "gender": "M;M;M", "homepage": "https://dbd05088.github.io/;;https://ppolon.github.io/", "dblp": "350/4104;304/4369;21/11103", "google_scholar": "ayDPR-gAAAAJ;Mi4cMxgAAAAJ;uiGWnm4AAAAJ", "orcid": ";0000-0002-2576-1581;0000-0002-7934-8434", "linkedin": "minhyuk-seo-59ba11247/;%ED%98%84%EC%84%9C-%EA%B3%A0-66298a221/;jonghyun-choi-459bb615/", "or_profile": "~Minhyuk_Seo1;~Hyunseo_Koh1;~Jonghyun_Choi1", "aff": "Yonsei University;Gwangju Institute of Science and Technology;Yonsei University", "aff_domain": "yonsei.ac.kr;gist.ac.kr;yonsei.ac.kr", "position": "MS student;PhD student;Associate Professor", "bibtex": "@misc{\nseo2024budgeted,\ntitle={Budgeted Online Continual Learning by Adaptive Layer Freezing and Frequency-based Sampling},\nauthor={Minhyuk Seo and Hyunseo Koh and Jonghyun Choi},\nyear={2024},\nurl={https://openreview.net/forum?id=3klVRLhK7w}\n}", "github": "", "project": "", "reviewers": "7DQF;htG8;sCXL", "site": "https://openreview.net/forum?id=3klVRLhK7w", "pdf_size": 722369, "rating": "5;5;5", "confidence": "2;2;4", "soundness": "2;2;2", "contribution": "2;2;2", "presentation": "3;2;2", "wc_summary": "78;116;54", "wc_strengths": "39;30;34", "wc_weaknesses": "3;48;309", "wc_questions": "112;159;269", "wc_review": "232;353;666", "wc_reply_reviewers": "16;27;315", "wc_reply_authors": "663;839;2557", "reply_reviewers": "1;1;2", "reply_authors": "2;2;5", "rating_avg": [ 5.0, 0.0 ], "confidence_avg": [ 2.6666666666666665, 0.9428090415820634 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 82.66666666666667, 25.525586292102197 ], "wc_strengths_avg": [ 34.333333333333336, 3.6817870057290873 ], "wc_weaknesses_avg": [ 120.0, 134.89996293550269 ], "wc_questions_avg": [ 180.0, 65.79260343432738 ], "wc_review_avg": [ 417.0, 182.86789402917796 ], "wc_reply_reviewers_avg": [ 119.33333333333333, 138.4300866462522 ], "wc_reply_authors_avg": [ 1353.0, 854.3832083243833 ], "reply_reviewers_avg": [ 1.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 3.0, 1.4142135623730951 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=7960869026184940243&as_sdt=4005&sciodt=0,6&hl=en", "gs_version_total": 3, "aff_unique_index": "0;1;0", "aff_unique_norm": "Yonsei University;Gwangju Institute of Science and Technology", "aff_unique_dep": ";", "aff_unique_url": 
"https://www.yonsei.ac.kr;https://www.gist.ac.kr", "aff_unique_abbr": "Yonsei;GIST", "aff_campus_unique_index": "1", "aff_campus_unique": ";Gwangju", "aff_country_unique_index": "0;0;0", "aff_country_unique": "South Korea" }, { "id": "3mDe5o24BM", "title": "HFDream: Improving 3D Generation via Human-Assisted Multi-view Text-to-Image Models", "track": "main", "status": "Reject", "tldr": "", "abstract": "Large-scale text-to-image models have demonstrated the potential for performing text-to-3D synthesis. However, existing approaches, e.g., DreamFusion, suffer from unstable 3D optimization due to the limitations of current text-to-image models that they struggle to synthesize images from certain viewpoints even when specified in the text prompt. Obtaining a view-aligned image-text pair dataset is challenging due to the limited availability of such data, and the inherent subjectivity and ambiguity of view-alignment. In this paper, we propose to enhance text-to- 3D generation by learning from human feedback for generating desired views. We generate multi-view images with the text-to-image model and engage human labelers to select a valid viewpoint. Using the human-labeled dataset, we train a reward model designed to verify whether the generated image aligns with the viewpoint specified in the text prompt. Finally, we fine-tune the text-to-image model to maximize the reward score. We find that our text-to-image diffusion models fine-tuned with human feedback, coined HFDream, consistently generate diverse viewpoints without the need for multi-view datasets created from 3D assets. This leads to high-quality text-to-3D generations with consistent geometry, when combined with view-dependent prompting in DreamFusion.", "keywords": "Learning from Human Feedback;Text-to-3D generation;Diffusion Model", "primary_area": "generative models", "supplementary_material": "/attachment/f74c02c92af065395df80d08a5d14c862d8658aa.zip", "author": "June Suk Choi;Kyungmin Lee;DongJun Lee;Jinwoo Shin;Kimin Lee", "authorids": "~June_Suk_Choi1;~Kyungmin_Lee1;~DongJun_Lee2;~Jinwoo_Shin1;~Kimin_Lee1", "gender": "M;M;M;M;M", "homepage": "https://choi403.github.io/;https://kyungmnlee.github.io/;https://dgjun32.github.io/;https://sites.google.com/site/mijirim/;https://sites.google.com/view/kiminlee", "dblp": ";57/5118;;31/7062;183/6849", "google_scholar": ";6dpime0AAAAJ;;https://scholar.google.com.tw/citations?user=m3eDp7kAAAAJ;92M8xv4AAAAJ", "orcid": ";;;;", "linkedin": "william-june-suk-choi-b03158350/;;;;", "or_profile": "~June_Suk_Choi1;~Kyungmin_Lee1;~DongJun_Lee2;~Jinwoo_Shin1;~Kimin_Lee1", "aff": "Korea Advanced Institute of Science & Technology;Korea Advanced Institute of Science & Technology;Korea University;Korea Advanced Institute of Science & Technology;Korea Advanced Institute of Science & Technology", "aff_domain": "kaist.edu;kaist.ac.kr;korea.ac.kr;kaist.ac.kr;kaist.edu", "position": "MS student;PhD student;Undergrad student;Full Professor;Assistant Professor", "bibtex": "@misc{\nchoi2024hfdream,\ntitle={{HFD}ream: Improving 3D Generation via Human-Assisted Multi-view Text-to-Image Models},\nauthor={June Suk Choi and Kyungmin Lee and DongJun Lee and Jinwoo Shin and Kimin Lee},\nyear={2024},\nurl={https://openreview.net/forum?id=3mDe5o24BM}\n}", "github": "", "project": "", "reviewers": "L7ZF;PzSD;T5e1", "site": "https://openreview.net/forum?id=3mDe5o24BM", "pdf_size": 29630145, "rating": "5;5;6", "confidence": "5;5;4", "soundness": "2;3;3", "contribution": "2;2;2", "presentation": "2;3;3", "wc_summary": 
"28;52;99", "wc_strengths": "19;29;68", "wc_weaknesses": "126;205;160", "wc_questions": "16;3;38", "wc_review": "189;289;365", "wc_reply_reviewers": "0;0;18", "wc_reply_authors": "764;535;546", "reply_reviewers": "0;0;1", "reply_authors": "2;2;2", "rating_avg": [ 5.333333333333333, 0.4714045207910317 ], "confidence_avg": [ 4.666666666666667, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 59.666666666666664, 29.48822740612863 ], "wc_strengths_avg": [ 38.666666666666664, 21.139746660943903 ], "wc_weaknesses_avg": [ 163.66666666666666, 32.355662392986005 ], "wc_questions_avg": [ 19.0, 14.445299120013633 ], "wc_review_avg": [ 281.0, 72.07403600927776 ], "wc_reply_reviewers_avg": [ 6.0, 8.48528137423857 ], "wc_reply_authors_avg": [ 615.0, 105.4545715778442 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 2.0, 0.0 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.9999999999999998, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=18052567484890569273&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 0, "aff_unique_index": "0;0;1;0;0", "aff_unique_norm": "Korea Advanced Institute of Science and Technology;Korea University", "aff_unique_dep": ";", "aff_unique_url": "https://www.kaist.ac.kr;https://www.korea.ac.kr", "aff_unique_abbr": "KAIST;KU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "South Korea" }, { "id": "3mXJ9o2DNx", "title": "Connecting Domains and Contrasting Samples: A Ladder for Domain Generalization", "track": "main", "status": "Reject", "tldr": "", "abstract": "Distribution shifts between training and testing datasets, contrary to classical machine learning assumptions, frequently occur in practice and impede model generalization performance. Studies on domain generalization (DG) thereby arise, aiming to predict the label on unseen target domain data by only using data from source domains. In the meanwhile, the contrastive learning (CL) technique, which prevails in self-supervised pre-training, can align different augmentation of samples to obtain invariant representation. It is intuitive to consider the class-separated representations learned in CL are able to improve domain generalization, while the reality is quite the opposite: people observe directly applying CL deteriorates the performance. We analyze the phenomenon with the CL theory and discover the lack of domain connectivity in the DG setting causes the deficiency. Thus we propose domain-connecting contrastive learning (\\model) to enhance the conceptual connectivity across domains and obtain generalizable representations for DG. Specifically, more aggressive data augmentation and cross-domain positive samples are introduced into self-contrastive learning to improve domain connectivity. Furthermore, to better embed the unseen test domains, we propose model anchoring to exploit the domain connectivity in pre-trained representations and complement it with generative transformation loss. Extensive experiments on five standard DG benchmarks are provided. 
The results verify that \\model~outperforms state-of-the-art baselines even without domain supervision.", "keywords": "Distribution shift;contrastive learning;self-supervised learning", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/37b224801f82a0f80626b3cda68bf0cbd37ee59a.zip", "author": "Tianxin Wei;Yifan Chen;Xinrui He;Jingrui He", "authorids": "~Tianxin_Wei1;~Yifan_Chen3;~Xinrui_He1;~Jingrui_He1", "gender": ";;;F", "homepage": "https://weitianxin.github.io/;;https://github.com/Xinrui17;https://www.hejingrui.org", "dblp": "277/5800;;;34/2685", "google_scholar": "_LU2-kMAAAAJ;;;hXpZynkAAAAJ", "orcid": "0000-0003-4450-2005;;0009-0003-4475-8059;0000-0002-6429-6272", "linkedin": "tianxin-wei-7063a2180/;;;", "or_profile": "~Tianxin_Wei1;~Yifan_Chen3;~Xinrui_He1;~Jingrui_He1", "aff": "University of Illinois, Urbana-Champaign;;University of Illinois, Urbana-Champaign;University of Illinois, Urbana Champaign", "aff_domain": "uiuc.edu;;cs.illinois.edu;illinois.edu", "position": "PhD student;;PhD student;Full Professor", "bibtex": "@misc{\nwei2024connecting,\ntitle={Connecting Domains and Contrasting Samples: A Ladder for Domain Generalization},\nauthor={Tianxin Wei and Yifan Chen and Xinrui He and Jingrui He},\nyear={2024},\nurl={https://openreview.net/forum?id=3mXJ9o2DNx}\n}", "github": "", "project": "", "reviewers": "BueW;2QYf;fbsW;ttfL;NxUh", "site": "https://openreview.net/forum?id=3mXJ9o2DNx", "pdf_size": 11910679, "rating": "3;5;5;5;5", "confidence": "5;4;4;4;3", "soundness": "2;2;3;2;3", "contribution": "2;2;2;2;2", "presentation": "2;3;3;2;3", "wc_summary": "75;90;70;27;46", "wc_strengths": "9;98;28;22;29", "wc_weaknesses": "160;207;74;91;199", "wc_questions": "3;5;6;157;4", "wc_review": "247;400;178;297;278", "wc_reply_reviewers": "0;78;0;71;0", "wc_reply_authors": "784;640;366;628;602", "reply_reviewers": "0;1;0;1;0", "reply_authors": "2;2;2;2;2", "rating_avg": [ 4.6, 0.7999999999999999 ], "confidence_avg": [ 4.0, 0.6324555320336759 ], "soundness_avg": [ 2.4, 0.4898979485566356 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.6, 0.4898979485566356 ], "wc_summary_avg": [ 61.6, 22.348154286204487 ], "wc_strengths_avg": [ 37.2, 31.224349472807276 ], "wc_weaknesses_avg": [ 146.2, 54.653087744426664 ], "wc_questions_avg": [ 35.0, 61.00819617067857 ], "wc_review_avg": [ 280.0, 72.36850143536205 ], "wc_reply_reviewers_avg": [ 29.8, 36.56446362248461 ], "wc_reply_authors_avg": [ 604.0, 134.84806264830058 ], "reply_reviewers_avg": [ 0.4, 0.48989794855663565 ], "reply_authors_avg": [ 2.0, 0.0 ], "replies_avg": [ 22, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.790569415042095, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11969925089597990194&as_sdt=5,39&sciodt=0,39&hl=en", "gs_version_total": 0, "aff_unique_index": "0;0;1", "aff_unique_norm": "University of Illinois;University of Illinois Urbana-Champaign", "aff_unique_dep": ";", "aff_unique_url": "https://illinois.edu;https://illinois.edu", "aff_unique_abbr": "UIUC;UIUC", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Urbana-Champaign", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "3mY9aGiMn0", "title": "Sparser, Better, Deeper, Stronger: Improving Sparse Training with Exact Orthogonal Initialization", "track": "main", "status": "Reject", "tldr": "", "abstract": "Sparse training aims to train sparse models from scratch, achieving 
remarkable results in recent years. A key design choice in sparse training is the sparse initialization, which determines the trainable sub-network through a binary mask. Existing methods mainly revolve around selecting the mask based on predefined dense weight initialization. However, such an approach may not efficiently leverage the mask's potential impact on training parameters and optimization. An alternative direction, inspired by research into dynamical isometry, is to introduce orthogonality in the sparse subnetwork. This helps prevent the gradient signal from vanishing or exploding, ultimately enhancing the reliability of the backpropagation process. In this work, we propose Exact Orthogonal Initialization (EOI), a novel sparse orthogonal initialization scheme based on composing random Givens rotations. Contrary to other existing approaches, our method provides exact (not approximated) orthogonality and enables the creation of layers with arbitrary densities. Through experiments on contemporary network architectures, we present the effectiveness of EOI and demonstrate that it consistently outperforms other commonly used sparse initialization techniques. Furthermore, to showcase the full potential of our method, we show that it enables the training of highly sparse 1000-layer MLP and CNN networks without any residual connections or normalization techniques. Our research highlights the importance of weight initialization in sparse training, underscoring the vital part it plays alongside the sparse mask selection.", "keywords": "Sparse Training;Pruning;Orthogonal Initialization", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/778bfcdfe08282d091b659a3c5f279b938c44c68.zip", "author": "Aleksandra Nowak;\u0141ukasz Gniecki;Filip Szatkowski;Jacek Tabor", "authorids": "~Aleksandra_Nowak1;~\u0141ukasz_Gniecki1;~Filip_Szatkowski1;~Jacek_Tabor1", "gender": "F;M;M;M", "homepage": ";;;", "dblp": "34/10106;;323/8425;31/5172", "google_scholar": "2A-eZhQAAAAJ;;xjnAIOEAAAAJ;https://scholar.google.pl/citations?user=zSKYziUAAAAJ", "orcid": "0000-0002-2830-6613;;0000-0001-8592-2001;0000-0001-6652-7727", "linkedin": ";lukaszgniecki/;fszatkowski/;", "or_profile": "~Aleksandra_Nowak1;~\u0141ukasz_Gniecki1;~Filip_Szatkowski1;~Jacek_Tabor1", "aff": "Google;Jagiellonian University Cracow;Amazon;Jagiellonian University", "aff_domain": "google.com;uj.edu.pl;amazon.de;uj.edu.pl", "position": "Intern;MS student;Intern;Full Professor", "bibtex": "@misc{\nnowak2024sparser,\ntitle={Sparser, Better, Deeper, Stronger: Improving Sparse Training with Exact Orthogonal Initialization},\nauthor={Aleksandra Nowak and {\\L}ukasz Gniecki and Filip Szatkowski and Jacek Tabor},\nyear={2024},\nurl={https://openreview.net/forum?id=3mY9aGiMn0}\n}", "github": "", "project": "", "reviewers": "7ET6;s3UF;4iab", "site": "https://openreview.net/forum?id=3mY9aGiMn0", "pdf_size": 1003240, "rating": "5;5;6", "confidence": "5;3;4", "soundness": "3;2;4", "contribution": "3;2;2", "presentation": "3;3;3", "wc_summary": "41;151;203", "wc_strengths": "26;15;40", "wc_weaknesses": "223;157;37", "wc_questions": "342;39;70", "wc_review": "632;362;350", "wc_reply_reviewers": "0;33;84", "wc_reply_authors": "2244;1403;1027", "reply_reviewers": "0;1;2", "reply_authors": "3;3;3", "rating_avg": [ 5.333333333333333, 0.4714045207910317 ], "confidence_avg": [ 4.0, 0.816496580927726 ], "soundness_avg": [ 3.0, 0.816496580927726 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], 
"presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 131.66666666666666, 67.53435339802174 ], "wc_strengths_avg": [ 27.0, 10.23067283548187 ], "wc_weaknesses_avg": [ 139.0, 76.99350621968063 ], "wc_questions_avg": [ 150.33333333333334, 136.11841250257888 ], "wc_review_avg": [ 448.0, 130.19984639007836 ], "wc_reply_reviewers_avg": [ 39.0, 34.55430508634199 ], "wc_reply_authors_avg": [ 1558.0, 508.7835165044821 ], "reply_reviewers_avg": [ 1.0, 0.816496580927726 ], "reply_authors_avg": [ 3.0, 0.0 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=3081273972719296832&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 7, "aff_unique_index": "0;1;2;1", "aff_unique_norm": "Google;Jagiellonian University;Amazon", "aff_unique_dep": "Google;;Amazon.com, Inc.", "aff_unique_url": "https://www.google.com;https://www.uj.edu.pl;https://www.amazon.com", "aff_unique_abbr": "Google;UJ;Amazon", "aff_campus_unique_index": "0;1", "aff_campus_unique": "Mountain View;Cracow;", "aff_country_unique_index": "0;1;0;1", "aff_country_unique": "United States;Poland" }, { "id": "3mZEMBM0jN", "title": "Learning Symbolic Interactions for Interpretable State-Space Modeling", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "A general model to learn complex system dynamics will be helpful for us to understand how natural and computational networks of simple computation units solve complex problems. We formulate discrete event dynamics as a Bayesian neural network with skip connections: we use linearity to select hidden features to interact and combine the effects of these interactions, and we use nonlinearity (exponential and logarithm) to compound these interactions. To make learning scalable, we derive a Bayesian backpropagation algorithm that computes the expected loss gradient through propagating filtering and smoothing probabilities of hidden features. 
Experiments demonstrate that our algorithm can data-efficiently capture complex system dynamics in several fields with meaningful interactions.", "keywords": "Bayesian back-propagation;complex systems", "primary_area": "neurosymbolic & hybrid AI systems (physics-informed, logic & formal reasoning, etc.)", "supplementary_material": "", "author": "Wen Dong", "authorids": "~Wen_Dong1", "gender": "M", "homepage": "https://www.cse.buffalo.edu/~wendong/", "dblp": "84/3520-1", "google_scholar": "https://scholar.google.com.tw/citations?user=UBrg28IAAAAJ", "orcid": "", "linkedin": "", "or_profile": "~Wen_Dong1", "aff": "State University of New York, Buffalo", "aff_domain": "buffalo.edu", "position": "Assistant Professor", "bibtex": "@misc{\ndong2024learning,\ntitle={Learning Symbolic Interactions for Interpretable State-Space Modeling},\nauthor={Wen Dong},\nyear={2024},\nurl={https://openreview.net/forum?id=3mZEMBM0jN}\n}", "github": "", "project": "", "reviewers": "", "site": "https://openreview.net/forum?id=3mZEMBM0jN", "pdf_size": 0, "rating": "", "confidence": "", "soundness": "", "contribution": "", "presentation": "", "wc_summary": "", "wc_strengths": "", "wc_weaknesses": "", "wc_questions": "", "wc_review": "", "wc_reply_reviewers": "", "wc_reply_authors": "", "reply_reviewers": "", "reply_authors": "", "rating_avg": [ 0, 0 ], "confidence_avg": [ 0, 0 ], "soundness_avg": [ 0, 0 ], "contribution_avg": [ 0, 0 ], "presentation_avg": [ 0, 0 ], "wc_summary_avg": [ 0, 0 ], "wc_strengths_avg": [ 0, 0 ], "wc_weaknesses_avg": [ 0, 0 ], "wc_questions_avg": [ 0, 0 ], "wc_review_avg": [ 0, 0 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 0, 0 ], "authors#_avg": [ 1, 0 ], "corr_rating_confidence": 0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:Mn1TLIr6P9EJ:scholar.google.com/&scioq=Learning+Symbolic+Interactions+for+Interpretable+State-Space+Modeling&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0", "aff_unique_norm": "State University of New York at Buffalo", "aff_unique_dep": "", "aff_unique_url": "https://www.buffalo.edu", "aff_unique_abbr": "SUNY Buffalo", "aff_campus_unique_index": "0", "aff_campus_unique": "Buffalo", "aff_country_unique_index": "0", "aff_country_unique": "United States" }, { "id": "3mdCet7vVv", "title": "Maestro: Uncovering Low-Rank Structures via Trainable Decomposition", "track": "main", "status": "Reject", "tldr": "", "abstract": "Deep Neural Networks (DNNs) have been large drivers and enablers for AI breakthroughs in recent years. These models have been getting larger in their attempt to become more accurate and tackle new upcoming use-cases, including AR/VR and intelligent assistants. However, the training process of such large models is a costly and time-consuming process, which typically yields a single model to fit all targets. To mitigate this, various techniques have been proposed in the literature, including pruning, sparsification, or quantization of the model weights and updates. While able to achieve high compression rates, they often incur computational overheads or accuracy penalties. Alternatively, factorization methods have been leveraged to incorporate low-rank compression in the training process. Such techniques (e.g., SVD) also frequently rely on the computationally expensive decomposition of layers and are potentially sub-optimal for non-linear models, such as DNNs. 
In this work, we take a further step in designing efficient low-rank models and propose MAESTRO, a framework for trainable low-rank layers. Instead of regularly applying a priori decompositions such as SVD, the low-rank structure is built into the training process through a generalized variant of Ordered Dropout. This method imposes an importance ordering via sampling on the decomposed DNN structure. Our theoretical analysis demonstrates that our method recovers the SVD decomposition of linear mapping on uniformly distributed data and PCA for linear autoencoders. We further apply our technique on DNNs and empirically illustrate that MAESTRO enables the extraction of lower footprint models that preserve model performance while allowing for graceful accuracy-latency tradeoffs for the deployment to devices of different capabilities.", "keywords": "low-rank approximation;efficient model training;trainable decomposition", "primary_area": "optimization", "supplementary_material": "/attachment/3a54a9fff5e8356d044b0bdfd8a70585281ffe39.pdf", "author": "Samuel Horv\u00e1th;Stefanos Laskaridis;Shashank Rajput;Hongyi Wang", "authorids": "~Samuel_Horv\u00e1th1;~Stefanos_Laskaridis1;~Shashank_Rajput1;~Hongyi_Wang1", "gender": "M;;M;M", "homepage": "https://sites.google.com/view/samuelhorvath;https://stefanos.cc;https://pages.cs.wisc.edu/~srajput/;https://hwang595.github.io/", "dblp": "234/8604;241/6273;241/5361;15/832-1.html", "google_scholar": "k252J7kAAAAJ;https://scholar.google.co.uk/citations?user=TcVC--IAAAAJ;qEXxyDQAAAAJ;zYdZORsAAAAJ", "orcid": "0000-0003-0619-9260;;;", "linkedin": "samuel-horvath/;stevelaskaridis/;;hongyi-wang-b89651102/", "or_profile": "~Samuel_Horv\u00e1th1;~Stefanos_Laskaridis1;~Shashank_Rajput1;~Hongyi_Wang1", "aff": "MBZUAI;Brave Software;University of Wisconsin, Madison;Carnegie Mellon University", "aff_domain": "mbzuai.ac.ae;brave.com;wisc.edu;andrew.cmu.edu", "position": "Assistant Professor;Researcher;PhD student;Researcher", "bibtex": "@misc{\nhorv{\\'a}th2024maestro,\ntitle={Maestro: Uncovering Low-Rank Structures via Trainable Decomposition},\nauthor={Samuel Horv{\\'a}th and Stefanos Laskaridis and Shashank Rajput and Hongyi Wang},\nyear={2024},\nurl={https://openreview.net/forum?id=3mdCet7vVv}\n}", "github": "", "project": "", "reviewers": "LrqS;Mad7;ZdCx;CAHp", "site": "https://openreview.net/forum?id=3mdCet7vVv", "pdf_size": 2326242, "rating": "5;5;5;8", "confidence": "4;4;3;3", "soundness": "3;3;2;3", "contribution": "2;1;2;3", "presentation": "3;4;2;2", "wc_summary": "70;76;68;76", "wc_strengths": "22;58;53;93", "wc_weaknesses": "80;63;191;159", "wc_questions": "16;64;5;7", "wc_review": "188;261;317;335", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "340;889;488;160", "reply_reviewers": "0;0;0;0", "reply_authors": "1;2;1;1", "rating_avg": [ 5.75, 1.299038105676658 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 2.75, 0.82915619758885 ], "wc_summary_avg": [ 72.5, 3.570714214271425 ], "wc_strengths_avg": [ 56.5, 25.184320518926057 ], "wc_weaknesses_avg": [ 123.25, 53.312170280340304 ], "wc_questions_avg": [ 23.0, 24.031229681395832 ], "wc_review_avg": [ 275.25, 57.290378773403134 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 469.25, 268.7390695451631 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.5773502691896257, 
"gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=8374317016626564409&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 8, "aff_unique_index": "0;1;2;3", "aff_unique_norm": "Mohamed bin Zayed University of Artificial Intelligence;Brave Software;University of Wisconsin;Carnegie Mellon University", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.mbzuai.ac.ae;https://www.brave.com;https://www.wisc.edu;https://www.cmu.edu", "aff_unique_abbr": "MBZUAI;Brave;UW;CMU", "aff_campus_unique_index": "1", "aff_campus_unique": ";Madison", "aff_country_unique_index": "0;1;1;1", "aff_country_unique": "United Arab Emirates;United States" }, { "title": "Towards Principled Representation Learning from Videos for Reinforcement Learning", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19497", "id": "3mnWvUZIXt", "author_site": "Dipendra Kumar Misra, Akanksha Saran, Tengyang Xie, Alex Lamb, John Langford", "tldr": "", "abstract": "We study pre-training representations for decision-making using video data, which is abundantly available for tasks such as game agents and software testing. Even though significant empirical advances have been made on this problem, a theoretical understanding remains absent. We initiate the theoretical investigation into principled approaches for representation learning and focus on learning the latent state representations of the underlying MDP using video data. We study two types of settings: one where there is iid noise in the observation, and a more challenging setting where there is also the presence of exogenous noise, which is non-iid noise that is temporally correlated, such as the motion of people or cars in the background. We study three commonly used approaches: autoencoding, temporal contrastive learning, and forward modeling. We prove upper bounds for temporal contrastive learning and forward modeling in the presence of only iid noise. We show that these approaches can learn the latent state and use it to do efficient downstream RL with polynomial sample complexity. When exogenous noise is also present, we establish a lower bound result showing that the sample complexity of learning from video data can be exponentially worse than learning from action-labeled trajectory data. This partially explains why reinforcement learning with video pre-training is hard. 
We evaluate these representational learning methods in two visual domains, yielding results that are consistent with our theoretical findings.", "keywords": "Reinforcement Learning;Representation Learning", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Dipendra Misra;Akanksha Saran;Tengyang Xie;Alex Lamb;John Langford", "authorids": "~Dipendra_Misra1;~Akanksha_Saran1;~Tengyang_Xie1;~Alex_Lamb1;~John_Langford1", "gender": "M;F;;M;M", "homepage": "https://dipendramisra.com/;;https://tengyangxie.github.io/;http://hunch.net/~jl;", "dblp": "218/6569;173/6209;227/3335;77/4488;", "google_scholar": "rIoPIFsAAAAJ;zZhWSQ0AAAAJ;rlmROVsAAAAJ;LFiqVpwAAAAJ;https://scholar.google.ca/citations?user=BFzFy1YAAAAJ", "orcid": ";;;;", "linkedin": ";akanksha-saran-8b506620/;;;", "or_profile": "~Dipendra_Misra1;~Akanksha_Saran1;~Tengyang_Xie1;~John_Langford1;~Alex_Matthew_Lamb1", "aff": "Microsoft Research;Sony AI;Microsoft Research, New England & NYC;Microsoft;", "aff_domain": "microsoft.com;sony.com;microsoft.com;microsoft.com;", "position": "Researcher;Researcher;Postdoc;Researcher;", "bibtex": "@inproceedings{\nmisra2024towards,\ntitle={Towards Principled Representation Learning from Videos for Reinforcement Learning},\nauthor={Dipendra Misra and Akanksha Saran and Tengyang Xie and Alex Lamb and John Langford},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=3mnWvUZIXt}\n}", "github": "", "project": "", "reviewers": "TsKD;ZrZp;tXAJ;sJQE", "pdf_size": 10089431, "rating": "5;8;8;8", "confidence": "3;4;3;3", "soundness": "2;4;3;3", "contribution": "2;4;3;3", "presentation": "3;3;3;3", "wc_summary": "78;144;102;175", "wc_strengths": "19;113;41;54", "wc_weaknesses": "55;48;182;126", "wc_questions": "219;9;73;108", "wc_review": "371;314;398;463", "wc_reply_reviewers": "95;0;64;68", "wc_reply_authors": "1135;279;676;776", "reply_reviewers": "1;0;1;1", "reply_authors": "2;1;2;1", "rating_avg": [ 7.25, 1.299038105676658 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 3.0, 0.7071067811865476 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 124.75, 37.41239767777521 ], "wc_strengths_avg": [ 56.75, 34.802119188348286 ], "wc_weaknesses_avg": [ 102.75, 54.99715901753471 ], "wc_questions_avg": [ 102.25, 76.18193683544676 ], "wc_review_avg": [ 386.5, 53.57471418495856 ], "wc_reply_reviewers_avg": [ 56.75, 34.86671048435743 ], "wc_reply_authors_avg": [ 716.5, 304.8479129008431 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.3333333333333333, "gs_citation": 4, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6575773369814907620&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=3mnWvUZIXt", "pdf": "https://openreview.net/pdf?id=3mnWvUZIXt", "email": "microsoft.com;sony.com;microsoft.com;microsoft.com;", "author_num": 5, "aff_unique_index": "0;1;0;0", "aff_unique_norm": "Microsoft;Sony", "aff_unique_dep": "Microsoft Research;Sony AI", "aff_unique_url": "https://www.microsoft.com/en-us/research;https://www.sony.com", "aff_unique_abbr": "MSR;Sony AI", "aff_campus_unique_index": "1", "aff_campus_unique": ";New England", "aff_country_unique_index": "0;1;0;0", "aff_country_unique": "United States;Japan" }, { "id": "3nPFco1EKt", "title": "Evolving Neural 
Network's Weights at Imagenet Scale", "track": "main", "status": "Reject", "tldr": "", "abstract": "Building upon evolutionary theory, this work proposes a deep neural network optimization framework based on evolutionary algorithms to enhance existing pre-trained models, usually trained by backpropagation (BP). Specifically, we consider a pre-trained model to generate an initial population of deep neural networks (DNNs) using BP with distinct hyper-parameters, and subsequently simulate the evolutionary process of DNNs. Moreover, we enhance the evolutionary process, by developing an adaptive differential evolution (DE) algorithm, SA-SHADE-tri-ensin, which integrates the strengths of two DE algorithms, SADE and SHADE, with trigonometric mutation and sinusoidal change of mutation rate. Compared to existing work (e.g., ensembling, weight averaging and evolution inspired techniques), the proposed method better enhanced existing pre-trained deep neural network models (e.g., ResNet variants) on large-scale ImageNet. Our analysis reveals that DE with an adaptive trigonometric mutation strategy yields improved offspring with higher success rates and the importance of diversity in the parent population. Hence, the underlying mechanism is worth further investigation and has implications for developing advanced neuro-evolutionary optimizers.", "keywords": "optimization;evolution", "primary_area": "optimization", "supplementary_material": "/attachment/d2dbb1f657d104f10afbdc5da3ec2db9241e510f.zip", "author": "Guodong DU;Senqiao Yang;Runhua Jiang;Shuyang Yu;Haoyang Li;Wei Chen;Keren Li;Ho-Kin Tang;Sim Kuan Goh", "authorids": "~Guodong_DU2;~Senqiao_Yang1;~Runhua_Jiang2;~Shuyang_Yu2;~Haoyang_Li7;~Wei_Chen49;~Keren_Li1;~Ho-Kin_Tang1;~Sim_Kuan_Goh2", "gender": "M;;M;F;M;;M;M;M", "homepage": "https://duguodong7.github.io;;;;https://github.com/LiHaoyang0517;;https://cpoe.szu.edu.cn/info/1060/1756.htm;http://faculty.hitsz.edu.cn/denghaojian;https://simkuangoh.github.io/", "dblp": "213/8915-4;;;;;;;;152/7784", "google_scholar": "https://scholar.google.com/citations?hl=zh-CN;;;sfFLGycAAAAJ;;;https://scholar.google.ca/citations?user=n_03hjkAAAAJ;https://scholar.google.com.hk/citations?user=a4yjxI4AAAAJ;", "orcid": ";;;;;;;0000-0002-8378-815X;", "linkedin": "\u56fd\u4e1c-\u675c-30b496169/;;runhua-jiang-295004261/?originalSubdomain=my;shuyang-yu;;;;;", "or_profile": "~Guodong_DU2;~Senqiao_Yang1;~Runhua_Jiang2;~Shuyang_Yu2;~Haoyang_Li7;~Wei_Chen49;~Keren_Li1;~Ho-Kin_Tang1;~Sim_Kuan_Goh2", "aff": "Harbin Institute of Technology;;Xiamen University;Xiamen University Malaysia;Xiamen University;;Shenzhen University;Harbin Institute of Technology;Xiamen University Malaysia", "aff_domain": "hit.edu.cn;;xmu.edu.cn;xmu.edu.my;xmu.edu.cn;;szu.edu.cn;hit.edu.cn;xmu.edu.cn", "position": "Researcher;;Undergrad student;Undergrad student;Undergrad student;;Assistant Professor;Associate Professor;Assistant Professor", "bibtex": "@misc{\ndu2024evolving,\ntitle={Evolving Neural Network's Weights at Imagenet Scale},\nauthor={Guodong DU and Senqiao Yang and Runhua Jiang and Shuyang Yu and Haoyang Li and Wei Chen and Keren Li and Ho-Kin Tang and Sim Kuan Goh},\nyear={2024},\nurl={https://openreview.net/forum?id=3nPFco1EKt}\n}", "github": "", "project": "", "reviewers": "SWqn;4ELS;BX5K", "site": "https://openreview.net/forum?id=3nPFco1EKt", "pdf_size": 13585968, "rating": "3;3;3", "confidence": "4;4;5", "soundness": "3;2;2", "contribution": "1;1;1", "presentation": "2;2;1", "wc_summary": "100;47;67", "wc_strengths": "112;8;92", 
"wc_weaknesses": "165;26;687", "wc_questions": "364;136;67", "wc_review": "741;217;913", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 3.0, 0.0 ], "confidence_avg": [ 4.333333333333333, 0.4714045207910317 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 1.0, 0.0 ], "presentation_avg": [ 1.6666666666666667, 0.4714045207910317 ], "wc_summary_avg": [ 71.33333333333333, 21.85304453744502 ], "wc_strengths_avg": [ 70.66666666666667, 45.057987329908805 ], "wc_weaknesses_avg": [ 292.6666666666667, 284.55149895151766 ], "wc_questions_avg": [ 189.0, 126.90941651429968 ], "wc_review_avg": [ 623.6666666666666, 296.00600594507466 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 9, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:gtAHD9oKsAQJ:scholar.google.com/&scioq=Evolving+Neural+Network%27s+Weights+at+Imagenet+Scale&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;1;1;1;2;0;1", "aff_unique_norm": "Harbin Institute of Technology;Xiamen University;Shenzhen University", "aff_unique_dep": ";;", "aff_unique_url": "http://www.hit.edu.cn/;https://www.xmu.edu.cn;https://www.szu.edu.cn", "aff_unique_abbr": "HIT;XMU;SZU", "aff_campus_unique_index": "0;2;0;2", "aff_campus_unique": "Harbin;;Malaysia", "aff_country_unique_index": "0;0;1;0;0;0;1", "aff_country_unique": "China;Malaysia" }, { "id": "3nyovHUr5A", "title": "Learning with Instance-Dependent Noisy Labels by Hard Sample Selection with Anchor Hallucination", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Learning from noisily-labeled data is common in real-world visual learning tasks. Mainstream Noisy-Label Learning (NLL) methods mainly focus on sample-selection approaches, which typically divide the training dataset into clean and noisy subsets according to the loss distribution of samples. However, they overlook the fact that clean samples with complex visual patterns may also yield large losses, especially for datasets with Instance-Dependent Noise (IDN), in which the probability of an image being mislabeled depends on its visual appearance. This paper extends this idea and distinguishes complex samples from noisy ones. Specifically, we first select training samples with small initial losses to form an *easy* subset, where these easy samples are assumed to contain simple patterns with correct labels. The remaining samples either have complex patterns or incorrect labels, forming a *hard* subset. Subsequently, we utilize the easy subset to hallucinate multiple anchors, which are used to select hard samples to form a *clean hard* subset. We further exploit samples from these subsets following a semi-supervised training scheme to better characterize the decision boundary. 
Extensive experiments on synthetic and real-world instance-dependent noisy datasets show that our method outperforms the State-of-The-Art NLL methods.", "keywords": "Noisy label learning;semi-supervised learning", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Po-Hsuan Huang;Chia-Ching Lin;Chih-Fan Hsu;Ming-Ching Chang;Wei-Chao Chen", "authorids": "~Po-Hsuan_Huang2;~Chia-Ching_Lin1;~Chih-Fan_Hsu1;~Ming-Ching_Chang1;~Wei-Chao_Chen1", "gender": ";M;M;M;M", "homepage": ";;https://sites.google.com/site/chihfanhsuwebsite/;https://www.albany.edu/faculty/mchang2/;", "dblp": ";36/9449;120/8997;21/4361;37/1413", "google_scholar": ";https://scholar.google.com.tw/citations?user=iJUWS9YAAAAJ;https://scholar.google.com.tw/citations?hl=en;a3-Gl8YAAAAJ;bndb0gYAAAAJ", "orcid": ";;0000-0002-4180-8255;0000-0001-9325-5341;", "linkedin": ";;;mingchingchang/edit/forms/intro/new/?profileFormEntryPoint=PROFILE_SECTION;wei-chao-chen-b4b0bb1/", "or_profile": "~Po-Hsuan_Huang2;~Chia-Ching_Lin1;~Chih-Fan_Hsu1;~Ming-Ching_Chang1;~Wei-Chao_Chen1", "aff": ";Inventec Inc.;Inventec Inc.;State University of New York at Albany;Inventec Inc.", "aff_domain": ";inventec.com;inventec.com;albany.edu;inventec.com", "position": ";Researcher;Researcher;Assistant Professor;Senior Vice President", "bibtex": "@misc{\nhuang2024learning,\ntitle={Learning with Instance-Dependent Noisy Labels by Hard Sample Selection with Anchor Hallucination},\nauthor={Po-Hsuan Huang and Chia-Ching Lin and Chih-Fan Hsu and Ming-Ching Chang and Wei-Chao Chen},\nyear={2024},\nurl={https://openreview.net/forum?id=3nyovHUr5A}\n}", "github": "", "project": "", "reviewers": "Yvwi;T8rR;VL2q", "site": "https://openreview.net/forum?id=3nyovHUr5A", "pdf_size": 2037681, "rating": "3;3;5", "confidence": "5;4;4", "soundness": "2;2;3", "contribution": "1;2;2", "presentation": "1;3;3", "wc_summary": "83;16;85", "wc_strengths": "12;9;17", "wc_weaknesses": "297;94;88", "wc_questions": "2;7;91", "wc_review": "394;126;281", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 3.6666666666666665, 0.9428090415820634 ], "confidence_avg": [ 4.333333333333333, 0.4714045207910317 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 1.6666666666666667, 0.4714045207910317 ], "presentation_avg": [ 2.3333333333333335, 0.9428090415820634 ], "wc_summary_avg": [ 61.333333333333336, 32.0659043568433 ], "wc_strengths_avg": [ 12.666666666666666, 3.2998316455372216 ], "wc_weaknesses_avg": [ 159.66666666666666, 97.14021938528974 ], "wc_questions_avg": [ 33.333333333333336, 40.827550610940264 ], "wc_review_avg": [ 267.0, 109.85748343497892 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 3, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.4999999999999999, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:-aZk3EVbOrMJ:scholar.google.com/&scioq=Learning+with+Instance-Dependent+Noisy+Labels+by+Hard+Sample+Selection+with+Anchor+Hallucination&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;1;0", "aff_unique_norm": "Inventec Corporation;State University of New York", "aff_unique_dep": ";", "aff_unique_url": "https://www.inventec.com;https://www.albany.edu", "aff_unique_abbr": "Inventec;SUNY Albany", 
"aff_campus_unique_index": "0;0;1;0", "aff_campus_unique": "Taiwan;Albany", "aff_country_unique_index": "0;0;1;0", "aff_country_unique": "China;United States" }, { "title": "SEGNO: Generalizing Equivariant Graph Neural Networks with Physical Inductive Biases", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19496", "id": "3oTPsORaDH", "author_site": "Yang Liu, Jiashun Cheng, Haihong Zhao, Tingyang Xu, Peilin Zhao, Fugee Tsung, Jia Li, Yu Rong", "tldr": "", "abstract": "Graph Neural Networks (GNNs) with equivariant properties have emerged as powerful tools for modeling complex dynamics of multi-object physical systems. However, their generalization ability is limited by the inadequate consideration of physical inductive biases: (1) Existing studies overlook the continuity of transitions among system states, opting to employ several discrete transformation layers to learn the direct mapping between two adjacent states; (2) Most models only account for first-order velocity information, despite the fact that many physical systems are governed by second-order motion laws. To incorporate these inductive biases, we propose the Second-order Equivariant Graph Neural Ordinary Differential Equation (SEGNO). Specifically, we show how the second-order continuity can be incorporated into GNNs while maintaining the equivariant property. Furthermore, we offer theoretical insights into SEGNO, highlighting that it can learn a unique trajectory between adjacent states, which is crucial for model generalization. Additionally, we prove that the discrepancy between this learned trajectory of SEGNO and the true trajectory is bounded. Extensive experiments on complex dynamical systems including molecular dynamics and motion capture demonstrate that our model yields a significant improvement over the state-of-the-art baselines.", "keywords": "Equivariant Graph Neural Network;Graph Neural Network", "primary_area": "learning on graphs and other geometries & topologies", "supplementary_material": "/attachment/39e5fdfd3c0682b49cf79245d7776f22592626f6.zip", "author": "Yang Liu;Jiashun Cheng;Haihong Zhao;Tingyang Xu;Peilin Zhao;Fugee Tsung;Jia Li;Yu Rong", "authorids": "~Yang_Liu21;~Jiashun_Cheng1;~Haihong_Zhao2;~Tingyang_Xu1;~Peilin_Zhao2;~Fugee_Tsung1;~Jia_Li4;~Yu_Rong1", "gender": "M;M;M;;M;M;M;M", "homepage": "https://scholar.google.com/citations?hl=zh-CN&user=IWyM6l0AAAAJ;https://www.linkedin.com/in/jiashun-cheng-b2b31a149/;;;https://ieda.ust.hk/dfaculty/tsung/;https://sites.google.com/view/lijia;https://royrong.me/;https://haihongzhao.com", "dblp": "51/3710-245;323/4178;157/0940;84/8411;95/2794;23/6950-9;24/10036-1;116/7210", "google_scholar": "https://scholar.google.com/citations?hl=zh-CN;HVKMb10AAAAJ;6gIs5YMAAAAJ;https://scholar.google.com.hk/citations?user=HPeX_YcAAAAJ;yQVoXS0AAAAJ;1gSbcYoAAAAJ;https://scholar.google.com.hk/citations?user=itezhEMAAAAJ;", "orcid": "0000-0002-2633-512X;0000-0002-5485-7224;0009-0002-0106-8376;0000-0001-8543-3953;0000-0002-0575-8254;0000-0002-6362-4385;0000-0001-7387-302X;0000-0003-4188-6517", "linkedin": ";;;;ftsung/;;;", "or_profile": "~Yang_Liu21;~Jiashun_Cheng1;~Tingyang_Xu1;~Peilin_Zhao2;~Fugee_Tsung1;~Jia_Li4;~Yu_Rong1;~Haihong_ZHAO1", "aff": "Hong Kong University of Science and Technology;Hong Kong University of Science and Technology;Tencent AI Lab;Tencent;Hong Kong University of Science and Technology;Hong Kong University of Science and Technology (Guangzhou);Tencent AI Lab;Hong Kong University of Science and Technology", "aff_domain": 
"ust.hk;ust.hk;tencent.com;tencent.com;ust.hk;ust.hk;tencent.com;hkust.edu", "position": "PhD student;PhD student;Researcher;Researcher;Full Professor;Assistant Professor;Principal Researcher;PhD student", "bibtex": "@inproceedings{\nliu2024segno,\ntitle={{SEGNO}: Generalizing Equivariant Graph Neural Networks with Physical Inductive Biases},\nauthor={Yang Liu and Jiashun Cheng and Haihong Zhao and Tingyang Xu and Peilin Zhao and Fugee Tsung and Jia Li and Yu Rong},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=3oTPsORaDH}\n}", "github": "", "project": "", "reviewers": "mXJL;GrTs;rsLd", "pdf_size": 2762438, "rating": "6;6;8", "confidence": "4;4;3", "soundness": "3;3;4", "contribution": "2;2;4", "presentation": "3;3;3", "wc_summary": "389;56;81", "wc_strengths": "2;61;150", "wc_weaknesses": "2;327;56", "wc_questions": "2;271;80", "wc_review": "395;715;367", "wc_reply_reviewers": "0;17;23", "wc_reply_authors": "284;1874;492", "reply_reviewers": "0;1;1", "reply_authors": "2;4;2", "rating_avg": [ 6.666666666666667, 0.9428090415820634 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 3.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 0.9428090415820634 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 175.33333333333334, 151.42948487295627 ], "wc_strengths_avg": [ 71.0, 60.83310502240262 ], "wc_weaknesses_avg": [ 128.33333333333334, 142.1978277690001 ], "wc_questions_avg": [ 117.66666666666667, 113.00245818368535 ], "wc_review_avg": [ 492.3333333333333, 157.8635134820231 ], "wc_reply_reviewers_avg": [ 13.333333333333334, 9.741092797468305 ], "wc_reply_authors_avg": [ 883.3333333333334, 705.6350961289332 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 2.6666666666666665, 0.9428090415820634 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": -0.9999999999999998, "gs_citation": 22, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12252397141382208062&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=3oTPsORaDH", "pdf": "https://openreview.net/pdf?id=3oTPsORaDH", "email": "ust.hk;ust.hk;tencent.com;tencent.com;ust.hk;ust.hk;tencent.com;hkust.edu", "author_num": 8, "aff_unique_index": "0;0;1;1;0;0;1;0", "aff_unique_norm": "Hong Kong University of Science and Technology;Tencent", "aff_unique_dep": ";Tencent AI Lab", "aff_unique_url": "https://www.ust.hk;https://ai.tencent.com", "aff_unique_abbr": "HKUST;Tencent AI Lab", "aff_campus_unique_index": "0;0;0;0;0", "aff_campus_unique": "Hong Kong SAR;", "aff_country_unique_index": "0;0;0;0;0;0;0;0", "aff_country_unique": "China" }, { "title": "Where We Have Arrived in Proving the Emergence of Sparse Interaction Primitives in DNNs", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19495", "id": "3pWSL8My6B", "author_site": "Qihan Ren, Jiayang Gao, Wen Shen, Quanshi Zhang", "tldr": "", "abstract": "This study aims to prove the emergence of symbolic concepts (or more precisely, sparse primitive inference patterns) in well-trained deep neural networks (DNNs). Specifically, we prove the following three conditions for the emergence. (i) The high-order derivatives of the network output with respect to the input variables are all zero. 
(ii) The DNN can be used on occluded samples, and when the input sample is less occluded, the DNN will yield higher confidence. (iii) The confidence of the DNN does not significantly degrade on occluded samples. These conditions are quite common, and we prove that under these conditions, the DNN will only encode a relatively small number of sparse interactions between input variables. Moreover, we can consider such interactions as symbolic primitive inference patterns encoded by a DNN, because we show that inference scores of the DNN on an exponentially large number of randomly masked samples can always be well mimicked by numerical effects of just a few interactions.", "keywords": "Explainable AI;Neural networks;Symbolism", "primary_area": "visualization or interpretation of learned representations", "supplementary_material": "", "author": "Qihan Ren;Jiayang Gao;Wen Shen;Quanshi Zhang", "authorids": "~Qihan_Ren1;~Jiayang_Gao1;~Wen_Shen3;~Quanshi_Zhang1", "gender": "M;F;M;M", "homepage": "https://nebularaid2000.github.io/;https://ada-shen.github.io/;http://qszhang.com;https://github.com/gjy0515", "dblp": "268/5838;55/8186-2;http://dblp.uni-trier.de/pers/hd/z/Zhang:Quanshi;", "google_scholar": "ybTy_DwAAAAJ;;iFFhHK0AAAAJ;", "orcid": ";0000-0002-4210-5447;;", "linkedin": ";;;", "or_profile": "~Qihan_Ren1;~Wen_Shen3;~Quanshi_Zhang1;~\u4f73\u9633_\u9ad81", "aff": "Shanghai Jiaotong University;Shanghai Jiaotong University;Shanghai Jiaotong University;Shanghai Jiaotong University", "aff_domain": "sjtu.edu.cn;sjtu.edu.cn;sjtu.edu.cn;sjtu.edu.cn", "position": "PhD student;Postdoc;Associate Professor;Undergrad student", "bibtex": "@inproceedings{\nren2024where,\ntitle={Where We Have Arrived in Proving the Emergence of Sparse Interaction Primitives in {DNN}s},\nauthor={Qihan Ren and Jiayang Gao and Wen Shen and Quanshi Zhang},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=3pWSL8My6B}\n}", "github": "", "project": "", "reviewers": "iVY1;8DUx;JPCH;WKdR", "pdf_size": 3099888, "rating": "6;6;8;8", "confidence": "2;3;3;2", "soundness": "2;3;4;3", "contribution": "2;2;4;3", "presentation": "3;3;4;3", "wc_summary": "36;67;97;113", "wc_strengths": "39;33;113;46", "wc_weaknesses": "336;260;107;409", "wc_questions": "107;164;50;58", "wc_review": "518;524;367;626", "wc_reply_reviewers": "53;373;13;32", "wc_reply_authors": "981;3311;1169;1830", "reply_reviewers": "1;4;1;1", "reply_authors": "2;5;2;3", "rating_avg": [ 7.0, 1.0 ], "confidence_avg": [ 2.5, 0.5 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 2.75, 0.82915619758885 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 78.25, 29.45653577731095 ], "wc_strengths_avg": [ 57.75, 32.22867512014727 ], "wc_weaknesses_avg": [ 278.0, 111.90397669430698 ], "wc_questions_avg": [ 94.75, 45.54873763344051 ], "wc_review_avg": [ 508.75, 92.41042960618677 ], "wc_reply_reviewers_avg": [ 117.75, 148.04623433238686 ], "wc_reply_authors_avg": [ 1822.75, 915.2694616887422 ], "reply_reviewers_avg": [ 1.75, 1.299038105676658 ], "reply_authors_avg": [ 3.0, 1.224744871391589 ], "replies_avg": [ 27, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 13, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=4914810873657200932&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 0, "openreview": "https://openreview.net/forum?id=3pWSL8My6B", "pdf": "https://openreview.net/pdf?id=3pWSL8My6B", "email": 
"sjtu.edu.cn;sjtu.edu.cn;sjtu.edu.cn;sjtu.edu.cn", "author_num": 4, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "Shanghai Jiao Tong University", "aff_unique_dep": "", "aff_unique_url": "https://www.sjtu.edu.cn", "aff_unique_abbr": "SJTU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "China" }, { "title": "Rethinking the Uniformity Metric in Self-Supervised Learning", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19494", "id": "3pf2hEdu8B", "author_site": "Xianghong Fang, Jian Li, Qiang Sun, Wang Benyou", "tldr": "", "abstract": "Uniformity plays an important role in evaluating learned representations, providing insights into self-supervised learning. In our quest for effective uniformity metrics, we pinpoint four principled properties that such metrics should possess. Namely, an effective uniformity metric should remain invariant to instance permutations and sample replications while accurately capturing feature redundancy and dimensional collapse. Surprisingly, we find that the uniformity metric proposed by \\citet{Wang2020UnderstandingCR} fails to satisfy the majority of these properties. Specifically, their metric is sensitive to sample replications, and can not account for feature redundancy and dimensional collapse correctly. To overcome these limitations, we introduce a new uniformity metric based on the Wasserstein distance, which satisfies all the aforementioned properties. Integrating this new metric in existing self-supervised learning methods effectively mitigates dimensional collapse and consistently improves their performance on downstream tasks involving CIFAR-10 and CIFAR-100 datasets. Code is available at \\url{https://github.com/statsle/WassersteinSSL}.", "keywords": "Effective uniformity metrics;dimensional collapse;Wasserstein distance;self-supervised learning", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/c684951f3e22d50fe6f7a9a520403451de0fd62b.pdf", "author": "Xianghong Fang;Jian Li;Qiang Sun;Benyou Wang", "authorids": "~Xianghong_Fang1;~Jian_Li17;~Qiang_Sun2;~Benyou_Wang2", "gender": "M;M;M;M", "homepage": "https://jack57lee.github.io/;https://sites.google.com/view/qsun;https://wabyking.github.io/old.html;", "dblp": "33/5448-54.html;73/2066-7;169/1793;202/6322.html", "google_scholar": ";f0V2fAYAAAAJ;Jk4vJU8AAAAJ;https://scholar.google.com.hk/citations?user=hQfxe5QAAAAJ", "orcid": ";;0000-0002-1501-9914;0000-0003-2250-6961", "linkedin": ";;;", "or_profile": "~Jian_Li17;~Qiang_Sun2;~Benyou_Wang2;~Fang_XiangHong1", "aff": "Tencent;University of Toronto;The Chinese University of Hong Kong, Shenzhen;University of Toronto", "aff_domain": "tencent.com;utoronto.ca;cuhk.edu.cn;utoronto.ca", "position": "Researcher;Full Professor;Assistant Professor;PhD student", "bibtex": "@inproceedings{\nfang2024rethinking,\ntitle={Rethinking the Uniformity Metric in Self-Supervised Learning},\nauthor={Xianghong Fang and Jian Li and Qiang Sun and Benyou Wang},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=3pf2hEdu8B}\n}", "github": "", "project": "", "reviewers": "u9aL;a1G3;KkL8;RABe", "pdf_size": 1523269, "rating": "5;5;6;8", "confidence": "4;5;2;3", "soundness": "3;2;3;3", "contribution": "2;2;3;3", "presentation": "3;2;2;4", "wc_summary": "119;96;29;60", "wc_strengths": "131;26;17;75", 
"wc_weaknesses": "126;155;25;116", "wc_questions": "19;4;12;52", "wc_review": "395;281;83;303", "wc_reply_reviewers": "171;47;15;0", "wc_reply_authors": "1304;1608;398;335", "reply_reviewers": "1;1;1;0", "reply_authors": "3;5;1;1", "rating_avg": [ 6.0, 1.224744871391589 ], "confidence_avg": [ 3.5, 1.118033988749895 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.75, 0.82915619758885 ], "wc_summary_avg": [ 76.0, 34.32928778754374 ], "wc_strengths_avg": [ 62.25, 45.41681957160805 ], "wc_weaknesses_avg": [ 105.5, 48.63383595810637 ], "wc_questions_avg": [ 21.75, 18.25342433627181 ], "wc_review_avg": [ 265.5, 113.71345566818378 ], "wc_reply_reviewers_avg": [ 58.25, 67.27323018853785 ], "wc_reply_authors_avg": [ 911.25, 555.6983781693086 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 2.5, 1.6583123951777 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.5477225575051661, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:P8Ys2UUAgwIJ:scholar.google.com/&scioq=Rethinking+the+Uniformity+Metric+in+Self-Supervised+Learning&hl=en&as_sdt=0,33", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=3pf2hEdu8B", "pdf": "https://openreview.net/pdf?id=3pf2hEdu8B", "email": "tencent.com;utoronto.ca;cuhk.edu.cn;utoronto.ca", "author_num": 4, "aff_unique_index": "0;1;2;1", "aff_unique_norm": "Tencent;University of Toronto;Chinese University of Hong Kong", "aff_unique_dep": "Tencent Holdings Limited;;", "aff_unique_url": "https://www.tencent.com;https://www.utoronto.ca;https://www.cuhk.edu.cn", "aff_unique_abbr": "Tencent;U of T;CUHK", "aff_campus_unique_index": "1", "aff_campus_unique": ";Shenzhen", "aff_country_unique_index": "0;1;0;1", "aff_country_unique": "China;Canada" }, { "id": "3pgJNIx3gc", "title": "AlphaFold Distillation for Protein Design", "track": "main", "status": "Reject", "tldr": "", "abstract": "Inverse protein folding, the process of designing sequences that fold into a specific 3D structure, is crucial in bio-engineering and drug discovery. Traditional methods rely on experimentally resolved structures, but these cover only a small fraction of protein sequences. Forward folding models like AlphaFold offer a potential solution by accurately predicting structures from sequences. However, these models are too slow for integration into the optimization loop of inverse folding models during training.\nTo address this, we propose using knowledge distillation on folding model confidence metrics, such as pTM or pLDDT scores, to create faster and end-to-end differentiable distilled model. This model can then be used as a structure consistency regularizer in training the inverse folding model. Our technique is versatile and can be applied to other design tasks, such as sequence-based protein infilling.\nExperimental results show that our method outperforms non-regularized baselines, yielding up to 3\\% improvement in sequence recovery and up to 45\\% improvement in protein diversity while maintaining structural consistency in generated sequences. 
Anonymized code for this work is available at https://anonymous.4open.science/r/AFDistill-28C3", "keywords": "Inverse Protein Folding Design;Protein Design;Model Distillation;AlphaFold;Protein Folding", "primary_area": "applications to physical sciences (physics, chemistry, biology, etc.)", "supplementary_material": "", "author": "Igor Melnyk;Aurelie Lozano;Payel Das;Vijil Chenthamarakshan", "authorids": "~Igor_Melnyk1;~Aurelie_Lozano1;~Payel_Das1;~Vijil_Chenthamarakshan1", "gender": "M;F;F;M", "homepage": "https://imelnyk.github.io/;https://research.ibm.com/people/aurelie-lozano;;https://researcher.watson.ibm.com/researcher/view.php?person=us-ecvijil", "dblp": ";06/274;56/7926;", "google_scholar": "4vDRTWwAAAAJ;4wTGaDsAAAAJ;;g9hboJ0AAAAJ", "orcid": ";;;", "linkedin": ";;;", "or_profile": "~Igor_Melnyk1;~Aurelie_Lozano1;~Payel_Das1;~Vijil_Chenthamarakshan1", "aff": "International Business Machines;IBM Research;IBM, International Business Machines;International Business Machines", "aff_domain": "ibm.com;us.ibm.com;us.ibm.com;ibm.com", "position": "Researcher;Principal Researcher;Principal Researcher;Senior Technical Staff member", "bibtex": "@misc{\nmelnyk2024alphafold,\ntitle={AlphaFold Distillation for Protein Design},\nauthor={Igor Melnyk and Aurelie Lozano and Payel Das and Vijil Chenthamarakshan},\nyear={2024},\nurl={https://openreview.net/forum?id=3pgJNIx3gc}\n}", "github": "", "project": "", "reviewers": "6HvL;XUpx;s5YM", "site": "https://openreview.net/forum?id=3pgJNIx3gc", "pdf_size": 2714676, "rating": "3;3;5", "confidence": "5;4;4", "soundness": "1;3;2", "contribution": "2;2;2", "presentation": "2;3;3", "wc_summary": "75;97;82", "wc_strengths": "26;29;32", "wc_weaknesses": "161;125;47", "wc_questions": "45;11;124", "wc_review": "307;262;285", "wc_reply_reviewers": "68;112;0", "wc_reply_authors": "422;1094;487", "reply_reviewers": "1;1;0", "reply_authors": "1;2;1", "rating_avg": [ 3.6666666666666665, 0.9428090415820634 ], "confidence_avg": [ 4.333333333333333, 0.4714045207910317 ], "soundness_avg": [ 2.0, 0.816496580927726 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 84.66666666666667, 9.177266598624136 ], "wc_strengths_avg": [ 29.0, 2.449489742783178 ], "wc_weaknesses_avg": [ 111.0, 47.58150901348127 ], "wc_questions_avg": [ 60.0, 47.33568069296845 ], "wc_review_avg": [ 284.6666666666667, 18.372685039360892 ], "wc_reply_reviewers_avg": [ 60.0, 46.07240678178932 ], "wc_reply_authors_avg": [ 667.6666666666666, 302.628852263333 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 1.3333333333333333, 0.4714045207910317 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.4999999999999999, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=15258041265459336797&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 6, "aff_unique_index": "0;1;2;0", "aff_unique_norm": "International Business Machines Corporation;IBM;International Business Machines", "aff_unique_dep": ";IBM Research;", "aff_unique_url": "https://www.ibm.com;https://www.ibm.com/research;https://www.ibm.com", "aff_unique_abbr": "IBM;IBM;IBM", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "title": "LRR: Language-Driven Resamplable Continuous Representation against Adversarial Tracking Attacks", "status": "Poster", "track": "main", "site": 
"https://iclr.cc/virtual/2024/poster/19493", "id": "3qo1pJHabg", "author_site": "Jianlang Chen, Xuhong Ren, Qing Guo, Felix Juefei-Xu, Di Lin, Wei Feng, Lei Ma, Jianjun Zhao", "tldr": "", "abstract": "Visual object tracking plays a critical role in visual-based autonomous systems, as it aims to estimate the position and size of the object of interest within a live video. Despite significant progress made in this field, state-of-the-art (SOTA) trackers often fail when faced with adversarial perturbations in the incoming frames. This can lead to significant robustness and security issues when these trackers are deployed in the real world. To achieve high accuracy on both clean and adversarial data, we propose building a spatial-temporal continuous representation using the semantic text guidance of the object of interest. This novel continuous representation enables us to reconstruct incoming frames to maintain semantic and appearance consistency with the object of interest and its clean counterparts. As a result, our proposed method successfully defends against different SOTA adversarial tracking attacks while maintaining high accuracy on clean data. In particular, our method significantly increases tracking accuracy under adversarial attacks with around 90% relative improvement on UAV123, which is even higher than the accuracy on clean data.", "keywords": "Tracking defence;spatial-temporal implicit representation;languange-image model", "primary_area": "applications to robotics, autonomy, planning", "supplementary_material": "/attachment/68d998940505f042f10064d97ab0ab3404c58553.pdf", "author": "Jianlang Chen;Xuhong Ren;Qing Guo;Felix Juefei-Xu;Di Lin;Wei Feng;Lei Ma;Jianjun Zhao", "authorids": "~Jianlang_Chen1;~Xuhong_Ren1;~Qing_Guo3;~Felix_Juefei-Xu1;~Di_Lin3;~Wei_Feng1;~Lei_Ma1;~Jianjun_Zhao1", "gender": ";F;M;;M;M;M;M", "homepage": ";https://www.facebook.com/profile.php?id=100074098905175;https://tsingqguo.github.io;;https://dilincv.github.io/;;https://www.malei.org;http://stap.ait.kyushu-u.ac.jp/~zhao/", "dblp": ";;25/3038-5;;20/3191-2.html;17/1152-5;20/6534-3;71/6948", "google_scholar": ";;Rj2x4QUAAAAJ;;rW0r-hMAAAAJ;https://scholar.google.co.jp/citations?user=7ory1i8AAAAJ;xsfGc58AAAAJ;https://scholar.google.com/scholar?hl=en", "orcid": ";;0000-0003-0974-9299;;;;;", "linkedin": ";;;;;;lei-ma-345a0484;jianjunzhao/", "or_profile": "~Jianlang_Chen1;~Xuhong_Ren1;~Qing_Guo3;~Felix_Juefei-Xu1;~Di_Lin3;~Wei_Feng1;~Lei_Ma1;~Jianjun_Zhao1", "aff": ";Tianjin University of Technology; Agency for Science, Technology and Research (A*STAR));;Tianjin University;Tianjin University;University of Alberta;Kyushu University", "aff_domain": ";tjut.edu.cn;cfar.a-star.edu.sg;;tju.edu.cn;tju.edu.cn;ualberta.ca;kyushu-u.ac.jp", "position": ";PhD student;Researcher;;Associate Professor;Full Professor;Associate Professor;Full Professor", "bibtex": "@inproceedings{\nchen2024lrr,\ntitle={{LRR}: Language-Driven Resamplable Continuous Representation against Adversarial Tracking Attacks},\nauthor={Jianlang Chen and Xuhong Ren and Qing Guo and Felix Juefei-Xu and Di Lin and Wei Feng and Lei Ma and Jianjun Zhao},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=3qo1pJHabg}\n}", "github": "", "project": "", "reviewers": "DMWE;n1Fj;bxnS", "pdf_size": 7849670, "rating": "5;6;6", "confidence": "5;4;4", "soundness": "2;3;3", "contribution": "2;3;3", "presentation": "2;2;2", "wc_summary": "71;76;71", "wc_strengths": "34;52;44", "wc_weaknesses": 
"126;135;118", "wc_questions": "15;48;48", "wc_review": "246;311;281", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "1226;1126;603", "reply_reviewers": "0;0;0", "reply_authors": "4;4;4", "rating_avg": [ 5.666666666666667, 0.4714045207910317 ], "confidence_avg": [ 4.333333333333333, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.0, 0.0 ], "wc_summary_avg": [ 72.66666666666667, 2.357022603955158 ], "wc_strengths_avg": [ 43.333333333333336, 7.363574011458174 ], "wc_weaknesses_avg": [ 126.33333333333333, 6.944222218666553 ], "wc_questions_avg": [ 37.0, 15.556349186104045 ], "wc_review_avg": [ 279.3333333333333, 26.562295750848712 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 985.0, 273.18247869632245 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 4.0, 0.0 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": -0.9999999999999998, "gs_citation": 4, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6269508987053163622&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=3qo1pJHabg", "pdf": "https://openreview.net/pdf?id=3qo1pJHabg", "email": ";tjut.edu.cn;cfar.a-star.edu.sg;;tju.edu.cn;tju.edu.cn;ualberta.ca;kyushu-u.ac.jp", "author_num": 8, "aff_unique_index": "0;1;2;2;3;4", "aff_unique_norm": "Tianjin University of Technology;Agency for Science, Technology and Research;Tianjin University;University of Alberta;Kyushu University", "aff_unique_dep": ";;;;", "aff_unique_url": "http://www.tjut.edu.cn;https://www.a-star.edu.sg;http://www.tju.edu.cn;https://www.ualberta.ca;https://www.kyushu-u.ac.jp", "aff_unique_abbr": "TUT;A*STAR;TJU;UAlberta;Kyushu U", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;0;0;2;3", "aff_country_unique": "China;Singapore;Canada;Japan" }, { "id": "3rBu7dR7rm", "title": "Unified Long-Term Time-Series Forecasting Benchmark", "track": "main", "status": "Reject", "tldr": "", "abstract": "In order to support the advancement of machine learning methods for predicting time-series data, we present a comprehensive dataset designed explicitly for long-term time-series forecasting. We incorporate a collection of datasets obtained from diverse, dynamic systems and real-life records. Each dataset is standardized by dividing it into training and test trajectories with predetermined lookback lengths. We include trajectories of length up to $2000$ to ensure a reliable evaluation of long-term forecasting capabilities. To determine the most effective model in diverse scenarios, we conduct an extensive benchmarking analysis using classical and state-of-the-art models, namely LSTM, DeepAR, NLinear, N-Hits, PatchTST, and LatentODE. Our findings reveal intriguing performance comparisons among these models, highlighting the dataset-dependent nature of model effectiveness. Notably, we introduce a custom latent NLinear model and enhance DeepAR with a curriculum learning phase. 
Both consistently outperform their vanilla counterparts.", "keywords": "time-series;forecasting;long-term;benchmark;neural network", "primary_area": "datasets and benchmarks", "supplementary_material": "/attachment/d531b4956510f30cbbe4177c5acf89bf1d1d531c.zip", "author": "Jacek Cyranka;Szymon Jan Haponiuk", "authorids": "~Jacek_Cyranka1;~Szymon_Jan_Haponiuk1", "gender": ";M", "homepage": ";", "dblp": "142/0441;", "google_scholar": "-60x4zkAAAAJ;2PRTAF4AAAAJ", "orcid": "0000-0001-5719-0616;", "linkedin": "cyranka/;szymon-haponiuk-a3901115b/", "or_profile": "~Jacek_Cyranka1;~Szymon_Jan_Haponiuk1", "aff": "University of Warsaw;University of Warsaw", "aff_domain": "mimuw.edu.pl;mimuw.edu.pl", "position": "Assistant Professor;MS student", "bibtex": "@misc{\ncyranka2024unified,\ntitle={Unified Long-Term Time-Series Forecasting Benchmark},\nauthor={Jacek Cyranka and Szymon Jan Haponiuk},\nyear={2024},\nurl={https://openreview.net/forum?id=3rBu7dR7rm}\n}", "github": "", "project": "", "reviewers": "av6e;ptT1;WuTL", "site": "https://openreview.net/forum?id=3rBu7dR7rm", "pdf_size": 5058133, "rating": "3;5;5", "confidence": "4;4;2", "soundness": "2;2;1", "contribution": "2;2;1", "presentation": "2;3;2", "wc_summary": "38;132;216", "wc_strengths": "18;221;8", "wc_weaknesses": "150;404;8", "wc_questions": "44;97;8", "wc_review": "250;854;240", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "614;1514;518", "reply_reviewers": "0;0;0", "reply_authors": "1;3;1", "rating_avg": [ 4.333333333333333, 0.9428090415820634 ], "confidence_avg": [ 3.3333333333333335, 0.9428090415820634 ], "soundness_avg": [ 1.6666666666666667, 0.4714045207910317 ], "contribution_avg": [ 1.6666666666666667, 0.4714045207910317 ], "presentation_avg": [ 2.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 128.66666666666666, 72.70641114937679 ], "wc_strengths_avg": [ 82.33333333333333, 98.1370923193106 ], "wc_weaknesses_avg": [ 187.33333333333334, 163.80747507024486 ], "wc_questions_avg": [ 49.666666666666664, 36.55437350334734 ], "wc_review_avg": [ 448.0, 287.11437906636905 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 882.0, 448.60673200477055 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.6666666666666667, 0.9428090415820634 ], "replies_avg": [ 10, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.5, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11549142946293258542&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "aff_unique_index": "0;0", "aff_unique_norm": "University of Warsaw", "aff_unique_dep": "", "aff_unique_url": "https://www.uw.edu.pl", "aff_unique_abbr": "UW", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "Poland" }, { "title": "Boosting Vanilla Lightweight Vision Transformers via Re-parameterization", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19492", "id": "3rmpixOjPS", "author_site": "Zhentao Tan, Xiaodan Li, Yue Wu, Qi Chu, Le Lu, Nenghai Yu, Jieping Ye", "tldr": "", "abstract": "Large-scale Vision Transformers have achieved promising performance on downstream tasks through feature pre-training. However, the performance of vanilla lightweight Vision Transformers (ViTs) is still far from satisfactory compared to that of recent lightweight CNNs or hybrid networks. 
In this paper, we aim to unlock the potential of vanilla lightweight ViTs by exploring the adaptation of the widely-used re-parameterization technology to ViTs for improving learning ability during training without increasing the inference cost. The main challenge comes from the fact that CNNs perfectly complement with re-parameterization over convolution and batch normalization, while vanilla Transformer architectures are mainly comprised of linear and layer normalization layers. We propose to incorporate the nonlinear ensemble into linear layers by expanding the depth of the linear layers with batch normalization and fusing multiple linear features with hierarchical representation ability through a pyramid structure. We also discover and solve a new transformer-specific distribution rectification problem caused by multi-branch re-parameterization. Finally, we propose our Two-Dimensional Re-parameterized Linear module (TDRL) for ViTs. Under the popular self-supervised pre-training and supervised fine-tuning strategy, our TDRL can be used in these two stages to enhance both generic and task-specific representation. Experiments demonstrate that our proposed method not only boosts the performance of vanilla Vit-Tiny on various vision tasks to new state-of-the-art (SOTA) but also shows promising generality ability on other networks. Code will be available.", "keywords": "Vision Transformers;Re-parameterization;Lightweight Models", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/75c9d86ba84232b31ffd8b9cdd0286c7a6152539.zip", "author": "Zhentao Tan;Xiaodan Li;Yue Wu;Qi Chu;Le Lu;Nenghai Yu;Jieping Ye", "authorids": "~Zhentao_Tan1;~Xiaodan_Li1;~Yue_Wu18;~Qi_Chu1;~Le_Lu3;~Nenghai_Yu1;~Jieping_Ye4", "gender": "M;F;;M;M;M;M", "homepage": ";;;http://www.cs.jhu.edu/~lelu/;;http://yelabs.net/;", "dblp": "211/5776;126/7789;52/9077-1;78/6574-1.html;96/5144;03/5454;", "google_scholar": "VCX7itEAAAAJ;YximuHAAAAAJ;JZjOMdsAAAAJ;kZn0f6gAAAAJ;https://scholar.google.com.hk/citations?user=7620QAMAAAAJ;T9AzhwcAAAAJ;srajsjoAAAAJ", "orcid": "0000-0001-9095-4462;;0000-0003-3028-0755;0000-0002-6799-9416;;0000-0001-8662-5818;", "linkedin": ";;;tigerlelu/;;;", "or_profile": "~Zhentao_Tan1;~Xiaodan_Li1;~Qi_Chu1;~Le_Lu3;~Nenghai_Yu1;~Jieping_Ye4;~Yue_Wu3", "aff": "University of Science and Technology of China;Alibaba Group;University of Science and Technology of China;Alibaba Group;University of Science and Technology of China;Alibaba Group;Alibaba Group", "aff_domain": "ustc.edu.cn;alibaba-inc.com;ustc.edu.cn;alibaba-inc.com;ustc.edu.cn;alibaba-inc.com;alibaba-inc.com", "position": "Postdoc;Researcher;Associate Professor;Full Professor;Full Professor;Principal Researcher;Researcher", "bibtex": "@inproceedings{\ntan2024boosting,\ntitle={Boosting Vanilla Lightweight Vision Transformers via Re-parameterization},\nauthor={Zhentao Tan and Xiaodan Li and Yue Wu and Qi Chu and Le Lu and Nenghai Yu and Jieping Ye},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=3rmpixOjPS}\n}", "github": "", "project": "", "reviewers": "Yszy;WZef;GsFu;wWZH;HAf5", "pdf_size": 816146, "rating": "6;6;8;8;8", "confidence": "5;3;4;4;4", "soundness": "4;3;3;3;2", "contribution": "3;3;4;3;2", "presentation": "3;3;4;2;2", "wc_summary": "47;67;168;70;77", "wc_strengths": "39;37;55;131;22", "wc_weaknesses": "93;96;58;124;100", "wc_questions": "3;2;12;3;53", "wc_review": 
"182;202;293;328;252", "wc_reply_reviewers": "13;0;14;85;327", "wc_reply_authors": "589;429;543;630;1608", "reply_reviewers": "1;0;1;1;2", "reply_authors": "3;2;3;3;7", "rating_avg": [ 7.2, 0.9797958971132712 ], "confidence_avg": [ 4.0, 0.6324555320336759 ], "soundness_avg": [ 3.0, 0.6324555320336759 ], "contribution_avg": [ 3.0, 0.6324555320336759 ], "presentation_avg": [ 2.8, 0.7483314773547882 ], "wc_summary_avg": [ 85.8, 42.291370278107564 ], "wc_strengths_avg": [ 56.8, 38.54555746126913 ], "wc_weaknesses_avg": [ 94.2, 21.15088650624366 ], "wc_questions_avg": [ 14.6, 19.540726700918775 ], "wc_review_avg": [ 251.4, 54.507247224566385 ], "wc_reply_reviewers_avg": [ 87.8, 123.26783846567602 ], "wc_reply_authors_avg": [ 759.8, 429.3937121104593 ], "reply_reviewers_avg": [ 1.0, 0.6324555320336759 ], "reply_authors_avg": [ 3.6, 1.7435595774162693 ], "replies_avg": [ 33, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=3696924111028153520&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 0, "openreview": "https://openreview.net/forum?id=3rmpixOjPS", "pdf": "https://openreview.net/pdf?id=3rmpixOjPS", "email": "ustc.edu.cn;alibaba-inc.com;ustc.edu.cn;alibaba-inc.com;ustc.edu.cn;alibaba-inc.com;alibaba-inc.com", "author_num": 7, "aff_unique_index": "0;1;0;1;0;1;1", "aff_unique_norm": "University of Science and Technology of China;Alibaba Group", "aff_unique_dep": ";", "aff_unique_url": "http://www.ustc.edu.cn;https://www.alibaba.com", "aff_unique_abbr": "USTC;Alibaba", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0;0", "aff_country_unique": "China" }, { "id": "3s4fZTr1ce", "title": "RLAdapter: Bridging Large Language Models to Reinforcement Learning in Open Worlds", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "While reinforcement learning (RL) shows remarkable success in decision-making problems, it often requires a lot of interactions with the environment, and in sparse-reward environments, it is challenging to learn meaningful policies. Large Language Models (LLMs) can potentially provide valuable guidance to agents in learning policies, thereby enhancing the performance of RL algorithms in such environments. However, LLMs often encounter difficulties in understanding downstream tasks, which hinders their ability to optimally assist agents in these tasks. A common approach to mitigating this issue is to fine-tune the LLMs with task-related data, enabling them to offer useful guidance for RL agents. However, this approach encounters several difficulties, such as inaccessible model weights or the need for significant computational resources, making it impractical. In this work, we introduce RLAdapter, a framework that builds a better connection between RL algorithms and LLMs by incorporating an adapter model. Within the RLAdapter framework, fine-tuning a lightweight language model with information generated during the training process of RL agents significantly aids LLMs in adapting to downstream tasks, thereby providing better guidance for RL agents. We conducted experiments to evaluate RLAdapter in the Crafter environment, and the results show that RLAdapter surpasses the SOTA baselines. 
Furthermore, agents under our framework exhibit common-sense behaviors that are absent in baseline models.", "keywords": "Reinforcement Learning;Large Language Models", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Wanpeng Zhang;Zongqing Lu", "authorids": "~Wanpeng_Zhang1;~Zongqing_Lu2", "gender": "M;", "homepage": "https://zhangwp.com;", "dblp": "73/10693-2;", "google_scholar": "_IKNf9EAAAAJ;", "orcid": "0000-0001-5351-3449;", "linkedin": ";", "or_profile": "~Wanpeng_Zhang1;~Zongqing_Lu2", "aff": "Peking University;", "aff_domain": "pku.edu.cn;", "position": "PhD student;", "bibtex": "@misc{\nzhang2024rladapter,\ntitle={{RLA}dapter: Bridging Large Language Models to Reinforcement Learning in Open Worlds},\nauthor={Wanpeng Zhang and Zongqing Lu},\nyear={2024},\nurl={https://openreview.net/forum?id=3s4fZTr1ce}\n}", "github": "", "project": "", "reviewers": "aWpB;1niL;6tyY;mt27", "site": "https://openreview.net/forum?id=3s4fZTr1ce", "pdf_size": 2536279, "rating": "3;3;3;5", "confidence": "4;2;4;3", "soundness": "2;2;2;3", "contribution": "2;3;2;3", "presentation": "3;4;3;2", "wc_summary": "131;188;100;98", "wc_strengths": "60;135;103;80", "wc_weaknesses": "217;95;364;159", "wc_questions": "46;847;231;185", "wc_review": "454;1265;798;522", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 3.5, 0.8660254037844386 ], "confidence_avg": [ 3.25, 0.82915619758885 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 129.25, 36.355020286062285 ], "wc_strengths_avg": [ 94.5, 27.897132469126642 ], "wc_weaknesses_avg": [ 208.75, 99.47958333246073 ], "wc_questions_avg": [ 327.25, 307.7095830486922 ], "wc_review_avg": [ 759.75, 318.8842854390915 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.17407765595569782, "gs_citation": 6, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12669604310559425831&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 2, "aff_unique_index": "0", "aff_unique_norm": "Peking University", "aff_unique_dep": "", "aff_unique_url": "http://www.pku.edu.cn", "aff_unique_abbr": "Peking U", "aff_country_unique_index": "0", "aff_country_unique": "China" }, { "id": "3sOE3MFepx", "title": "PDE-Diffusion: Physic guided diffusion model for solving partial derivative equations", "track": "main", "status": "Reject", "tldr": "", "abstract": "Solving partial differential equations (PDEs) is crucial in various disciplines, and their resolution often necessitates the use of computationally intensive numerical methods as well as specialized domain expertise. While data-driven approaches have emerged as promising alternatives, they encounter limitations in terms of generalizability, interpretability, and long-horizon predictive performance, as well as issues related to temporal incoherence. 
To address these challenges, we introduce the PDE-Diffusion, a two-stage model with three distinctive features: (i) the incorporation of physics-based priors to enhance model interpretability and generalization, (ii) a two-stage diffusion model that efficiently handles physical field forecasting without requiring multi-frame inputs, and (iii) the assimilation of PDE-informed constraints to ensure temporal coherence while producing high-quality predictive results. We conduct extensive experiments to evaluate PDE-Diffusion's capabilities using the PDEBench dataset and two of our newly proposed datasets. The results indicate that PDE-Diffusion delivers state-of-the-art performance in all cases.", "keywords": "AI for science;PDE;diffusion model;generative model", "primary_area": "applications to physical sciences (physics, chemistry, biology, etc.)", "supplementary_material": "/attachment/7fecff3c4ea127c6363e0c6652a5afb4cd969e6c.zip", "author": "Chonghan Gao;Haoyi Zhou;wen xin gong;QING PO WU WU;Tianyu Chen;Qian Yu;Shanghang Zhang;Jianxin Li", "authorids": "~Chonghan_Gao1;~Haoyi_Zhou1;~wen_xin_gong1;~QING_PO_WU_WU1;~Tianyu_Chen1;~Qian_Yu4;~Shanghang_Zhang4;~Jianxin_Li3", "gender": "M;M;M;;M;F;;M", "homepage": "https://homepage-gao.vercel.app/;https://www.zhouhaoyi.com/;https://github.com/ruoyunbai;;https://github.com/Tarpelite;https://yuqian1023.github.io/;;http://myjianxin.github.io", "dblp": ";162/1287;;;;;;l/JianxinLi-2.html", "google_scholar": "9O6yafkAAAAJ;mbrFlN0AAAAJ;;;;mmm90qgAAAAJ;;EY2lqD0AAAAJ", "orcid": ";0000-0002-2393-3634;;;;0000-0002-0538-7940;;0000-0001-5152-0055", "linkedin": ";haoyi-zhou-54a7a69a/;;;;;;", "or_profile": "~Chonghan_Gao1;~Haoyi_Zhou1;~wen_xin_gong1;~QING_PO_WU_WU1;~Tianyu_Chen1;~Qian_Yu4;~Shanghang_Zhang4;~Jianxin_Li3", "aff": "Beihang University;Beihang University;Beihang University;;Beihang University;Beihang University;;Beihang University ", "aff_domain": "buaa.edu.cn;buaa.edu.cn;buaa.edu.cn;;buaa.edu.cn;buaa.edu.cn;;buaa.edu.cn", "position": "PhD student;Assistant Professor;Undergrad student;;PhD student;Associate Professor;;Full Professor", "bibtex": "@misc{\ngao2024pdediffusion,\ntitle={{PDE}-Diffusion: Physic guided diffusion model for solving partial derivative equations},\nauthor={Chonghan Gao and Haoyi Zhou and wen xin gong and QING PO WU WU and Tianyu Chen and Qian Yu and Shanghang Zhang and Jianxin Li},\nyear={2024},\nurl={https://openreview.net/forum?id=3sOE3MFepx}\n}", "github": "", "project": "", "reviewers": "Mvr7;uZRL;Hhh3;t73C;p93J", "site": "https://openreview.net/forum?id=3sOE3MFepx", "pdf_size": 443502, "rating": "1;1;3;3;3", "confidence": "4;5;4;3;5", "soundness": "1;1;1;2;3", "contribution": "2;1;1;2;2", "presentation": "2;1;2;2;1", "wc_summary": "38;28;116;52;38", "wc_strengths": "49;25;14;58;67", "wc_weaknesses": "365;164;658;150;69", "wc_questions": "1;9;3;57;205", "wc_review": "453;226;791;317;379", "wc_reply_reviewers": "0;0;0;0;0", "wc_reply_authors": "0;0;0;0;0", "reply_reviewers": "0;0;0;0;0", "reply_authors": "0;0;0;0;0", "rating_avg": [ 2.2, 0.9797958971132712 ], "confidence_avg": [ 4.2, 0.7483314773547882 ], "soundness_avg": [ 1.6, 0.8 ], "contribution_avg": [ 1.6, 0.4898979485566356 ], "presentation_avg": [ 1.6, 0.4898979485566356 ], "wc_summary_avg": [ 54.4, 31.733893552477927 ], "wc_strengths_avg": [ 42.6, 20.0059991002699 ], "wc_weaknesses_avg": [ 281.2, 212.12204034470346 ], "wc_questions_avg": [ 55.0, 77.76888838089432 ], "wc_review_avg": [ 433.2, 193.79618159293025 ], "wc_reply_reviewers_avg": [ 0, 0 ], 
"wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 7, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": -0.3273268353539886, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:AHhXA_niAW4J:scholar.google.com/&scioq=PDE-Diffusion:+Physic+guided+diffusion+model+for+solving+partial+derivative+equations&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;0;0;0;0;0", "aff_unique_norm": "Beihang University", "aff_unique_dep": "", "aff_unique_url": "http://www.buaa.edu.cn/", "aff_unique_abbr": "BUAA", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "China" }, { "id": "3t57X1Fvaf", "title": "Learning Graph Representation for Model Ensemble", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "We introduce, LGR-ME (Learning Graph Representation for Model Ensemble), a groundbreaking approach within the domain of general-purpose learning systems. Its primary focal point is to establish a foundational framework that facilitates self-adaptation and versatility in the ever-evolving landscape of emerging machine learning tasks. Despite the strides made in machine learning, it has yet to reach the adaptive and all-encompassing cognitive prowess demonstrated by biological learning systems. This discrepancy is particularly pronounced in the sphere of replicating learning representations and mastering a diverse spectrum of general-purpose learning algorithms. Our proposition entails a graph-centered representation of machine learning models. This representation operates on a graph composed of models, where the interconnections among akin models are established based on model specifications and their corresponding performances. In pursuit of this representation, we employ a graph neural network to undergo training. In this aspect, we present a novel method through the utilization of the top $k$ maximum spanning trees. This encoding is then subjected to training by a meta-model that minimizes a newly devised loss function. This combined loss function effectively accounts for both Diversity and Accuracy. Furthermore, we provide a theoretical examination of both the graph encoding algorithm and the newly introduced loss function. This advanced training process engenders an understanding of the intricate interdependencies and correlations existing among the model ensemble. The acquired features are subsequently harnessed to generate the ultimate output for the initial task at hand. By means of extensive empirical comparisons, we showcase the efficacy of LGR-ME in contrast to solutions predicated on ensemble pruning techniques (additional details can be found in the Appendix).", "keywords": "Model Ensemble;Graph Representation;Graph Convolution Neural Network", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/22a77cee1bc7119f52f245ba6c1bdc83c9e9bdf7.zip", "author": "Nassim Belmecheri;Youcef Djenouri;Philip S. 
Yu", "authorids": "~Nassim_Belmecheri1;~Youcef_Djenouri1;~Philip_S._Yu1", "gender": "M;M;M", "homepage": "https://www.simula.no/people/nassim;https://sites.google.com/site/youcefdjenouri/;https://cs.uic.edu/profiles/philip-yu/", "dblp": "315/2623.html;;y/PhilipSYu", "google_scholar": "VccEbq4AAAAJ;;D0lL1r0AAAAJ", "orcid": ";;0000-0002-3491-5968", "linkedin": ";;", "or_profile": "~Nassim_Belmecheri1;~Youcef_Djenouri1;~Philip_S._Yu1", "aff": "Simula Research Laboratory;Norwegian Research Center;University of Illinois Chicago", "aff_domain": "simula.no;norceresearch.no;uic.edu", "position": "Postdoc;Principal Researcher;Full Professor", "bibtex": "@misc{\nbelmecheri2024learning,\ntitle={Learning Graph Representation for Model Ensemble},\nauthor={Nassim Belmecheri and Youcef Djenouri and Philip S. Yu},\nyear={2024},\nurl={https://openreview.net/forum?id=3t57X1Fvaf}\n}", "github": "", "project": "", "reviewers": "3xiQ;oYx9;eLAm;WLfx", "site": "https://openreview.net/forum?id=3t57X1Fvaf", "pdf_size": 997391, "rating": "1;1;1;3", "confidence": "5;3;3;4", "soundness": "1;2;1;2", "contribution": "1;1;1;2", "presentation": "1;1;2;1", "wc_summary": "95;81;52;75", "wc_strengths": "63;9;20;31", "wc_weaknesses": "431;110;150;352", "wc_questions": "73;32;10;143", "wc_review": "662;232;232;601", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 1.5, 0.8660254037844386 ], "confidence_avg": [ 3.75, 0.82915619758885 ], "soundness_avg": [ 1.5, 0.5 ], "contribution_avg": [ 1.25, 0.4330127018922193 ], "presentation_avg": [ 1.25, 0.4330127018922193 ], "wc_summary_avg": [ 75.75, 15.514106484100203 ], "wc_strengths_avg": [ 30.75, 20.17888748172208 ], "wc_weaknesses_avg": [ 260.75, 134.44585341318637 ], "wc_questions_avg": [ 64.5, 50.64829710858994 ], "wc_review_avg": [ 431.75, 200.91089442835099 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.17407765595569782, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:jHQx2Od6haQJ:scholar.google.com/&scioq=Learning+Graph+Representation+for+Model+Ensemble&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;1;2", "aff_unique_norm": "Simula Research Laboratory;Norwegian Research Center;University of Illinois at Chicago", "aff_unique_dep": ";;", "aff_unique_url": "https://www.simula.no;;https://www.uic.edu", "aff_unique_abbr": "Simula;;UIC", "aff_campus_unique_index": "1", "aff_campus_unique": ";Chicago", "aff_country_unique_index": "0;0;1", "aff_country_unique": "Norway;United States" }, { "title": "Generative Learning for Solving Non-Convex Problem with Multi-Valued Input-Solution Mapping", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19491", "id": "3tM1l5tSbv", "author_site": "Enming Liang, Minghua Chen", "tldr": "", "abstract": "By employing neural networks (NN) to learn input-solution mappings and passing a new input through the learned mapping to obtain a solution instantly, recent studies have shown remarkable speed improvements over iterative algorithms for solving optimization problems. Meanwhile, they also highlight methodological challenges to be addressed. In particular, general non-convex problems often present multiple optimal solutions for identical inputs, signifying a complex, multi-valued input-solution mapping. 
Conventional learning techniques, primarily tailored to learn single-valued mappings, struggle to train NNs to accurately decipher multi-valued ones, leading to inferior solutions. We address this fundamental issue by developing a generative learning approach using a rectified flow (RectFlow) model built upon ordinary differential equations. In contrast to learning input-solution mapping, we learn the mapping from input to solution distribution, exploiting the universal approximation capability of the RectFlow model. Upon receiving a new input, we employ the trained RectFlow model to sample high-quality solutions from the input-dependent distribution it has learned. Our approach outperforms conceivable GAN and Diffusion models in terms of training stability and run-time complexity. We provide a detailed characterization of the optimality loss and runtime complexity associated with our generative approach. Simulation results for solving non-convex problems show that our method achieves significantly better solution optimality than recent NN schemes, with comparable feasibility and speedup performance.", "keywords": "Non-convex optimization;Multi-valued solution mapping;Generative model;Ordinary differential equation;Supervised learning", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Enming Liang;Minghua Chen", "authorids": "~Enming_Liang1;~Minghua_Chen1", "gender": "M;M", "homepage": "https://emliang.github.io/;https://www.mhchen.com", "dblp": ";12/4395-1.html", "google_scholar": "https://scholar.google.com.sg/citations?user=Todfu6AAAAAJ;https://scholar.google.com.hk/citations?user=WzEQ9QwAAAAJ", "orcid": ";0000-0003-4763-0037", "linkedin": "enming-liang-95b5b216a/;", "or_profile": "~Enming_Liang1;~Minghua_Chen1", "aff": "City University of Hong Kong;City University of Hong Kong", "aff_domain": "cityu.edu.hk;cityu.edu.hk", "position": "PhD student;Full Professor", "bibtex": "@inproceedings{\nliang2024generative,\ntitle={Generative Learning for Solving Non-Convex Problem with Multi-Valued Input-Solution Mapping},\nauthor={Enming Liang and Minghua Chen},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=3tM1l5tSbv}\n}", "github": "", "project": "", "reviewers": "rFky;GsRT;85JM;ibgc", "pdf_size": 6099014, "rating": "5;6;8;8", "confidence": "3;3;4;4", "soundness": "2;3;4;4", "contribution": "2;3;4;4", "presentation": "3;2;4;3", "wc_summary": "54;95;218;21", "wc_strengths": "46;71;94;53", "wc_weaknesses": "193;127;91;94", "wc_questions": "118;49;64;66", "wc_review": "411;342;467;234", "wc_reply_reviewers": "43;41;82;0", "wc_reply_authors": "2414;1488;936;675", "reply_reviewers": "1;1;1;0", "reply_authors": "7;5;3;2", "rating_avg": [ 6.75, 1.299038105676658 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 3.25, 0.82915619758885 ], "contribution_avg": [ 3.25, 0.82915619758885 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 97.0, 74.61568199782134 ], "wc_strengths_avg": [ 66.0, 18.560711193270585 ], "wc_weaknesses_avg": [ 126.25, 41.04494487753638 ], "wc_questions_avg": [ 74.25, 26.099568961957974 ], "wc_review_avg": [ 363.5, 86.89217456134931 ], "wc_reply_reviewers_avg": [ 41.5, 29.004310024546353 ], "wc_reply_authors_avg": [ 1378.25, 666.1397657398934 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 4.25, 1.920286436967152 ], "replies_avg": [ 27, 0 ], "authors#_avg": [ 2, 0 ], 
"corr_rating_confidence": 0.9622504486493761, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=16103035139839675510&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=3tM1l5tSbv", "pdf": "https://openreview.net/pdf?id=3tM1l5tSbv", "email": "cityu.edu.hk;cityu.edu.hk", "author_num": 2, "aff_unique_index": "0;0", "aff_unique_norm": "City University of Hong Kong", "aff_unique_dep": "", "aff_unique_url": "https://www.cityu.edu.hk", "aff_unique_abbr": "CityU", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Hong Kong SAR", "aff_country_unique_index": "0;0", "aff_country_unique": "China" }, { "id": "3tjTJeXyA7", "title": "Revitalizing Channel-dimension Fourier Transform for Image Enhancement", "track": "main", "status": "Reject", "tldr": "", "abstract": "Exploring the global representations of Fourier transform for image enhancement has become an alternative and made significant advancements. However, previous works only operate in the spatial dimensional, overlooking the potential of the channel dimension that inherently possesses discriminative features. In this work, we propose a fresh perspective, channel-dimension Fourier transform, for image enhancement. Our designs are simple yet effective and comprise three straightforward steps: applying the Fourier transform to the channel dimension to obtain channel-wise Fourier domain features, performing a channel-wise transformation on both its amplitude and phase components, and then reverting back to the spatial domain. Following the above rules, we offer three alternative implementation formats of the channel transform in different operational spaces, performing operations in 1) the global vector with higher orders; 2) the global vector with channel groups; and 3) the Fourier features derived from spatial-based Fourier transform. The above core designs, as general operators, can be seamlessly integrated with enhancement networks, achieving remarkable gains and building efficient models. Through extensive experiments on multiple image enhancement tasks, like low-light image enhancement, exposure correction, SDR2HDR translation, and underwater image enhancement, our designs exhibit consistent performance gains. 
The code will be publicly available.", "keywords": "Image Enhancement;Fourier transform;Image Restoration", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Jie Huang;Man Zhou;Dong Li;Bing Li;Chun-Le Guo;Chongyi Li", "authorids": "~Jie_Huang4;~Man_Zhou4;~Dong_Li15;~Bing_Li16;~Chun-Le_Guo1;~Chongyi_Li1", "gender": "M;;M;M;;", "homepage": ";;https://github.com/universe-six;https://www.ustc.edu.cn/;;", "dblp": ";;;;;", "google_scholar": "https://scholar.google.com/citations?hl=zh-CN;;LdfwzzQAAAAJ;;;", "orcid": "0000-0002-3518-3404;;0000-0002-7038-7402;;;", "linkedin": ";;;;;", "or_profile": "~Jie_Huang4;~Man_Zhou4;~Dong_Li15;~Bing_Li16;~Chun-Le_Guo1;~Chongyi_Li1", "aff": "University of Science and Technology of China;;University of Science and Technology of China;University of Science and Technology of China;;", "aff_domain": "ustc.edu.cn;;ustc.edu.cn;ustc.edu.cn;;", "position": "PhD student;;PhD student;MS student;;", "bibtex": "@misc{\nhuang2024revitalizing,\ntitle={Revitalizing Channel-dimension Fourier Transform for Image Enhancement},\nauthor={Jie Huang and Man Zhou and Dong Li and Bing Li and Chun-Le Guo and Chongyi Li},\nyear={2024},\nurl={https://openreview.net/forum?id=3tjTJeXyA7}\n}", "github": "", "project": "", "reviewers": "WFwC;6DxW;MiY2;Tiry", "site": "https://openreview.net/forum?id=3tjTJeXyA7", "pdf_size": 6754444, "rating": "6;6;8;10", "confidence": "5;5;4;5", "soundness": "4;4;4;3", "contribution": "4;3;3;3", "presentation": "3;3;3;3", "wc_summary": "47;57;53;70", "wc_strengths": "88;69;90;50", "wc_weaknesses": "278;318;91;33", "wc_questions": "50;5;31;20", "wc_review": "463;449;265;173", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "827;865;704;301", "reply_reviewers": "0;0;0;0", "reply_authors": "2;2;1;1", "rating_avg": [ 7.5, 1.6583123951777 ], "confidence_avg": [ 4.75, 0.4330127018922193 ], "soundness_avg": [ 3.75, 0.4330127018922193 ], "contribution_avg": [ 3.25, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 56.75, 8.437268515343103 ], "wc_strengths_avg": [ 74.25, 16.223054582907622 ], "wc_weaknesses_avg": [ 180.0, 120.60058042978069 ], "wc_questions_avg": [ 26.5, 16.408839081421938 ], "wc_review_avg": [ 337.5, 122.9827223637532 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 674.25, 223.56137300526672 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.17407765595569782, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=16518628138777599967&as_sdt=20000005&sciodt=0,21&hl=en", "gs_version_total": 0, "aff_unique_index": "0;0;0", "aff_unique_norm": "University of Science and Technology of China", "aff_unique_dep": "", "aff_unique_url": "http://www.ustc.edu.cn", "aff_unique_abbr": "USTC", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "China" }, { "id": "3uITarEQ7p", "title": "Differentially Private Model Compression via Selective Pretraining", "track": "main", "status": "Reject", "tldr": "", "abstract": "Suppose we want to train text prediction models in email clients or word processors. \nThese models, which serve billions of predictions per hour, must preserve the privacy of user data and adhere to specific model size constraints to meet memory, inference time requirements, and to reduce inference cost. 
\nBuilding small, fast, and private domain-specific language models is a thriving\narea of research.\nIn this work, we show that a careful pre-training on a {\\em subset} of the public dataset that is guided by the private dataset is crucial to train small DP language models.\nOn standard benchmarks, models trained with our new framework achieve state-of-the-art performance, improving upon all the baselines from the literature.\n\nBesides performance improvements, our framework also shows that with careful pre-training and private fine-tuning, smaller models can match the performance of much larger models that do not have access to private data, highlighting the promise of private learning as a tool for model compression and efficiency.", "keywords": "differentially private deep learning;model compression", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/613fcfb60b224cba892cc66ecd8b5e96d87bcaf7.zip", "author": "Janardhan Kulkarni;Da Yu;Sivakanth Gopi;Zinan Lin;Saurabh Naik;Tomasz Lukasz Religa;Jian Yin;Huishuai Zhang", "authorids": "~Janardhan_Kulkarni2;~Da_Yu1;~Sivakanth_Gopi1;~Zinan_Lin1;~Saurabh_Naik1;~Tomasz_Lukasz_Religa1;~Jian_Yin3;~Huishuai_Zhang3", "gender": "M;M;M;M;M;;M;M", "homepage": ";;https://aka.ms/sigopi;https://zinanlin.me/;;http://www.cam.ac.uk;http://sai.sysu.edu.cn/teacher/teacher01/1385356.htm;https://huishuai-git.github.io", "dblp": "54/1978;48/8545;123/7803.html;64/237-1;;;95/578-1;144/7537", "google_scholar": "_fxnybwAAAAJ;FcRGdiwAAAAJ;bYhGFrwAAAAJ;67nE-wQ_g_cC;;;;w1srHyIAAAAJ", "orcid": ";;;;;;;", "linkedin": ";;sivakanthgopi/;;saurabh-naik-9750b0b/;;;", "or_profile": "~Janardhan_Kulkarni2;~Da_Yu1;~Sivakanth_Gopi1;~Zinan_Lin1;~Saurabh_Naik1;~Tomasz_Lukasz_Religa1;~Jian_Yin3;~Huishuai_Zhang2", "aff": "Microsoft Research, Redmond;SUN YAT-SEN UNIVERSITY;Microsoft Research;Microsoft;;;SUN YAT-SEN UNIVERSITY;Peking University", "aff_domain": "microsoft.com;sysu.edu.cn;microsoft.com;microsoft.com;;;sysu.edu.cn;pku.edu.cn", "position": "Researcher;PhD student;Senior Researcher;Senior Researcher;;;Full Professor;Assistant Professor", "bibtex": "@misc{\nkulkarni2024differentially,\ntitle={Differentially Private Model Compression via Selective Pretraining},\nauthor={Janardhan Kulkarni and Da Yu and Sivakanth Gopi and Zinan Lin and Saurabh Naik and Tomasz Lukasz Religa and Jian Yin and Huishuai Zhang},\nyear={2024},\nurl={https://openreview.net/forum?id=3uITarEQ7p}\n}", "github": "", "project": "", "reviewers": "3s2h;kdmU;CqKu;mFxj", "site": "https://openreview.net/forum?id=3uITarEQ7p", "pdf_size": 7505163, "rating": "3;5;6;8", "confidence": "4;4;4;4", "soundness": "2;3;3;4", "contribution": "1;2;3;4", "presentation": "2;2;4;4", "wc_summary": "126;96;189;228", "wc_strengths": "58;47;322;122", "wc_weaknesses": "222;134;206;331", "wc_questions": "53;1;256;186", "wc_review": "459;278;973;867", "wc_reply_reviewers": "0;0;34;20", "wc_reply_authors": "1709;770;1111;696", "reply_reviewers": "0;0;1;1", "reply_authors": "3;1;2;1", "rating_avg": [ 5.5, 1.8027756377319946 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 2.5, 1.118033988749895 ], "presentation_avg": [ 3.0, 1.0 ], "wc_summary_avg": [ 159.75, 51.760868423935854 ], "wc_strengths_avg": [ 137.25, 110.44314148012995 ], "wc_weaknesses_avg": [ 223.25, 70.48891756865046 ], "wc_questions_avg": [ 124.0, 101.78162899069753 ], "wc_review_avg": [ 644.25, 285.54804762071126 ], "wc_reply_reviewers_avg": [ 13.5, 
14.378803844548406 ], "wc_reply_authors_avg": [ 1071.5, 399.95906040493696 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.75, 0.82915619758885 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:ALMmwCkMmQEJ:scholar.google.com/&scioq=Differentially+Private+Model+Compression+via+Selective+Pretraining&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1;0;0;1;2", "aff_unique_norm": "Microsoft;Sun Yat-sen University;Peking University", "aff_unique_dep": "Microsoft Research;;", "aff_unique_url": "https://www.microsoft.com/en-us/research;http://www.sysu.edu.cn;http://www.pku.edu.cn", "aff_unique_abbr": "MSR;SYSU;Peking U", "aff_campus_unique_index": "0", "aff_campus_unique": "Redmond;", "aff_country_unique_index": "0;1;0;0;1;1", "aff_country_unique": "United States;China" }, { "id": "3ucOvX8WVu", "title": "LoFT: Local Proxy Fine-tuning Improves Transferability to Large Language Model Attacks", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "It has been shown that Large Language Model (LLM) alignments can be circumvented by appending specially crafted attack suffixes with harmful queries to elicit harmful responses. To conduct attacks against private target models whose characterization is unknown, public models can be used as proxies to fashion the attack, with successful attacks being transferred from public proxies to private target models. The success rate of attack depends on how closely the proxy model approximates the private model. We hypothesize that for attacks to be transferrable, it is sufficient if the proxy can approximate the target model in the neighborhood of the harmful query. Therefore, in this paper, we propose \\emph{Local Fine-Tuning (LoFT)}, i.e., fine-tuning proxy models on similar queries that lie in the lexico-semantic neighborhood of harmful queries to decrease the divergence between the proxy and target models. First, we demonstrate three approaches to prompt private target models to obtain similar queries given harmful queries. Next, we obtain data for local fine-tuning by eliciting responses from target models for the generated similar queries. Then, we optimize attack suffixes to generate attack prompts and evaluate the impact of our local fine-tuning on the attack's success rate. 
Experiments show that local fine-tuning of proxy models improves attack transferability and increases attack success rate by $39\\%$, $7\\%$, and $0.5\\%$ absolute on target models ChatGPT, GPT-4, and Claude respectively.", "keywords": "adversarial attacks;large languages model;alignment;fine-tuning", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/968a737950b697cd65c37bdff5fc83e6f1f6e7ca.pdf", "author": "Muhammad A Shah;Roshan Sharma;Hira Dhamyal;Ankit Shah;Dareen Safar Alharthi;Massa Baali;Hazim Bukhari;Joseph Konan;Soham Deshmukh;Bhiksha Raj;Rita Singh", "authorids": "~Muhammad_A_Shah1;~Roshan_Sharma1;~Hira_Dhamyal1;~Ankit_Shah1;~Dareen_Safar_Alharthi1;~Massa_Baali1;~Hazim_Bukhari1;~Joseph_Konan1;~Soham_Deshmukh1;~Bhiksha_Raj1;~Rita_Singh1", "gender": ";M;;M;F;F;M;;M;M;F", "homepage": ";https://roshansh-cmu.github.io/;https://www.linkedin.com/in/hiradhamyal/;https://ankitshah009.github.io/;https://dareenharthi.github.io/;https://www.linkedin.com/in/massa-baali-37ba9386;;;https://soham97.github.io;https://www.cs.cmu.edu/directory/bhikshar/;http://mlsp.cs.cmu.edu/people/rsingh/index.html", "dblp": "142/5481;263/9903;;04/1935-1.html;;;;306/1680.html;241/9651;60/3996;", "google_scholar": "74MwzTcAAAAJ;yZ4QLqsAAAAJ;;https://scholar.google.co.in/citations?user=TqG1H4cAAAAJ;jBtEAgIAAAAJ;;;;MasiEogAAAAJ;;", "orcid": ";;;0000-0002-8838-5421;;;;;;;", "linkedin": ";;;ankpsh01/;;;hazim-bukhari;;sdeshmuk;;", "or_profile": "~Muhammad_A_Shah1;~Roshan_Sharma1;~Hira_Dhamyal1;~Ankit_Shah1;~Dareen_Safar_Alharthi1;~Massa_Baali1;~Hazim_Bukhari1;~Joseph_Konan1;~Soham_Deshmukh1;~Bhiksha_Raj1;~Rita_Singh1", "aff": "Carnegie Mellon University;Google;Carnegie Mellon University;Accenture;School of Computer Science, Carnegie Mellon University;Carnegie Mellon University;Carnegie Mellon University;Carnegie Mellon University;Microsoft;Mohamed bin Zayed University of Artificial Intelligence;School of Computer Science, Carnegie Mellon University", "aff_domain": "cmu.edu;google.com;cmu.edu;accenture.com;cs.cmu.edu;cmu.edu;cmu.edu;andrew.cmu.edu;microsoft.com;mbzuai.ac.ae;cs.cmu.edu", "position": "PhD student;Researcher;PhD student;Principal Researcher;MS student;PhD student;Researcher;PhD student;Researcher;Full Professor;Research Professor", "bibtex": "@misc{\nshah2024loft,\ntitle={Lo{FT}: Local Proxy Fine-tuning Improves Transferability to Large Language Model Attacks},\nauthor={Muhammad A Shah and Roshan Sharma and Hira Dhamyal and Ankit Shah and Dareen Safar Alharthi and Massa Baali and Hazim Bukhari and Joseph Konan and Soham Deshmukh and Bhiksha Raj and Rita Singh},\nyear={2024},\nurl={https://openreview.net/forum?id=3ucOvX8WVu}\n}", "github": "", "project": "", "reviewers": "LSRN;A2bi;a6tE;5Wu7", "site": "https://openreview.net/forum?id=3ucOvX8WVu", "pdf_size": 2524526, "rating": "3;3;5;5", "confidence": "2;4;3;4", "soundness": "2;2;3;2", "contribution": "2;2;2;2", "presentation": "2;2;2;3", "wc_summary": "32;121;117;80", "wc_strengths": "18;32;57;68", "wc_weaknesses": "12;21;164;117", "wc_questions": "696;158;40;23", "wc_review": "758;332;378;288", "wc_reply_reviewers": "0;228;18;38", "wc_reply_authors": "1378;1156;1187;757", "reply_reviewers": "0;3;1;1", "reply_authors": "3;3;3;2", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 3.25, 0.82915619758885 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 87.5, 35.80851853958776 ], 
"wc_strengths_avg": [ 43.75, 19.778460506318485 ], "wc_weaknesses_avg": [ 78.5, 64.26702109169211 ], "wc_questions_avg": [ 229.25, 274.44796865708446 ], "wc_review_avg": [ 439.0, 186.90371852908652 ], "wc_reply_reviewers_avg": [ 71.0, 91.63514609580758 ], "wc_reply_authors_avg": [ 1119.5, 225.89654711836567 ], "reply_reviewers_avg": [ 1.25, 1.0897247358851685 ], "reply_authors_avg": [ 2.75, 0.4330127018922193 ], "replies_avg": [ 23, 0 ], "authors#_avg": [ 11, 0 ], "corr_rating_confidence": 0.30151134457776363, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:Mitusnqm_SsJ:scholar.google.com/&scioq=LoFT:+Local+Proxy+Fine-tuning+Improves+Transferability+to+Large+Language+Model+Attacks&hl=en&as_sdt=0,14", "gs_version_total": 0, "aff_unique_index": "0;1;0;2;0;0;0;0;3;4;0", "aff_unique_norm": "Carnegie Mellon University;Google;Accenture;Microsoft;Mohamed bin Zayed University of Artificial Intelligence", "aff_unique_dep": ";Google;;Microsoft Corporation;", "aff_unique_url": "https://www.cmu.edu;https://www.google.com;https://www.accenture.com;https://www.microsoft.com;https://mbzuai.ac.ae", "aff_unique_abbr": "CMU;Google;Accenture;Microsoft;MBZUAI", "aff_campus_unique_index": "1;2;2", "aff_campus_unique": ";Mountain View;Pittsburgh", "aff_country_unique_index": "0;0;0;0;0;0;0;0;0;1;0", "aff_country_unique": "United States;United Arab Emirates" }, { "id": "3ukT8oODY0", "title": "Careful at Estimation and Bold at Exploration for Deterministic Policy Gradient Algorithm", "track": "main", "status": "Reject", "tldr": "", "abstract": "Exploration strategies within continuous action spaces often adopt heuristic approaches due to the challenge of dealing with an infinite array of possible actions. Previous research has established the advantages of policy-based exploration in the context of deterministic policy reinforcement learning (DPRL) for continuous action spaces. However, policy-based exploration in DPRL presents two notable issues: unguided exploration and exclusive policy, both stemming from the soft policy learning schema, which is famous for DPRL policy learning. In response to these challenges, we introduce a novel approach called Bold Actor Conservative Critic (BACC), which leverages Q-value to guide out-of-distribution exploration. We extend the dynamic Boltzmann softmax update theorem to the double Q function framework, incorporating modified weights and Q values. This extension enables us to derive an exploration policy directly for policy exploration, which is constructed with the modified weights. Furthermore, our theorem offers substantial support for utilizing the minimum Q value as an intermediate step in policy gradient computation for policy optimization. In practice, we construct such an exploration policy with a limited set of actions and train a parameterized policy by minimizing the expected KL-divergence between the target policy and a policy constructed based on the minimum Q value. To evaluate the effectiveness of our approach, we conduct experiments on the Mujoco and Roboschool benchmarks, showcasing superior performance compared to previous state-of-the-art methods across a range of environments. 
Notably, our method excels in the highly complex Humanoid environment, demonstrating its efficacy in tackling challenging continuous action space exploration problems.", "keywords": "exploration;actor critic;out of distribution;deterministic policy", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/e127fb9554acba5b34674796193b277f12189d82.zip", "author": "Xing Chen;Yijun Liu;Shutong Zhang;Siyuan Guo;Zhaogeng Liu;Yu Jin;haiyin piao;Hechang Chen;Hengshuai Yao;Yi Chang", "authorids": "~Xing_Chen2;~Yijun_Liu5;~Shutong_Zhang3;~Siyuan_Guo2;~Zhaogeng_Liu1;~Yu_Jin4;~haiyin_piao1;~Hechang_Chen2;~Hengshuai_Yao2;~Yi_Chang4", "gender": "M;F;;M;M;M;M;M;;M", "homepage": "https://github.com/raincchio;;;;https://github.com/Peter7777777;;https://www.researchgate.net/profile/Haiyin-Piao;http://sai.jlu.edu.cn/info/1094/2387.htm;;http://www.yichang-cs.com", "dblp": ";;;244/5858;264/5265;https://dblp.dagstuhl.de/;269/4228.html;145/1142;;02/5438.html", "google_scholar": ";;;JE1Yco4AAAAJ;https://scholar.google.com/citations?hl=zh-CN;https://scholar.google.com/citations?view_op=list_works;;EezEcbgAAAAJ;;https://scholar.google.com.hk/citations?user=drEkR50AAAAJ", "orcid": "0000-0001-5685-8506;0000-0001-7752-1611;;0000-0002-9304-5405;0000-0002-3958-8740;;;;;0000-0003-2697-8093", "linkedin": ";;;;;;;;;", "or_profile": "~Xing_Chen2;~Yijun_Liu5;~Shutong_Zhang3;~Siyuan_Guo2;~Zhaogeng_Liu1;~Yu_Jin4;~haiyin_piao1;~Hechang_Chen2;~Hengshuai_Yao2;~Yi_Chang4", "aff": "Jilin University;Jilin University;;Jilin University;Jilin University;;;Jilin University;;Jilin University, China", "aff_domain": "jlu.edu.cn;jlu.edu.cn;;jlu.edu.cn;jlu.edu.cn;;;jlu.edu.cn;;jlu.edu.cn", "position": "PhD student;PhD student;;PhD student;PhD student;;;Associate Professor;;Full Professor", "bibtex": "@misc{\nchen2024careful,\ntitle={Careful at Estimation and Bold at Exploration for Deterministic Policy Gradient Algorithm},\nauthor={Xing Chen and Yijun Liu and Shutong Zhang and Siyuan Guo and Zhaogeng Liu and Yu Jin and haiyin piao and Hechang Chen and Hengshuai Yao and Yi Chang},\nyear={2024},\nurl={https://openreview.net/forum?id=3ukT8oODY0}\n}", "github": "", "project": "", "reviewers": "3zdT;4MmP;vPPz", "site": "https://openreview.net/forum?id=3ukT8oODY0", "pdf_size": 8156725, "rating": "5;5;6", "confidence": "3;3;4", "soundness": "2;3;3", "contribution": "2;2;3", "presentation": "2;3;3", "wc_summary": "103;76;70", "wc_strengths": "44;32;32", "wc_weaknesses": "436;60;64", "wc_questions": "6;119;155", "wc_review": "589;287;321", "wc_reply_reviewers": "141;0;16", "wc_reply_authors": "790;464;375", "reply_reviewers": "1;0;1", "reply_authors": "2;1;1", "rating_avg": [ 5.333333333333333, 0.4714045207910317 ], "confidence_avg": [ 3.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 83.0, 14.352700094407323 ], "wc_strengths_avg": [ 36.0, 5.656854249492381 ], "wc_weaknesses_avg": [ 186.66666666666666, 176.31285325302358 ], "wc_questions_avg": [ 93.33333333333333, 63.47878035655345 ], "wc_review_avg": [ 399.0, 135.06541624955912 ], "wc_reply_reviewers_avg": [ 52.333333333333336, 63.03614483417871 ], "wc_reply_authors_avg": [ 543.0, 178.39469349357526 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 1.3333333333333333, 0.4714045207910317 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 
10, 0 ], "corr_rating_confidence": 0.9999999999999997, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:G621eedBhCQJ:scholar.google.com/&scioq=Careful+at+Estimation+and+Bold+at+Exploration+for+Deterministic+Policy+Gradient+Algorithm&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;0;0;0;0", "aff_unique_norm": "Jilin University", "aff_unique_dep": "", "aff_unique_url": "http://www.jlu.edu.cn", "aff_unique_abbr": "JLU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "China" }, { "id": "3vHWAGV9Wj", "title": "Estimating Performative Effects in Dynamical Systems: the advantage of sequential observations", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Regulators and academics are increasingly interested in the causal effect that algorithmic actions of a digital platform have on consumption, a quantity in the machine learning literature termed the performative effect. In this work, we first show how isolated (non-sequential) observations are not enough to identify the performative effect of interest in general, then we show how sequential observations overcome these limitations. The key novelty of our approach is to explicitly model the dynamics of consumption over time, viewing the platform as a controller acting on a dynamical system. From this dynamical systems perspective, we are able to show that exogenous variation in consumption and appropriately responsive algorithmic control actions are sufficient for identifying the performative effect of interest. Our results illustrate the fruitful interplay of control theory and causal inference, which we illustrate with examples from econometrics, macroeconomics, and machine learning.", "keywords": "performativity;dynamical systems;causal inference;control theory", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "Gary Cheng;Moritz Hardt;Celestine Mendler-D\u00fcnner", "authorids": "~Gary_Cheng2;~Moritz_Hardt1;~Celestine_Mendler-D\u00fcnner1", "gender": "M;Not Specified;", "homepage": "http://garycheng.me;http://mrtz.org/;http://celestine.ai/", "dblp": ";26/4683;176/5511", "google_scholar": "qArWV_wAAAAJ;adnTgaAAAAAJ;UqtDdZUAAAAJ", "orcid": ";;", "linkedin": ";;", "or_profile": "~Gary_Cheng2;~Moritz_Hardt1;~Celestine_Mendler-D\u00fcnner1", "aff": "Stanford University;Max-Planck-Institute for Intelligent Systems, Max-Planck Institute;Max Planck Institute for Intelligent Systems", "aff_domain": "stanford.edu;is.mpg.de;tuebingen.mpg.de", "position": "PhD student;Principal Researcher;Group Lead", "bibtex": "@misc{\ncheng2024estimating,\ntitle={Estimating Performative Effects in Dynamical Systems: the advantage of sequential observations},\nauthor={Gary Cheng and Moritz Hardt and Celestine Mendler-D{\\\"u}nner},\nyear={2024},\nurl={https://openreview.net/forum?id=3vHWAGV9Wj}\n}", "github": "", "project": "", "reviewers": "", "site": "https://openreview.net/forum?id=3vHWAGV9Wj", "pdf_size": 0, "rating": "", "confidence": "", "soundness": "", "contribution": "", "presentation": "", "wc_summary": "", "wc_strengths": "", "wc_weaknesses": "", "wc_questions": "", "wc_review": "", "wc_reply_reviewers": "", "wc_reply_authors": "", "reply_reviewers": "", "reply_authors": "", "rating_avg": [ 0, 0 ], "confidence_avg": [ 0, 0 ], "soundness_avg": [ 0, 0 ], "contribution_avg": [ 0, 0 ], "presentation_avg": [ 0, 0 ], "wc_summary_avg": [ 0, 0 ], 
"wc_strengths_avg": [ 0, 0 ], "wc_weaknesses_avg": [ 0, 0 ], "wc_questions_avg": [ 0, 0 ], "wc_review_avg": [ 0, 0 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 0, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:DTDSoxXxFbEJ:scholar.google.com/&scioq=Estimating+Performative+Effects+in+Dynamical+Systems:+the+advantage+of+sequential+observations&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1;2", "aff_unique_norm": "Stanford University;Max-Planck-Institute for Intelligent Systems;Max Planck Institute for Intelligent Systems", "aff_unique_dep": ";Intelligent Systems;Intelligent Systems", "aff_unique_url": "https://www.stanford.edu;https://www.mpi-is.mpg.de;https://www.mpi-is.mpg.de", "aff_unique_abbr": "Stanford;MPI-IS;MPI-IS", "aff_campus_unique_index": "0", "aff_campus_unique": "Stanford;", "aff_country_unique_index": "0;1;1", "aff_country_unique": "United States;Germany" }, { "title": "The Generalization Gap in Offline Reinforcement Learning", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19490", "id": "3w6xuXDOdY", "author_site": "Ishita Mediratta, Qingfei You, Minqi Jiang, Roberta Raileanu", "tldr": "", "abstract": "Despite recent progress in offline learning, these methods are still trained and tested on the same environment. In this paper, we compare the generalization abilities of widely used online and offline learning methods such as online reinforcement learning (RL), offline RL, sequence modeling, and behavioral cloning. Our experiments show that offline learning algorithms perform worse on new environments than online learning ones. We also introduce the first benchmark for evaluating generalization in offline learning, collecting datasets of varying sizes and skill-levels from Procgen (2D video games) and WebShop (e-commerce websites). The datasets contain trajectories for a limited number of game levels or natural language instructions and at test time, the agent has to generalize to new levels or instructions. Our experiments reveal that existing offline learning algorithms struggle to match the performance of online RL on both train and test environments. Behavioral cloning is a strong baseline, outperforming state-of-the-art offline RL and sequence modeling approaches when trained on data from multiple environments and tested on new ones. Finally, we find that increasing the diversity of the data, rather than its size, improves performance on new environments for all offline learning algorithms. 
Our study demonstrates the limited generalization of current offline learning algorithms highlighting the need for more research in this area.", "keywords": "Offline RL;Dataset;Generalization;Procgen;Webshop", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Ishita Mediratta;Qingfei You;Minqi Jiang;Roberta Raileanu", "authorids": "~Ishita_Mediratta1;~Qingfei_You2;~Minqi_Jiang1;~Roberta_Raileanu2", "gender": "F;;M;F", "homepage": "https://ishita.io;;https://twitter.com/minqijiang;https://rraileanu.github.io/", "dblp": "289/7108;;270/7949;215/5579", "google_scholar": "hgaAO6QAAAAJ;;;9hVXpJ0AAAAJ", "orcid": ";;;", "linkedin": ";qingfeiyou/;minqi-jiang-585a6536/;roberta-raileanu-44b25660/", "or_profile": "~Ishita_Mediratta1;~Qingfei_You2;~Minqi_Jiang1;~Roberta_Raileanu1", "aff": "Meta AI;;Google;Meta Facebook", "aff_domain": "meta.com;;google.com;fb.com", "position": "Researcher;;Researcher;Researcher", "bibtex": "@inproceedings{\nmediratta2024the,\ntitle={The Generalization Gap in Offline Reinforcement Learning},\nauthor={Ishita Mediratta and Qingfei You and Minqi Jiang and Roberta Raileanu},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=3w6xuXDOdY}\n}", "github": "", "project": "", "reviewers": "qttr;4tcZ;HieC;f7uZ", "pdf_size": 2279286, "rating": "6;6;6;8", "confidence": "4;4;4;4", "soundness": "3;3;2;3", "contribution": "3;3;2;3", "presentation": "3;3;2;3", "wc_summary": "62;26;75;69", "wc_strengths": "60;47;44;149", "wc_weaknesses": "186;178;118;64", "wc_questions": "104;65;161;14", "wc_review": "412;316;398;296", "wc_reply_reviewers": "64;135;19;0", "wc_reply_authors": "1577;1690;774;764", "reply_reviewers": "1;1;1;0", "reply_authors": "4;4;3;2", "rating_avg": [ 6.5, 0.8660254037844386 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 58.0, 19.03943276465977 ], "wc_strengths_avg": [ 75.0, 43.14510400960925 ], "wc_weaknesses_avg": [ 136.5, 49.42418436352794 ], "wc_questions_avg": [ 86.0, 53.791263231123324 ], "wc_review_avg": [ 355.5, 50.2468904510518 ], "wc_reply_reviewers_avg": [ 54.5, 51.96392979750473 ], "wc_reply_authors_avg": [ 1201.25, 434.10676970072694 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 3.25, 0.82915619758885 ], "replies_avg": [ 23, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 17, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=16522965744672101615&as_sdt=5,48&sciodt=0,48&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=3w6xuXDOdY", "pdf": "https://openreview.net/pdf?id=3w6xuXDOdY", "email": "meta.com;;google.com;fb.com", "author_num": 4, "aff_unique_index": "0;1;0", "aff_unique_norm": "Meta;Google", "aff_unique_dep": "Meta AI;Google", "aff_unique_url": "https://meta.com;https://www.google.com", "aff_unique_abbr": "Meta;Google", "aff_campus_unique_index": "1", "aff_campus_unique": ";Mountain View", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "3wGi5m2YHY", "title": "FlowHash: Accelerating Audio Search with Balanced Hashing via Normalizing Flow", "track": "main", "status": "Reject", "tldr": "", "abstract": "Nearest neighbor search on context representation vectors is a formidable task due to challenges posed by high dimensionality, scalability issues, and 
potential noise within query vectors. Our novel approach leverages normalizing flow within a self-supervised learning framework to effectively tackle these challenges, specifically in the context of audio fingerprinting tasks. Audio fingerprinting systems incorporate two key components: audio encoding and indexing. The existing systems consider these components independently, resulting in suboptimal performance. Our approach optimizes the interplay between these components, facilitating the adaptation of vectors to the indexing structure. Additionally, we distribute vectors in the latent $\\mathbb{R}^K$ space using normalizing flow, resulting in balanced $K$-bit hash codes. This allows indexing vectors using a balanced hash table, where vectors are uniformly distributed across all possible $2^K$ hash buckets. This significantly accelerates retrieval, achieving speedups of up to 3$\\times$ compared to the Locality-Sensitive Hashing (LSH). We empirically demonstrate that our system is scalable, highly effective, and efficient in identifying short audio queries ($\\leq$2s), particularly at high noise and reverberation levels.", "keywords": "Audio fingerprinting;Indexing;Normalizing Flows;Information Retrieval;Self-supervised learning", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Anup Singh;Kris Demuynck;Vipul Arora", "authorids": "~Anup_Singh1;~Kris_Demuynck1;~Vipul_Arora1", "gender": "M;M;M", "homepage": ";;https://home.iitk.ac.in/~vipular", "dblp": ";49/603;", "google_scholar": ";;https://scholar.google.co.in/citations?user=SC9YYPAAAAAJ", "orcid": ";0000-0001-8525-7160;0000-0002-1207-1258", "linkedin": "anup-singh-a84a7476/;;", "or_profile": "~Anup_Singh1;~Kris_Demuynck1;~Vipul_Arora1", "aff": "Universiteit Gent;Universiteit Gent;IIT Kanpur", "aff_domain": "ugent.be;ugent.be;iitk.ac.in", "position": "PhD student;Assistant Professor;Associate Professor", "bibtex": "@misc{\nsingh2024flowhash,\ntitle={FlowHash: Accelerating Audio Search with Balanced Hashing via Normalizing Flow},\nauthor={Anup Singh and Kris Demuynck and Vipul Arora},\nyear={2024},\nurl={https://openreview.net/forum?id=3wGi5m2YHY}\n}", "github": "", "project": "", "reviewers": "q2gt;AxNq;p7bp", "site": "https://openreview.net/forum?id=3wGi5m2YHY", "pdf_size": 2028111, "rating": "3;3;5", "confidence": "4;4;4", "soundness": "2;3;3", "contribution": "1;2;3", "presentation": "2;2;4", "wc_summary": "39;70;103", "wc_strengths": "11;67;67", "wc_weaknesses": "346;289;179", "wc_questions": "1;90;95", "wc_review": "397;516;444", "wc_reply_reviewers": "13;49;19", "wc_reply_authors": "392;414;578", "reply_reviewers": "1;1;1", "reply_authors": "1;1;1", "rating_avg": [ 3.6666666666666665, 0.9428090415820634 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.816496580927726 ], "presentation_avg": [ 2.6666666666666665, 0.9428090415820634 ], "wc_summary_avg": [ 70.66666666666667, 26.132142830026183 ], "wc_strengths_avg": [ 48.333333333333336, 26.398653164297777 ], "wc_weaknesses_avg": [ 271.3333333333333, 69.31249686905113 ], "wc_questions_avg": [ 62.0, 43.18178628387977 ], "wc_review_avg": [ 452.3333333333333, 48.93760199364993 ], "wc_reply_reviewers_avg": [ 27.0, 15.748015748023622 ], "wc_reply_authors_avg": [ 461.3333333333333, 82.98326471176114 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 3, 0 ], 
"corr_rating_confidence": 0.0, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=1116698979299600068&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 5, "aff_unique_index": "0;0;1", "aff_unique_norm": "University of Ghent;Indian Institute of Technology Kanpur", "aff_unique_dep": ";", "aff_unique_url": "https://www.ugent.be/en;https://www.iitk.ac.in", "aff_unique_abbr": "UGent;IITK", "aff_campus_unique_index": "1", "aff_campus_unique": ";Kanpur", "aff_country_unique_index": "0;0;1", "aff_country_unique": "Belgium;India" }, { "id": "3wL1tj3kqE", "title": "Fair Domain Generalization with Arbitrary Sensitive Attributes", "track": "main", "status": "Reject", "tldr": "", "abstract": "We consider the problem of fairness transfer in domain generalization. Traditional domain generalization methods are designed to generalize a model to unseen domains. Recent work has extended this capability to incorporate fairness as an additional requirement. However, it is only applicable to a single, unchanging sensitive attribute across all domains. As a naive approach to extend it to a multi-attribute context, we can train a model for each subset of the potential set of sensitive attributes. However, this results in $2^n$ models for $n$ attributes. We propose a novel approach that allows any combination of sensitive attributes in the target domain. We learn two representations, a domain invariant representation to generalize the model's performance, and a selective domain invariant representation to transfer the model's fairness to unseen domains. As each domain can have a different set of sensitive attributes, we transfer the fairness by learning a selective domain invariant representation which enforces similar representations among only those domains that have similar sensitive attributes. We demonstrate that our method decreases the current requirement of $2^n$ models to $1$ to accomplish this task. 
Moreover, our method outperforms the state-of-the-art on unseen target domains across multiple experimental settings.", "keywords": "domain generalization;fairness;multiple sensitive attributes", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Ragja Palakkadavath;Hung Le;Thanh Nguyen-Tang;Svetha Venkatesh;Sunil Gupta", "authorids": "~Ragja_Palakkadavath1;~Hung_Le1;~Thanh_Nguyen-Tang1;~Svetha_Venkatesh1;~Sunil_Gupta2", "gender": "F;F;M;M;M", "homepage": ";https://www.deakin.edu.au/about-deakin/people/svetha-venkatesh;https://thaihungle.github.io/;https://personal-sites.deakin.edu.au/~sunilg/;https://thanhnguyentang.github.io/", "dblp": "283/0847;81/1984;45/466-2;47/333-1;287/5102.html", "google_scholar": "https://scholar.google.co.in/citations?user=cVTpiuoAAAAJ;AEkRUQcAAAAJ;https://scholar.google.com.au/citations?user=q2HbxngAAAAJ;https://scholar.google.com.au/citations?user=bXeL2t8AAAAJ;https://scholar.google.com/citations?hl=en", "orcid": ";;0000-0002-3126-184X;0000-0002-3308-1930;0000-0002-1917-2190", "linkedin": ";;;;thanhnguyentang/", "or_profile": "~Ragja_Palakkadavath1;~Svetha_Venkatesh1;~Hung_Thai_Le1;~Sunil_Kumar_Gupta1;~Thanh_Tang_Nguyen2", "aff": "Deakin University;Deakin University;Deakin University;Deakin University;Johns Hopkins University", "aff_domain": "deakin.edu.au;deakin.edu.au;deakin.edu.au;deakin.edu.au;jhu.edu", "position": "PhD student;Full Professor;Lecturer;Full Professor;Postdoc", "bibtex": "@misc{\npalakkadavath2024fair,\ntitle={Fair Domain Generalization with Arbitrary Sensitive Attributes},\nauthor={Ragja Palakkadavath and Hung Le and Thanh Nguyen-Tang and Svetha Venkatesh and Sunil Gupta},\nyear={2024},\nurl={https://openreview.net/forum?id=3wL1tj3kqE}\n}", "github": "", "project": "", "reviewers": "kdx1;cyJi;XuYi;FctA", "site": "https://openreview.net/forum?id=3wL1tj3kqE", "pdf_size": 380256, "rating": "1;3;3;6", "confidence": "5;4;4;4", "soundness": "1;2;2;3", "contribution": "2;2;2;3", "presentation": "2;3;2;2", "wc_summary": "72;104;68;121", "wc_strengths": "38;197;14;79", "wc_weaknesses": "508;258;365;81", "wc_questions": "2;191;4;24", "wc_review": "620;750;451;305", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "1445;977;1087;563", "reply_reviewers": "0;0;0;0", "reply_authors": "2;2;2;1", "rating_avg": [ 3.25, 1.7853571071357126 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 2.0, 0.7071067811865476 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 91.25, 22.128883839904805 ], "wc_strengths_avg": [ 82.0, 70.3455755538328 ], "wc_weaknesses_avg": [ 303.0, 155.8669304246414 ], "wc_questions_avg": [ 55.25, 78.84597326433354 ], "wc_review_avg": [ 531.5, 168.34265650749367 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 1018.0, 314.5615996907442 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.75, 0.4330127018922193 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.7276068751089989, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:jEEsnffqJ1EJ:scholar.google.com/&scioq=Fair+Domain+Generalization+with+Arbitrary+Sensitive+Attributes&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;0;0;1", "aff_unique_norm": "Deakin University;Johns Hopkins University", "aff_unique_dep": ";", "aff_unique_url": "https://www.deakin.edu.au;https://www.jhu.edu", "aff_unique_abbr": "Deakin;JHU", 
"aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;1", "aff_country_unique": "Australia;United States" }, { "id": "3wde105NL2", "title": "test", "track": "main", "status": "Desk Reject", "tldr": "", "abstract": "test", "keywords": "CUHK", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Jiyue Jiang", "authorids": "~Jiyue_Jiang1", "gender": "M", "homepage": "", "dblp": "271/4659", "google_scholar": "https://scholar.google.com.hk/citations?user=O4ZaJ7QAAAAJ", "orcid": "", "linkedin": "jethro-jiang-1215661a1/", "or_profile": "~Jiyue_Jiang1", "aff": "The Chinese University of Hong Kong", "aff_domain": "link.cuhk.edu.hk", "position": "PhD student", "bibtex": "@misc{\njiang2024test,\ntitle={test},\nauthor={Jiyue Jiang},\nyear={2024},\nurl={https://openreview.net/forum?id=3wde105NL2}\n}", "github": "", "project": "", "reviewers": "", "site": "https://openreview.net/forum?id=3wde105NL2", "pdf_size": 0, "rating": "", "confidence": "", "soundness": "", "contribution": "", "presentation": "", "wc_summary": "", "wc_strengths": "", "wc_weaknesses": "", "wc_questions": "", "wc_review": "", "wc_reply_reviewers": "", "wc_reply_authors": "", "reply_reviewers": "", "reply_authors": "", "rating_avg": [ 0, 0 ], "confidence_avg": [ 0, 0 ], "soundness_avg": [ 0, 0 ], "contribution_avg": [ 0, 0 ], "presentation_avg": [ 0, 0 ], "wc_summary_avg": [ 0, 0 ], "wc_strengths_avg": [ 0, 0 ], "wc_weaknesses_avg": [ 0, 0 ], "wc_questions_avg": [ 0, 0 ], "wc_review_avg": [ 0, 0 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 0, 0 ], "authors#_avg": [ 1, 0 ], "corr_rating_confidence": 0, "gs_citation": -1, "gs_cited_by_link": "", "gs_version_total": -1, "aff_unique_index": "0", "aff_unique_norm": "Chinese University of Hong Kong", "aff_unique_dep": "", "aff_unique_url": "https://www.cuhk.edu.hk", "aff_unique_abbr": "CUHK", "aff_campus_unique_index": "0", "aff_campus_unique": "Hong Kong SAR", "aff_country_unique_index": "0", "aff_country_unique": "China" }, { "id": "3wde105NL2", "title": "test", "track": "main", "status": "Desk Reject", "tldr": "", "abstract": "test", "keywords": "CUHK", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Jiyue Jiang", "authorids": "~Jiyue_Jiang1", "gender": "M", "homepage": "", "dblp": "271/4659", "google_scholar": "https://scholar.google.com.hk/citations?user=O4ZaJ7QAAAAJ", "orcid": "", "linkedin": "jethro-jiang-1215661a1/", "or_profile": "~Jiyue_Jiang1", "aff": "The Chinese University of Hong Kong", "aff_domain": "link.cuhk.edu.hk", "position": "PhD student", "bibtex": "@misc{\njiang2024test,\ntitle={test},\nauthor={Jiyue Jiang},\nyear={2024},\nurl={https://openreview.net/forum?id=3wde105NL2}\n}", "github": "", "project": "", "reviewers": "", "site": "https://openreview.net/forum?id=3wde105NL2", "pdf_size": 0, "rating": "", "confidence": "", "soundness": "", "contribution": "", "presentation": "", "wc_summary": "", "wc_strengths": "", "wc_weaknesses": "", "wc_questions": "", "wc_review": "", "wc_reply_reviewers": "", "wc_reply_authors": "", "reply_reviewers": "", "reply_authors": "", "rating_avg": [ 0, 0 ], "confidence_avg": [ 0, 0 ], "soundness_avg": [ 0, 0 ], "contribution_avg": [ 0, 0 ], "presentation_avg": [ 0, 0 ], "wc_summary_avg": [ 0, 0 ], "wc_strengths_avg": [ 0, 0 ], "wc_weaknesses_avg": [ 0, 0 ], "wc_questions_avg": [ 0, 0 ], "wc_review_avg": [ 0, 0 ], 
"wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 0, 0 ], "authors#_avg": [ 1, 0 ], "corr_rating_confidence": 0, "gs_citation": -1, "gs_cited_by_link": "", "gs_version_total": -1, "aff_unique_index": "0", "aff_unique_norm": "Chinese University of Hong Kong", "aff_unique_dep": "", "aff_unique_url": "https://www.cuhk.edu.hk", "aff_unique_abbr": "CUHK", "aff_campus_unique_index": "0", "aff_campus_unique": "Hong Kong SAR", "aff_country_unique_index": "0", "aff_country_unique": "China" }, { "title": "Sharpness-Aware Minimization Enhances Feature Quality via Balanced Learning", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19489", "id": "3xDaj4pRna", "author_site": "Jacob Springer, Vaishnavh Nagarajan, Aditi Raghunathan", "tldr": "", "abstract": "Sharpness-Aware Minimization (SAM) has emerged as a promising alternative optimizer to stochastic gradient descent (SGD). The originally-proposed motivation behind SAM was to bias neural networks towards flatter minima that are believed to generalize better. However, recent studies have shown conflicting evidence on the relationship between flatness and generalization, suggesting that flatness does fully explain SAM's success. Sidestepping this debate, we identify an orthogonal effect of SAM that is beneficial out-of-distribution: we argue that SAM implicitly balances the quality of diverse features. SAM achieves this effect by adaptively suppressing well-learned features which gives remaining features opportunity to be learned. We show that this mechanism is beneficial in datasets that contain redundant or spurious features where SGD falls for the simplicity bias and would not otherwise learn all available features. 
Our insights are supported by experiments on real data: we demonstrate that SAM improves the quality of features in datasets containing redundant or spurious features, including CelebA, Waterbirds, CIFAR-MNIST, and DomainBed.", "keywords": "sharpness-aware minimization;representation learning;spurious correlations", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Jacob Mitchell Springer;Vaishnavh Nagarajan;Aditi Raghunathan", "authorids": "~Jacob_Mitchell_Springer1;~Vaishnavh_Nagarajan3;~Aditi_Raghunathan1", "gender": "M;F;M", "homepage": "https://sprin.xyz;https://www.cs.cmu.edu/~aditirag/;https://vaishnavh.github.io/", "dblp": ";166/1409;161/0079", "google_scholar": "niZiN38AAAAJ;Ch9iRwQAAAAJ;https://scholar.google.nl/citations?user=LrsjJfwAAAAJ", "orcid": ";;", "linkedin": ";;", "or_profile": "~Jacob_Mitchell_Springer1;~Aditi_Raghunathan1;~Vaishnavh_Nagarajan1", "aff": "Carnegie Mellon University;Carnegie Mellon University;Google", "aff_domain": "cmu.edu;cmu.edu;google.com", "position": "PhD student;Assistant Professor;Researcher", "bibtex": "@inproceedings{\nspringer2024sharpnessaware,\ntitle={Sharpness-Aware Minimization Enhances Feature Quality via Balanced Learning},\nauthor={Jacob Mitchell Springer and Vaishnavh Nagarajan and Aditi Raghunathan},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=3xDaj4pRna}\n}", "github": "", "project": "", "reviewers": "Jhr2;qpzp;BgWc;NKN8;LFgC;KbQq", "pdf_size": 1269488, "rating": "6;6;6;6;6;8", "confidence": "3;4;3;4;4;3", "soundness": "3;2;2;3;2;3", "contribution": "3;2;3;2;3;3", "presentation": "3;1;2;3;3;3", "wc_summary": "84;34;84;34;113;120", "wc_strengths": "59;16;54;42;43;122", "wc_weaknesses": "87;62;170;37;32;118", "wc_questions": "34;2;3;1;238;336", "wc_review": "264;114;311;114;426;696", "wc_reply_reviewers": "11;34;17;0;73;82", "wc_reply_authors": "590;423;527;51;797;535", "reply_reviewers": "1;1;1;0;1;1", "reply_authors": "1;1;1;1;1;1", "rating_avg": [ 6.333333333333333, 0.7453559924999298 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.5, 0.7637626158259734 ], "wc_summary_avg": [ 78.16666666666667, 33.99223767600807 ], "wc_strengths_avg": [ 56.0, 32.49102440162001 ], "wc_weaknesses_avg": [ 84.33333333333333, 48.230925993829125 ], "wc_questions_avg": [ 102.33333333333333, 134.0878650570422 ], "wc_review_avg": [ 320.8333333333333, 200.29013677385336 ], "wc_reply_reviewers_avg": [ 36.166666666666664, 31.01299010988066 ], "wc_reply_authors_avg": [ 487.1666666666667, 225.3903404220233 ], "reply_reviewers_avg": [ 0.8333333333333334, 0.37267799624996495 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.4472135954999579, "gs_citation": 5, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=17722484160754341186&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=3xDaj4pRna", "pdf": "https://openreview.net/pdf?id=3xDaj4pRna", "email": "cmu.edu;cmu.edu;google.com", "author_num": 3, "aff_unique_index": "0;0;1", "aff_unique_norm": "Carnegie Mellon University;Google", "aff_unique_dep": ";Google", "aff_unique_url": "https://www.cmu.edu;https://www.google.com", "aff_unique_abbr": "CMU;Google", "aff_campus_unique_index": "1", 
"aff_campus_unique": ";Mountain View", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "title": "Sophia: A Scalable Stochastic Second-order Optimizer for Language Model Pre-training", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19488", "id": "3xHDeA8Noi", "author_site": "Hong Liu, Zhiyuan Li, David Hall, Percy Liang, Tengyu Ma", "tldr": "", "abstract": "Given the massive cost of language model pre-training, a non-trivial improvement of the optimization algorithm would lead to a material reduction on the time and cost of training. Adam and its variants have been state-of-the-art for years, and more sophisticated second-order (Hessian-based) optimizers often incur too much per-step overhead. In this paper, we propose Sophia, a simple scalable second-order optimizer that uses a light-weight estimate of the diagonal Hessian as the pre-conditioner. The update is the moving average of the gradients divided by the moving average of the estimated Hessian, followed by element-wise clipping. The clipping controls the worst-case update size and tames the negative impact of non-convexity and rapid change of Hessian along the trajectory. Sophia only estimates the diagonal Hessian every handful of iterations, which has negligible average per-step time and memory overhead. On language modeling with GPT models of sizes ranging from 125M to 1.5B, Sophia achieves a 2x speed-up compared to Adam in the number of steps, total compute, and wall-clock time, achieving the same perplexity with 50\\% fewer steps, less total compute, and reduced wall-clock time.", "keywords": "large language models;pretraining;optimization in deep learning", "primary_area": "optimization", "supplementary_material": "/attachment/95a79cae116529a8b29395efabc5dd175b828ebd.zip", "author": "Hong Liu;Zhiyuan Li;David Leo Wright Hall;Percy Liang;Tengyu Ma", "authorids": "~Hong_Liu5;~Zhiyuan_Li2;~David_Leo_Wright_Hall1;~Percy_Liang1;~Tengyu_Ma1", "gender": "M;M;M;;M", "homepage": ";https://zhiyuanli.ttic.edu;;https://cs.stanford.edu/~pliang/;http://ai.stanford.edu/~tengyuma/", "dblp": ";l/ZhiyuanLi;133/2070;04/1701;54/9061", "google_scholar": "BUc2uq0AAAAJ;https://scholar.google.com/citations?hl=en;6GpZV0YAAAAJ;pouyVyUAAAAJ;i38QlUwAAAAJ", "orcid": ";;;;", "linkedin": ";;dlwhall/;;", "or_profile": "~Hong_Liu5;~Zhiyuan_Li2;~David_Leo_Wright_Hall1;~Percy_Liang1;~Tengyu_Ma1", "aff": "Stanford University;Toyota Technological Institute at Chicago;Stanford University;Stanford University;Facebook AI Research", "aff_domain": "stanford.edu;ttic.edu;stanford.edu;stanford.edu;fb.com", "position": "PhD student;Assistant Professor;Researcher;Associate Professor;Visiting Scientist", "bibtex": "@inproceedings{\nliu2024sophia,\ntitle={Sophia: A Scalable Stochastic Second-order Optimizer for Language Model Pre-training},\nauthor={Hong Liu and Zhiyuan Li and David Leo Wright Hall and Percy Liang and Tengyu Ma},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=3xHDeA8Noi}\n}", "github": "", "project": "", "reviewers": "x5VB;Gbmx;knid;R1G3", "pdf_size": 2834253, "rating": "6;8;8;8", "confidence": "4;4;3;3", "soundness": "3;4;3;3", "contribution": "2;4;4;4", "presentation": "3;2;3;4", "wc_summary": "213;66;100;107", "wc_strengths": "96;73;111;155", "wc_weaknesses": "82;98;91;21", "wc_questions": "61;141;110;366", "wc_review": "452;378;412;649", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": 
"314;306;185;425", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 7.5, 0.8660254037844386 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 3.5, 0.8660254037844386 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 121.5, 55.056788863863105 ], "wc_strengths_avg": [ 108.75, 29.93639089803579 ], "wc_weaknesses_avg": [ 73.0, 30.553232234904378 ], "wc_questions_avg": [ 169.5, 116.97969909347519 ], "wc_review_avg": [ 472.75, 105.07467582629032 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 307.5, 84.9367411665882 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 10, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 151, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=1035408644622871003&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=3xHDeA8Noi", "pdf": "https://openreview.net/pdf?id=3xHDeA8Noi", "email": "stanford.edu;ttic.edu;stanford.edu;stanford.edu;fb.com", "author_num": 5, "aff_unique_index": "0;1;0;0;2", "aff_unique_norm": "Stanford University;Toyota Technological Institute at Chicago;Meta", "aff_unique_dep": ";;Facebook AI Research", "aff_unique_url": "https://www.stanford.edu;https://www.tti-chicago.org;https://research.facebook.com", "aff_unique_abbr": "Stanford;TTI Chicago;FAIR", "aff_campus_unique_index": "0;1;0;0", "aff_campus_unique": "Stanford;Chicago;", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "3xHbRLymyZ", "title": "DeeDiff: Dynamic Uncertainty-Aware Early Exiting for Accelerating Diffusion Model Generation", "track": "main", "status": "Reject", "tldr": "", "abstract": "Diffusion models achieve great success in generating diverse and high-fidelity images. The performance improvements come with low generation speed per image, which hinders the application diffusion models in real-time scenarios. While some certain predictions benefit from the full computation of the model in each sample iteration, not every iteration requires the same amount of computation, potentially leading to computation waste. In this work, we propose DeeDiff, an early exiting framework that adaptively allocates computation resources in each sampling step to improve the generation efficiency of diffusion models. Specifically, we introduce a timestep-aware uncertainty estimation module (UEM) for diffusion models which is attached to each intermediate layer to estimate the prediction uncertainty of each layer. The uncertainty is regarded as the signal to decide if the inference terminates. Moreover, we propose uncertainty-aware layer-wise loss to fill the performance gap between full models and early-exited models. With such loss strategy, our model is able to obtain comparable results as full-layer models. Extensive experiments of class-conditional, unconditional, and text-guided generation on several datasets show that our method achieves state-of-the-art performance and efficiency trade-off compared with existing early exiting methods on diffusion models. More importantly, our method even brings extra benefits to baseline models and obtains better performance on CIFAR-10 and Celeb-A datasets. 
Full code and model are released for reproduction.", "keywords": "Diffusion;Efficiency;Diffusion acceleration;Early Exiting", "primary_area": "generative models", "supplementary_material": "/attachment/8d54309968936bfe4e8fe8263a3f58de64671d0e.zip", "author": "Shengkun Tang;Yaqing Wang;Caiwen Ding;Yi Liang;Yao Li;Dongkuan Xu", "authorids": "~Shengkun_Tang1;~Yaqing_Wang1;~Caiwen_Ding1;~Yi_Liang1;~Yao_Li1;~Dongkuan_Xu2", "gender": ";M;M;M;F;M", "homepage": ";https://yaqingwang.github.io/;https://caiwending.cse.uconn.edu/;https://research.google/people/108265/;https://liyao880.github.io/yaoli/;https://dongkuanx27.github.io/", "dblp": ";147/1393;175/2489;;;142/8139", "google_scholar": ";_Rfg2CAAAAAJ;7hR0r_EAAAAJ;9vQ7gbgAAAAJ;bQ6YhCwAAAAJ;https://scholar.google.com/citations?hl=en", "orcid": ";;0000-0003-0891-1231;0000-0002-6622-8919;0000-0002-7195-5774;0000-0002-1456-9658", "linkedin": ";;caiwen-ding-47144489/;;yao-li-b189574a/;dongkuan-dk-xu-%F0%9F%87%BA%F0%9F%87%A6-05038087/", "or_profile": "~Shengkun_Tang1;~Yaqing_Wang1;~Caiwen_Ding1;~Yi_Liang1;~Yao_Li1;~Dongkuan_Xu2", "aff": ";Google DeepMind;University of Connecticut;Research, Google;University of North Carolina, Chapel Hill;North Carolina State University", "aff_domain": ";google.com;uconn.edu;research.google.com;unc.edu;ncsu.edu", "position": ";Research Scientist;Assistant Professor;Researcher;Assistant Professor;Assistant Professor", "bibtex": "@misc{\ntang2024deediff,\ntitle={DeeDiff: Dynamic Uncertainty-Aware Early Exiting for Accelerating Diffusion Model Generation},\nauthor={Shengkun Tang and Yaqing Wang and Caiwen Ding and Yi Liang and Yao Li and Dongkuan Xu},\nyear={2024},\nurl={https://openreview.net/forum?id=3xHbRLymyZ}\n}", "github": "", "project": "", "reviewers": "xWTy;ttQR;eCAn;PB4D", "site": "https://openreview.net/forum?id=3xHbRLymyZ", "pdf_size": 8973925, "rating": "3;5;5;5", "confidence": "4;4;4;4", "soundness": "3;3;3;2", "contribution": "2;2;2;2", "presentation": "1;2;3;2", "wc_summary": "52;102;32;61", "wc_strengths": "42;61;31;37", "wc_weaknesses": "245;365;94;351", "wc_questions": "5;5;4;63", "wc_review": "344;533;161;512", "wc_reply_reviewers": "0;20;0;0", "wc_reply_authors": "204;515;217;888", "reply_reviewers": "0;1;0;0", "reply_authors": "1;2;1;2", "rating_avg": [ 4.5, 0.8660254037844386 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.0, 0.7071067811865476 ], "wc_summary_avg": [ 61.75, 25.498774480354932 ], "wc_strengths_avg": [ 42.75, 11.233320969330485 ], "wc_weaknesses_avg": [ 263.75, 108.43287093865956 ], "wc_questions_avg": [ 19.25, 25.262373206015305 ], "wc_review_avg": [ 387.5, 149.8874577808297 ], "wc_reply_reviewers_avg": [ 5.0, 8.660254037844387 ], "wc_reply_authors_avg": [ 456.0, 278.71580507750184 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 8, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11105961738940576174&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 2, "aff_unique_index": "0;1;0;2;3", "aff_unique_norm": "Google;University of Connecticut;University of North Carolina;North Carolina State University", "aff_unique_dep": "Google DeepMind;;;", "aff_unique_url": "https://deepmind.com;https://www.uconn.edu;https://www.unc.edu;https://www.ncsu.edu", "aff_unique_abbr": "DeepMind;UConn;UNC;NCSU", "aff_campus_unique_index": "1;2", "aff_campus_unique": 
";Mountain View;Chapel Hill", "aff_country_unique_index": "0;1;1;1;1", "aff_country_unique": "United Kingdom;United States" }, { "title": "Brain decoding: toward real-time reconstruction of visual perception", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19487", "id": "3y1K6buO8c", "author_site": "Yohann Benchetrit, Hubert Banville, Jean-Remi King", "tldr": "", "abstract": "In the past five years, the use of generative and foundational AI systems has greatly improved the decoding of brain activity. Visual perception, in particular, can now be decoded from functional Magnetic Resonance Imaging (fMRI) with remarkable fidelity. This neuroimaging technique, however, suffers from a limited temporal resolution ($\\approx$0.5\\,Hz) and thus fundamentally constrains its real-time usage. Here, we propose an alternative approach based on magnetoencephalography (MEG), a neuroimaging device capable of measuring brain activity with high temporal resolution ($\\approx$5,000 Hz). For this, we develop an MEG decoding model trained with both contrastive and regression objectives and consisting of three modules: i) pretrained embeddings obtained from the image, ii) an MEG module trained end-to-end and iii) a pretrained image generator. Our results are threefold: Firstly, our MEG decoder shows a 7X improvement of image-retrieval over classic linear decoders. Second, late brain responses to images are best decoded with DINOv2, a recent foundational image model. Third, image retrievals and generations both suggest that high-level visual features can be decoded from MEG signals, although the same approach applied to 7T fMRI also recovers better low-level features. Overall, these results, while preliminary, provide an important step towards the decoding - in real-time - of the visual processes continuously unfolding within the human brain.", "keywords": "brain decoding;neuroimaging;image generation;visual perception", "primary_area": "applications to neuroscience & cognitive science", "supplementary_material": "/attachment/33660daed024e43122d3ebfc674cd73724ade9bb.pdf", "author": "Yohann Benchetrit;Hubert Banville;Jean-Remi King", "authorids": "~Yohann_Benchetrit1;~Hubert_Banville1;~Jean-Remi_King1", "gender": "M;;M", "homepage": ";;https://kingjr.github.io/", "dblp": "42/9992.html;;", "google_scholar": ";;XZOgIwEAAAAJ", "orcid": ";;", "linkedin": ";;", "or_profile": "~Yohann_Benchetrit1;~Hubert_Banville1;~Jean-Remi_King1", "aff": "Meta AI;;CNRS", "aff_domain": "ai.meta.com;;cnrs.fr", "position": "Researcher;;Associate Professor", "bibtex": "@inproceedings{\nbenchetrit2024brain,\ntitle={Brain decoding: toward real-time reconstruction of visual perception},\nauthor={Yohann Benchetrit and Hubert Banville and Jean-Remi King},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=3y1K6buO8c}\n}", "github": "", "project": "", "reviewers": "F12m;4PGh;hWdQ;hpxq", "pdf_size": 8172811, "rating": "6;6;8;8", "confidence": "3;3;4;4", "soundness": "3;3;4;3", "contribution": "2;2;4;2", "presentation": "3;3;3;4", "wc_summary": "92;145;122;89", "wc_strengths": "139;98;49;34", "wc_weaknesses": "597;142;42;371", "wc_questions": "7;119;14;51", "wc_review": "835;504;227;545", "wc_reply_reviewers": "192;47;0;21", "wc_reply_authors": "2911;1014;770;1765", "reply_reviewers": "2;2;0;1", "reply_authors": "7;4;2;3", "rating_avg": [ 7.0, 1.0 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], 
"contribution_avg": [ 2.5, 0.8660254037844386 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 112.0, 23.010866998007703 ], "wc_strengths_avg": [ 80.0, 41.47891030391228 ], "wc_weaknesses_avg": [ 288.0, 214.5938023336182 ], "wc_questions_avg": [ 47.75, 44.40368790990226 ], "wc_review_avg": [ 527.75, 215.47317118379263 ], "wc_reply_reviewers_avg": [ 65.0, 75.18975994109836 ], "wc_reply_authors_avg": [ 1615.0, 833.2679641027848 ], "reply_reviewers_avg": [ 1.25, 0.82915619758885 ], "reply_authors_avg": [ 4.0, 1.8708286933869707 ], "replies_avg": [ 29, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 1.0, "gs_citation": 54, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11496380628988912301&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=3y1K6buO8c", "pdf": "https://openreview.net/pdf?id=3y1K6buO8c", "email": "ai.meta.com;;cnrs.fr", "author_num": 3, "aff_unique_index": "0;1", "aff_unique_norm": "Meta;Centre National de la Recherche Scientifique", "aff_unique_dep": "Meta AI;", "aff_unique_url": "https://meta.com;https://www.cnrs.fr", "aff_unique_abbr": "Meta;CNRS", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1", "aff_country_unique": "United States;France" }, { "title": "T-Rep: Representation Learning for Time Series using Time-Embeddings", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19486", "id": "3y2TfP966N", "author_site": "Archibald Fraikin, Adrien Bennetot, Stephanie Allassonniere", "tldr": "", "abstract": "Multivariate time series present challenges to standard machine learning techniques, as they are often unlabeled, high dimensional, noisy, and contain missing data. To address this, we propose T-Rep, a self-supervised method to learn time series representations at a timestep granularity. T-Rep learns vector embeddings of time alongside its feature extractor, to extract temporal features such as trend, periodicity, or distribution shifts from the signal. These time-embeddings are leveraged in pretext tasks, to incorporate smooth and fine-grained temporal dependencies in the representations, as well as reinforce robustness to missing data. We evaluate T-Rep on downstream classification, forecasting, and anomaly detection tasks. It is compared to existing self-supervised algorithms for time series, which it outperforms in all three tasks. We test T-Rep in missing data regimes, where it proves more resilient than its counterparts. 
Finally, we provide latent space visualisation experiments, highlighting the interpretability of the learned representations.", "keywords": "Multivariate time series;Self-supervised;Time series representations;Temporal features;Time-Embeddings;Representation Learning;Missing data", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Archibald Felix Fraikin;Adrien Bennetot;Stephanie Allassonniere", "authorids": "~Archibald_Felix_Fraikin1;~Adrien_Bennetot1;~Stephanie_Allassonniere1", "gender": "M;M;F", "homepage": ";;https://sites.google.com/site/stephanieallassonniere/", "dblp": ";;", "google_scholar": ";Wo4dfcgAAAAJ;https://scholar.google.fr/citations?user=9ubMya8AAAAJ", "orcid": ";;", "linkedin": "archibald-fraikin-819607194/;;", "or_profile": "~Archibald_Felix_Fraikin1;~Adrien_Bennetot1;~Stephanie_Allassonniere1", "aff": ";;University Paris Descartes", "aff_domain": ";;parisdescartes.fr", "position": ";;Full Professor", "bibtex": "@inproceedings{\nfraikin2024trep,\ntitle={T-Rep: Representation Learning for Time Series using Time-Embeddings},\nauthor={Archibald Felix Fraikin and Adrien Bennetot and Stephanie Allassonniere},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=3y2TfP966N}\n}", "github": "", "project": "", "reviewers": "znEu;99iS;9kuw;rWLt;5x3c", "pdf_size": 2636673, "rating": "5;5;6;6;8", "confidence": "5;4;4;4;3", "soundness": "3;3;2;3;3", "contribution": "2;3;3;3;3", "presentation": "3;3;3;4;4", "wc_summary": "46;85;68;103;109", "wc_strengths": "119;126;43;44;231", "wc_weaknesses": "204;190;165;78;301", "wc_questions": "3;8;152;215;51", "wc_review": "372;409;428;440;692", "wc_reply_reviewers": "69;0;140;0;188", "wc_reply_authors": "1669;777;1433;1523;938", "reply_reviewers": "1;0;1;0;1", "reply_authors": "4;2;4;3;3", "rating_avg": [ 6.0, 1.0954451150103321 ], "confidence_avg": [ 4.0, 0.6324555320336759 ], "soundness_avg": [ 2.8, 0.39999999999999997 ], "contribution_avg": [ 2.8, 0.39999999999999997 ], "presentation_avg": [ 3.4, 0.4898979485566356 ], "wc_summary_avg": [ 82.2, 23.111901695879553 ], "wc_strengths_avg": [ 112.6, 68.97709764842241 ], "wc_weaknesses_avg": [ 187.6, 71.63407010633976 ], "wc_questions_avg": [ 85.8, 83.89851011787992 ], "wc_review_avg": [ 468.2, 114.24254899117054 ], "wc_reply_reviewers_avg": [ 79.4, 75.07755989641645 ], "wc_reply_authors_avg": [ 1268.0, 347.2843215579995 ], "reply_reviewers_avg": [ 0.6, 0.48989794855663565 ], "reply_authors_avg": [ 3.2, 0.7483314773547882 ], "replies_avg": [ 28, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.8660254037844387, "gs_citation": 13, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=9027301723575336990&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=3y2TfP966N", "pdf": "https://openreview.net/pdf?id=3y2TfP966N", "email": ";;parisdescartes.fr", "author_num": 3, "aff_unique_index": "0", "aff_unique_norm": "University Paris Descartes", "aff_unique_dep": "", "aff_unique_url": "https://www.univ-paris5.fr", "aff_unique_abbr": "UPD", "aff_country_unique_index": "0", "aff_country_unique": "France" }, { "id": "3yyGlNHnlj", "title": "GraphECL: Towards Efficient Contrastive Learning for Graphs", "track": "main", "status": "Reject", "tldr": "", "abstract": "Due to the inherent label scarcity, learning useful representations on graphs with no supervision is of great 
benefit. Yet, existing graph self-supervised learning methods overlook the scalability challenge and fail to conduct fast inference of representations in latency-constrained applications due to the intensive message passing of graph neural networks. In this paper, we present GraphECL, a simple and efficient contrastive learning paradigm for graphs. To achieve inference acceleration, GraphECL does not rely on graph augmentations but introduces cross-model contrastive learning, where positive samples are obtained through MLP and GNN representations from the central node and its neighbors. We provide theoretical analysis on the design of this cross-model framework and discuss why the MLP can still capture structural information and enjoy downstream performance as good as the GNN. Extensive experiments on common real-world tasks verify the superior performance of GraphECL compared to state-of-the-art methods, highlighting its intriguing properties, including better inference efficiency and generalization to both homophilous and heterophilous graphs. On large-scale datasets such as Snap-patents, the MLP learned by GraphECL is 286.82x faster than GCL methods with the same number of GNN layers.", "keywords": "Graph Neural Networks", "primary_area": "learning on graphs and other geometries & topologies", "supplementary_material": "", "author": "Teng Xiao;Huaisheng Zhu;Zhiwei Zhang;Zhimeng Guo;Charu C. Aggarwal;Suhang Wang", "authorids": "~Teng_Xiao2;~Huaisheng_Zhu1;~Zhiwei_Zhang10;~Zhimeng_Guo1;~Charu_C._Aggarwal2;~Suhang_Wang1", "gender": "M;M;M;M;M;M", "homepage": ";https://zzwjames.github.io/zhiweizhang.github.io/;;http://www.charuaggarwal.net;https://faculty.ist.psu.edu/szw494/;https://tengxiao1.github.io/", "dblp": "264/2622.html;68/1980-1.html;304/3478;a/CharuCAggarwal;136/9440;", "google_scholar": ";_Rfg2CAAAAAJ;7hR0r_EAAAAJ;x_wsduUAAAAJ;cdT_WMMAAAAJ;ld3OKXwAAAAJ", "orcid": ";0009-0007-6153-2739;;0000-0003-2579-7581;0000-0003-3448-4878;", "linkedin": ";;;;;", "or_profile": "~Huaisheng_Zhu1;~Zhiwei_Zhang10;~Zhimeng_Guo1;~Charu_C._Aggarwal2;~Suhang_Wang1;~Teng_Xiao1", "aff": "Pennsylvania State University;Pennsylvania State University;Pennsylvania State University;International Business Machines;Pennsylvania State University;The Pennsylvania State University", "aff_domain": "psu.edu;psu.edu;psu.edu;ibm.com;psu.edu;psu.edu", "position": "PhD student;PhD student;PhD student;Distinguished Research Staff Member;Assistant Professor;PhD student", "bibtex": "@misc{\nxiao2024graphecl,\ntitle={Graph{ECL}: Towards Efficient Contrastive Learning for Graphs},\nauthor={Teng Xiao and Huaisheng Zhu and Zhiwei Zhang and Zhimeng Guo and Charu C. 
Aggarwal and Suhang Wang},\nyear={2024},\nurl={https://openreview.net/forum?id=3yyGlNHnlj}\n}", "github": "", "project": "", "reviewers": "ZTuD;GMYZ;eihc;ezu8;xAqE", "site": "https://openreview.net/forum?id=3yyGlNHnlj", "pdf_size": 1482963, "rating": "3;6;6;6;6", "confidence": "4;5;4;5;3", "soundness": "2;2;3;3;2", "contribution": "2;2;3;3;3", "presentation": "2;2;2;3;3", "wc_summary": "43;69;213;103;90", "wc_strengths": "67;33;97;47;37", "wc_weaknesses": "231;280;172;62;141", "wc_questions": "170;5;28;48;13", "wc_review": "511;387;510;260;281", "wc_reply_reviewers": "267;42;0;27;16", "wc_reply_authors": "1497;834;56;563;656", "reply_reviewers": "1;2;0;1;1", "reply_authors": "4;3;1;2;3", "rating_avg": [ 5.4, 1.2 ], "confidence_avg": [ 4.2, 0.7483314773547882 ], "soundness_avg": [ 2.4, 0.4898979485566356 ], "contribution_avg": [ 2.6, 0.4898979485566356 ], "presentation_avg": [ 2.4, 0.4898979485566356 ], "wc_summary_avg": [ 103.6, 58.34929305484343 ], "wc_strengths_avg": [ 56.2, 23.54909764725604 ], "wc_weaknesses_avg": [ 177.2, 74.92769848327119 ], "wc_questions_avg": [ 52.8, 60.40331116751796 ], "wc_review_avg": [ 389.8, 107.54608314578454 ], "wc_reply_reviewers_avg": [ 70.4, 99.2544205564669 ], "wc_reply_authors_avg": [ 721.2, 466.1241894602768 ], "reply_reviewers_avg": [ 1.0, 0.6324555320336759 ], "reply_authors_avg": [ 2.6, 1.019803902718557 ], "replies_avg": [ 30, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.1336306209562122, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:InVHuKjFXzEJ:scholar.google.com/&scioq=GraphECL:+Towards+Efficient+Contrastive+Learning+for+Graphs&hl=en&as_sdt=0,44", "gs_version_total": 0, "aff_unique_index": "0;0;0;1;0;0", "aff_unique_norm": "Pennsylvania State University;International Business Machines Corporation", "aff_unique_dep": ";", "aff_unique_url": "https://www.psu.edu;https://www.ibm.com", "aff_unique_abbr": "PSU;IBM", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "United States" }, { "title": "Geometrically Aligned Transfer Encoder for Inductive Transfer in Regression Tasks", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19485", "id": "3z60EWfh1p", "author_site": "Sung Moon Ko, Sumin Lee, Dae-Woong Jeong, Woohyung Lim, Sehui Han", "tldr": "", "abstract": "Transfer learning is a crucial technique for handling a small amount of data that is potentially related to other abundant data. However, most of the existing methods are focused on classification tasks using images and language datasets. Therefore, in order to expand the transfer learning scheme to regression tasks, we propose a novel transfer technique based on differential geometry, namely the Geometrically Aligned Transfer Encoder (${\\it GATE}$). In this method, we interpret the latent vectors from the model to exist on a Riemannian curved manifold. We find a proper diffeomorphism between pairs of tasks to ensure that every arbitrary point maps to a locally flat coordinate in the overlapping region, allowing the transfer of knowledge from the source to the target data. This also serves as an effective regularizer for the model to behave in extrapolation regions. 
In this article, we demonstrate that ${\\it GATE}$ outperforms conventional methods and exhibits stable behavior in both the latent space and extrapolation regions for various molecular graph datasets.", "keywords": "Transfer Learning;Inductive Transfer;Geometrical Deeplearning;Regression", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "/attachment/6f3c2c8e33c955955cfe00ae0297256536311fc8.zip", "author": "Sung Moon Ko;Sumin Lee;Dae-Woong Jeong;Woohyung Lim;Sehui Han", "authorids": "~Sung_Moon_Ko1;~Sumin_Lee4;~Dae-Woong_Jeong1;~Woohyung_Lim1;~Sehui_Han1", "gender": "M;;M;M;F", "homepage": ";;;;", "dblp": "329/4280;;;86/7195;323/8751", "google_scholar": ";;https://scholar.google.co.kr/citations?hl=en;https://scholar.google.co.kr/citations?user=gtvxdcUAAAAJ;", "orcid": ";0009-0006-9077-2435;;0000-0003-0525-9065;", "linkedin": "sungmoonko/;sumin-lee-781138273/;;woohyunglim/;sehui-han-817a90182/", "or_profile": "~Sung_Moon_Ko1;~Sumin_Lee4;~Dae-Woong_Jeong1;~Woohyung_Lim1;~Sehui_Han1", "aff": "LG AI Research;LG AI Research;LG AI Research;LG AI Research;LG AI Research", "aff_domain": "lgresearch.ai;lgresearch.ai;lgresearch.ai;lgresearch.ai;lgresearch.ai", "position": "Researcher;Researcher;Researcher;Vice President;Researcher", "bibtex": "@inproceedings{\nko2024geometrically,\ntitle={Geometrically Aligned Transfer Encoder for Inductive Transfer in Regression Tasks},\nauthor={Sung Moon Ko and Sumin Lee and Dae-Woong Jeong and Woohyung Lim and Sehui Han},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=3z60EWfh1p}\n}", "github": "", "project": "", "reviewers": "NCqT;nPy4;6Cr1;Gg1C", "pdf_size": 846519, "rating": "5;6;6;8", "confidence": "4;3;3;2", "soundness": "2;3;3;2", "contribution": "2;3;3;3", "presentation": "3;3;2;2", "wc_summary": "104;204;33;132", "wc_strengths": "64;93;47;97", "wc_weaknesses": "69;235;114;144", "wc_questions": "114;60;126;100", "wc_review": "351;592;320;473", "wc_reply_reviewers": "0;215;30;252", "wc_reply_authors": "627;757;614;771", "reply_reviewers": "0;1;1;1", "reply_authors": "1;1;1;1", "rating_avg": [ 6.25, 1.0897247358851685 ], "confidence_avg": [ 3.0, 0.7071067811865476 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 118.25, 61.26326386995717 ], "wc_strengths_avg": [ 75.25, 20.69269194667528 ], "wc_weaknesses_avg": [ 140.5, 60.73919657025437 ], "wc_questions_avg": [ 100.0, 24.859605789312106 ], "wc_review_avg": [ 434.0, 107.66847263707236 ], "wc_reply_reviewers_avg": [ 124.25, 110.54043377877618 ], "wc_reply_authors_avg": [ 692.25, 72.06724290549764 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.9733285267845754, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=844556749006184771&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=3z60EWfh1p", "pdf": "https://openreview.net/pdf?id=3z60EWfh1p", "email": "lgresearch.ai;lgresearch.ai;lgresearch.ai;lgresearch.ai;lgresearch.ai", "author_num": 5, "aff_unique_index": "0;0;0;0;0", "aff_unique_norm": "LG", "aff_unique_dep": "LG AI Research", "aff_unique_url": "https://www.lgaires.com", "aff_unique_abbr": "LG AI", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": 
"0;0;0;0;0", "aff_country_unique": "South Korea" }, { "title": "On-Policy Distillation of Language Models: Learning from Self-Generated Mistakes", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19484", "id": "3zKtaqxLhW", "author_site": "Rishabh Agarwal, Nino Vieillard, Yongchao Zhou, Piotr Stanczyk, Sabela Ramos Garea, Matthieu Geist, Olivier Bachem", "tldr": "", "abstract": "Knowledge distillation (KD) is widely used for compressing a teacher model to reduce its inference cost and memory footprint, by training a smaller student model. However, current KD methods for auto-regressive sequence models suffer from distribution mismatch between output sequences seen during training and those generated by the student during inference. To address this issue, we introduce Generalized Knowledge Distillation (GKD). Instead of solely relying on a fixed set of output sequences, GKD trains the student on its self-generated output sequences by leveraging feedback from the teacher on such sequences. Unlike supervised KD approaches, GKD also offers the flexibility to employ alternative loss functions between the student and teacher, which can be useful when the student lacks the expressivity to mimic the teacher's distribution. Furthermore, GKD facilitates the seamless integration of distillation with RL fine-tuning (RLHF). We demonstrate the efficacy of GKD for distilling auto-regressive T5 language models on summarization, translation, and arithmetic reasoning tasks.", "keywords": "Language models;Distillation;RLHF", "primary_area": "generative models", "supplementary_material": "", "author": "Rishabh Agarwal;Nino Vieillard;Yongchao Zhou;Piotr Stanczyk;Sabela Ramos Garea;Matthieu Geist;Olivier Bachem", "authorids": "~Rishabh_Agarwal2;~Nino_Vieillard1;~Yongchao_Zhou1;~Piotr_Stanczyk1;~Sabela_Ramos_Garea1;~Matthieu_Geist1;~Olivier_Bachem1", "gender": "M;;M;M;F;M;M", "homepage": "https://agarwl.github.io;;;;https://scholar.google.com/citations?user=97trlAkAAAAJ&hl=en;;http://www.olivierbachem.ch/", "dblp": ";243/5918;;;;38/6508;https://dblp.org/pers/hd/b/Bachem:Olivier", "google_scholar": "https://scholar.google.ca/citations?user=aH8AJu4AAAAJ;https://scholar.google.fr/citations?user=4jua80IAAAAJ;35M6rhsAAAAJ;fKVK0dYAAAAJ;97trlAkAAAAJ;ectPLEUAAAAJ;https://scholar.google.ch/citations?user=mW9BcgsAAAAJ", "orcid": ";;;;;;", "linkedin": ";;yongchao-zhou-a298a7158/;;;;olivier-bachem-10257756/", "or_profile": "~Rishabh_Agarwal2;~Nino_Vieillard1;~Yongchao_Zhou1;~Piotr_Stanczyk1;~Sabela_Ramos_Garea1;~Matthieu_Geist1;~Olivier_Bachem1", "aff": "Google DeepMind;Google Deepmind;University of Toronto;;University of A Coru\u00f1a;Google;Google Brain", "aff_domain": "google.com;google.com;mail.utoronto.ca;;udc.es;google.com;google.com", "position": "Research Scientist;Researcher;PhD student;;PhD student;Researcher;Research scientist", "bibtex": "@inproceedings{\nagarwal2024onpolicy,\ntitle={On-Policy Distillation of Language Models: Learning from Self-Generated Mistakes},\nauthor={Rishabh Agarwal and Nino Vieillard and Yongchao Zhou and Piotr Stanczyk and Sabela Ramos Garea and Matthieu Geist and Olivier Bachem},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=3zKtaqxLhW}\n}", "github": "", "project": "", "reviewers": "Jqut;YEFj;Qwi5;HokL", "pdf_size": 671860, "rating": "6;6;6;8", "confidence": "3;3;3;3", "soundness": "3;3;2;3", "contribution": "3;2;2;3", "presentation": "3;3;3;3", "wc_summary": 
"107;61;44;80", "wc_strengths": "151;35;57;61", "wc_weaknesses": "116;30;106;119", "wc_questions": "94;26;2;59", "wc_review": "468;152;209;319", "wc_reply_reviewers": "0;0;24;14", "wc_reply_authors": "628;255;502;514", "reply_reviewers": "0;0;1;1", "reply_authors": "1;1;1;1", "rating_avg": [ 6.5, 0.8660254037844386 ], "confidence_avg": [ 3.0, 0.0 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 73.0, 23.39871791359518 ], "wc_strengths_avg": [ 76.0, 44.41846462902562 ], "wc_weaknesses_avg": [ 92.75, 36.54705870518173 ], "wc_questions_avg": [ 45.25, 34.665364558879226 ], "wc_review_avg": [ 287.0, 120.51348472266496 ], "wc_reply_reviewers_avg": [ 9.5, 10.136567466356647 ], "wc_reply_authors_avg": [ 474.75, 136.06868669903446 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 109, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=17644314409470129095&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=3zKtaqxLhW", "pdf": "https://openreview.net/pdf?id=3zKtaqxLhW", "email": "google.com;google.com;mail.utoronto.ca;;udc.es;google.com;google.com", "author_num": 7, "aff_unique_index": "0;1;2;3;0;0", "aff_unique_norm": "Google;DeepMind;University of Toronto;University of A Coru\u00f1a", "aff_unique_dep": "Google DeepMind;DeepMind;;", "aff_unique_url": "https://deepmind.com;https://deepmind.com;https://www.utoronto.ca;https://www.udc.es", "aff_unique_abbr": "DeepMind;DeepMind;U of T;UDC", "aff_campus_unique_index": "1;1", "aff_campus_unique": ";Mountain View", "aff_country_unique_index": "0;0;1;2;3;3", "aff_country_unique": "United Kingdom;Canada;Spain;United States" }, { "title": "REBAR: Retrieval-Based Reconstruction for Time-series Contrastive Learning", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19483", "id": "3zQo5oUvia", "author_site": "Maxwell Xu, Alexander Moreno, Hui Wei, Benjamin M Marlin, James Rehg", "tldr": "", "abstract": "The success of self-supervised contrastive learning hinges on identifying positive data pairs, such that when they are pushed together in embedding space, the space encodes useful information for subsequent downstream tasks. Constructing positive pairs is non-trivial as the pairing must be similar enough to reflect a shared semantic meaning, but different enough to capture within-class variation. Classical approaches in vision use augmentations to exploit well-established invariances to construct positive pairs, but invariances in the time-series domain are much less obvious. In our work, we propose a novel method of using a learned measure for identifying positive pairs. Our Retrieval-Based Reconstruction (REBAR) measure measures the similarity between two sequences as the reconstruction error that results from reconstructing one sequence with retrieved information from the other. Then, if the two sequences have high REBAR similarity, we label them as a positive pair. Through validation experiments, we show that the REBAR error is a predictor of mutual class membership. 
Once integrated into a contrastive learning framework, our REBAR method learns an embedding that achieves state-of-the-art performance on downstream tasks across various modalities.", "keywords": "time-series;contrastive learning;masked reconstruction;self-supervised learning;imputation;unsupervised learning", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/c86726dbbfe0b277c6a2e05cefadb1c1da643426.pdf", "author": "Maxwell Xu;Alexander Moreno;Hui Wei;Benjamin Marlin;James Matthew Rehg", "authorids": "~Maxwell_Xu1;~Alexander_Moreno1;~Hui_Wei3;~Benjamin_Marlin1;~James_Matthew_Rehg1", "gender": ";M;M;M;M", "homepage": "https://maxxu05.github.io/;;https://wll199566.github.io/davidhuiwei.github.io/;https://groups.cs.umass.edu/marlin/;http://rehg.org/", "dblp": ";161/6588;;03/7058.html;r/JMRehg", "google_scholar": "https://scholar.google.com/citations?view_op=list_works;zoqP2-IAAAAJ;;ey960FIAAAAJ;https://scholar.google.com.tw/citations?user=8kA3eDwAAAAJ", "orcid": ";;;0000-0002-2626-3410;0000-0003-1793-5462", "linkedin": ";;;;", "or_profile": "~Maxwell_Xu1;~Alexander_Moreno1;~Hui_Wei3;~Benjamin_Marlin1;~James_Rehg1", "aff": "University of Illinois, Urbana Champaign;STR;University of Massachusetts Amherst;University of Massachusetts at Amherst;University of Illinois, Urbana Champaign", "aff_domain": "illinois.edu;str.edu;cs.umass.edu;umass.edu;illinois.edu", "position": "PhD student;Researcher;Researcher;Associate Professor;Full Professor", "bibtex": "@inproceedings{\nxu2024rebar,\ntitle={{REBAR}: Retrieval-Based Reconstruction for Time-series Contrastive Learning},\nauthor={Maxwell Xu and Alexander Moreno and Hui Wei and Benjamin Marlin and James Matthew Rehg},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=3zQo5oUvia}\n}", "github": "", "project": "", "reviewers": "mFnV;gCTH;jiyG;Hx4L", "pdf_size": 5845969, "rating": "5;5;6;8", "confidence": "3;4;3;4", "soundness": "3;2;2;3", "contribution": "2;2;2;3", "presentation": "2;3;2;3", "wc_summary": "92;37;72;34", "wc_strengths": "12;88;93;95", "wc_weaknesses": "131;137;293;113", "wc_questions": "135;80;39;5", "wc_review": "370;342;497;247", "wc_reply_reviewers": "34;0;38;0", "wc_reply_authors": "2303;1495;1870;370", "reply_reviewers": "1;0;2;0", "reply_authors": "4;2;3;1", "rating_avg": [ 6.0, 1.224744871391589 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 58.75, 24.324627438051337 ], "wc_strengths_avg": [ 72.0, 34.734708865916815 ], "wc_weaknesses_avg": [ 168.5, 72.42064622743986 ], "wc_questions_avg": [ 64.75, 48.478732450426136 ], "wc_review_avg": [ 364.0, 89.30005599102388 ], "wc_reply_reviewers_avg": [ 18.0, 18.05547008526779 ], "wc_reply_authors_avg": [ 1509.5, 717.3341271680862 ], "reply_reviewers_avg": [ 0.75, 0.82915619758885 ], "reply_authors_avg": [ 2.5, 1.118033988749895 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.40824829046386296, "gs_citation": 9, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14225911127705256116&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 7, "openreview": "https://openreview.net/forum?id=3zQo5oUvia", "pdf": "https://openreview.net/pdf?id=3zQo5oUvia", "email": "illinois.edu;str.edu;cs.umass.edu;umass.edu;illinois.edu", "author_num": 5, "aff_unique_index": 
"0;2;2;0", "aff_unique_norm": "University of Illinois Urbana-Champaign;;University of Massachusetts Amherst", "aff_unique_dep": ";;", "aff_unique_url": "https://illinois.edu;;https://www.umass.edu", "aff_unique_abbr": "UIUC;;UMass Amherst", "aff_campus_unique_index": "0;2;2;0", "aff_campus_unique": "Urbana-Champaign;;Amherst", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States;" }, { "title": "DORSal: Diffusion for Object-centric Representations of Scenes $\\textit{et al.}$", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19482", "id": "3zvB14IF6D", "author_site": "Allan Jabri, Sjoerd van Steenkiste, Emiel Hoogeboom, Mehdi S. M. Sajjadi, Thomas Kipf", "tldr": "", "abstract": "Recent progress in 3D scene understanding enables scalable learning of representations across large datasets of diverse scenes. As a consequence, generalization to unseen scenes and objects, rendering novel views from just a single or a handful of input images, and controllable scene generation that supports editing, is now possible. However, training jointly on a large number of scenes typically compromises rendering quality when compared to single-scene optimized models such as NeRFs. In this paper, we leverage recent progress in diffusion models to equip 3D scene representation learning models with the ability to render high-fidelity novel views, while retaining benefits such as object-level scene editing to a large degree. In particular, we propose DORSal, which adapts a video diffusion architecture for 3D scene generation conditioned on frozen object-centric slot-based representations of scenes. On both complex synthetic multi-object scenes and on the real-world large-scale Street View dataset, we show that DORSal enables scalable neural rendering of 3D scenes with object-level editing and improves upon existing approaches.", "keywords": "novel view synthesis;object-centric scene representations;camera control;scene editing;3D;diffusion;generative models", "primary_area": "generative models", "supplementary_material": "/attachment/ca67852edc6143b7cc616754dc453757a5449790.zip", "author": "Allan Jabri;Sjoerd van Steenkiste;Emiel Hoogeboom;Mehdi S. M. Sajjadi;Thomas Kipf", "authorids": "~Allan_Jabri2;~Sjoerd_van_Steenkiste1;~Emiel_Hoogeboom1;~Mehdi_S._M._Sajjadi1;~Thomas_Kipf2", "gender": ";M;;Unspecified;M", "homepage": "http://ajabri.github.io;http://www.sjoerdvansteenkiste.com/;;http://msajjadi.com;http://tkipf.github.io/", "dblp": "172/0858;183/9326;217/1488;164/6190;186/8206", "google_scholar": ";i-AStBYAAAAJ;https://scholar.google.nl/citations?user=nkTd_BIAAAAJ;https://scholar.google.de/citations?user=rHF25YEAAAAJ;83HL5FwAAAAJ", "orcid": ";;;0000-0002-6002-2370;", "linkedin": ";;;;thomas-kipf-6b260410a", "or_profile": "~Allan_Jabri2;~Sjoerd_van_Steenkiste1;~Emiel_Hoogeboom1;~Mehdi_S._M._Sajjadi1;~Thomas_N._Kipf1", "aff": ";Google;Google;Google DeepMind;Google", "aff_domain": ";google.com;google.com;google.com;google.com", "position": ";Researcher;Researcher;Researcher;Research Scientist", "bibtex": "@inproceedings{\njabri2024dorsal,\ntitle={{DORS}al: Diffusion for Object-centric Representations of Scenes \\${\\textbackslash}textit\\{et al.\\}\\$},\nauthor={Allan Jabri and Sjoerd van Steenkiste and Emiel Hoogeboom and Mehdi S. M. 
Sajjadi and Thomas Kipf},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=3zvB14IF6D}\n}", "github": "", "project": "", "reviewers": "16Uh;J43q;dJMA;jJcr", "pdf_size": 16061122, "rating": "5;6;6;6", "confidence": "5;4;4;3", "soundness": "3;3;4;3", "contribution": "2;3;3;3", "presentation": "3;3;3;3", "wc_summary": "99;56;43;69", "wc_strengths": "73;65;71;127", "wc_weaknesses": "138;50;270;126", "wc_questions": "49;99;376;2", "wc_review": "359;270;760;324", "wc_reply_reviewers": "189;156;242;112", "wc_reply_authors": "814;1386;2000;470", "reply_reviewers": "1;1;2;1", "reply_authors": "2;3;4;1", "rating_avg": [ 5.75, 0.4330127018922193 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 66.75, 20.765054779605084 ], "wc_strengths_avg": [ 84.0, 25.0 ], "wc_weaknesses_avg": [ 146.0, 79.14543574963751 ], "wc_questions_avg": [ 131.5, 145.26957699394598 ], "wc_review_avg": [ 428.25, 194.14218372110685 ], "wc_reply_reviewers_avg": [ 174.75, 47.47301865270419 ], "wc_reply_authors_avg": [ 1167.5, 581.435078061171 ], "reply_reviewers_avg": [ 1.25, 0.4330127018922193 ], "reply_authors_avg": [ 2.5, 1.118033988749895 ], "replies_avg": [ 22, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.816496580927726, "gs_citation": -1, "gs_cited_by_link": "", "gs_version_total": -1, "openreview": "https://openreview.net/forum?id=3zvB14IF6D", "pdf": "https://openreview.net/pdf?id=3zvB14IF6D", "email": ";google.com;google.com;google.com;google.com", "author_num": 5, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "Google", "aff_unique_dep": "Google", "aff_unique_url": "https://www.google.com", "aff_unique_abbr": "Google", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Mountain View;", "aff_country_unique_index": "0;0;1;0", "aff_country_unique": "United States;United Kingdom" }, { "id": "41CYtxM2jQ", "title": "Boosting Fast and High-Quality Speech Synthesis with Linear Diffusion", "track": "main", "status": "Reject", "tldr": "", "abstract": "Denoising diffusion probabilistic models have shown extraordinary ability on various generative tasks. However, their slow inference speed renders them impractical in speech synthesis. This paper proposes a linear diffusion model (LinDiff) based on an ordinary differential equation to simultaneously reach fast inference and high sample quality. We employ linear interpolation between the target and noise to design a diffusion sequence for training, whereas in prior work the diffusion path that links the noise and target is a curved segment. When we decrease the number of sampling steps (i.e., the number of line segments used to fit the path), the ease of fitting straight lines compared to curves allows us to generate higher-quality samples from random noise with fewer iterations. To reduce computational complexity and achieve effective global modeling of noisy speech, LinDiff employs a patch-based processing approach that partitions the input signal into small patches. The patch-wise tokens leverage a transformer architecture for effective modeling of global information. Additionally, the model seamlessly integrates the strengths of both transformers and convolutional neural networks by utilizing a post-convolution module for fine-grained detail restoration. 
Adversarial training is further used to improve the sample quality with decreased sampling steps. We test this model on speech synthesis conditioned on acoustic feature (Mel-spectrograms). Experimental results verify that our model can synthesize high-quality speech even with only one diffusion step. Both subjective and objective evaluations demonstrate that our model can synthesize speech of a quality comparable to that of autoregressive models with faster synthesis speed.", "keywords": "Diffusion; Adversarial training; Transformer-based backbone; Speech synthesis; Vocoder", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/e1481d25086b4492c384898eda709029122cd7b4.zip", "author": "Haogeng Liu;Tao Wang;Jie Cao;Ran He;Jianhua Tao", "authorids": "~Haogeng_Liu1;~Tao_Wang7;~Jie_Cao2;~Ran_He1;~Jianhua_Tao1", "gender": "M;M;M;M;", "homepage": "https://github.com/liuhaogeng;https://github.com/hairuo55;https://ttxsjie.github.io/;https://rhe-web.github.io/;", "dblp": ";12/5838-74;39/6191-2;61/6198-1;", "google_scholar": ";bCS6NUoAAAAJ;https://scholar.google.com/citations?hl=en;ayrg9AUAAAAJ;", "orcid": ";0000-0003-1490-6973;0000-0001-6368-4495;0000-0002-3807-991X;", "linkedin": ";;;;", "or_profile": "~Haogeng_Liu1;~Tao_Wang7;~Jie_Cao2;~Ran_He1;~Jianhua_Tao1", "aff": "University of Chinese Academy of Sciences;Institute of Automation, Chinese Academy of Sciences;Institute of Automation, Chinese Academy of Sciences;Institute of Automation, Chinese Academy of Sciences;", "aff_domain": "ucas.ac.cn;ia.ac.cn;ia.ac.cn;ia.ac.cn;", "position": "MS student;Researcher;Associate Professor;Full Professor;", "bibtex": "@misc{\nliu2024boosting,\ntitle={Boosting Fast and High-Quality Speech Synthesis with Linear Diffusion},\nauthor={Haogeng Liu and Tao Wang and Jie Cao and Ran He and Jianhua Tao},\nyear={2024},\nurl={https://openreview.net/forum?id=41CYtxM2jQ}\n}", "github": "", "project": "", "reviewers": "QZgE;JAcM;zJkF;2DZz", "site": "https://openreview.net/forum?id=41CYtxM2jQ", "pdf_size": 568620, "rating": "3;3;5;6", "confidence": "4;5;4;4", "soundness": "2;2;3;3", "contribution": "2;2;3;3", "presentation": "2;3;3;3", "wc_summary": "80;52;59;45", "wc_strengths": "90;45;52;50", "wc_weaknesses": "214;188;138;185", "wc_questions": "1;90;80;5", "wc_review": "385;375;329;285", "wc_reply_reviewers": "0;0;107;0", "wc_reply_authors": "449;463;411;292", "reply_reviewers": "0;0;1;0", "reply_authors": "1;1;1;1", "rating_avg": [ 4.25, 1.299038105676658 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 59.0, 13.095800853708795 ], "wc_strengths_avg": [ 59.25, 17.93564885918544 ], "wc_weaknesses_avg": [ 181.25, 27.39867697535777 ], "wc_questions_avg": [ 44.0, 41.176449579826574 ], "wc_review_avg": [ 343.5, 39.834030677299026 ], "wc_reply_reviewers_avg": [ 26.75, 46.332359102467464 ], "wc_reply_authors_avg": [ 403.75, 67.26579740105666 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.5555555555555555, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=7815464375704137849&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 3, "aff_unique_index": "0;1;1;1", "aff_unique_norm": "University of Chinese Academy of Sciences;Chinese Academy of Sciences", 
"aff_unique_dep": ";Institute of Automation", "aff_unique_url": "http://www.ucas.ac.cn;http://www.ia.cas.cn", "aff_unique_abbr": "UCAS;CAS", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "China" }, { "title": "Neural Rate Control for Learned Video Compression", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19481", "id": "42lcaojZug", "author_site": "yiwei zhang, Guo Lu, Yunuo Chen, Shen Wang, Yibo Shi, Jing Wang, Li Song", "tldr": "", "abstract": "The learning-based video compression method has made significant progress in recent years, exhibiting promising compression performance compared with traditional video codecs. However, prior works have primarily focused on advanced compression architectures while neglecting the rate control technique. Rate control can precisely control the coding bitrate with optimal compression performance, which is a critical technique in practical deployment. To address this issue, we present a fully neural network-based rate control system for learned video compression methods. Our system accurately encodes videos at a given bitrate while enhancing the rate-distortion performance. Specifically, we first design a rate allocation model to assign optimal bitrates to each frame based on their varying spatial and temporal characteristics. Then, we propose a deep learning-based rate implementation network to perform the rate-parameter mapping, precisely predicting coding parameters for a given rate. Our proposed rate control system can be easily integrated into existing learning-based video compression methods. The extensive experimental results show that the proposed method achieves accurate rate control on several baseline methods while also improving overall rate-distortion performance.", "keywords": "Video compression;End-to-end;Learning-based video coding;Rate Control.", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Yiwei Zhang;Guo Lu;Yunuo Chen;Shen Wang;Yibo Shi;Jing Wang;Li Song", "authorids": "~Yiwei_Zhang3;~Guo_Lu2;~Yunuo_Chen1;~Shen_Wang4;~Yibo_Shi1;~Jing_Wang18;~Li_Song3", "gender": "M;M;M;M;M;F;M", "homepage": ";https://guolusjtu.github.io/guoluhomepage/;;;https://github.com/wu6shen/;http://w3.huawei.com/next/indexa.html;http://medialab.sjtu.edu.cn", "dblp": ";76/7805;;;;;20/872-1", "google_scholar": "https://scholar.google.com/citations?hl=zh-CN;R9iwlJcAAAAJ;;https://scholar.google.com/citations?view_op=list_works;;;jKIoTVoAAAAJ", "orcid": ";;;;;;", "linkedin": ";;https://www.linkedin.cn/incareer/in/unochenyn;;;;", "or_profile": "~Yiwei_Zhang3;~Guo_Lu2;~Yunuo_Chen1;~Shen_Wang4;~Yibo_Shi1;~Jing_Wang18;~Li_Song3", "aff": "Shanghai Jiaotong University;Shanghai Jiaotong University;Shanghai Jiaotong University;Shanghai Jiaotong University;Huawei Technologies Ltd.;Huawei Technologies Ltd.;Shanghai Jiaotong University", "aff_domain": "sjtu.edu.cn;sjtu.edu.cn;sjtu.edu.cn;sjtu.edu.cn;huawei.com;huawei.com;sjtu.edu.cn", "position": "MS student;Assistant Professor;PhD student;PhD student;Engineer;engineer;Full Professor", "bibtex": "@inproceedings{\nzhang2024neural,\ntitle={Neural Rate Control for Learned Video Compression},\nauthor={Yiwei Zhang and Guo Lu and Yunuo Chen and Shen Wang and Yibo Shi and Jing Wang and Li Song},\nbooktitle={The Twelfth International Conference on Learning 
Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=42lcaojZug}\n}", "github": "", "project": "", "reviewers": "c8Ca;cdDb;gAxb;Tpyi", "pdf_size": 1652401, "rating": "5;6;8;8", "confidence": "5;4;5;4", "soundness": "3;3;3;2", "contribution": "2;2;4;3", "presentation": "3;2;4;4", "wc_summary": "102;60;73;122", "wc_strengths": "57;68;93;107", "wc_weaknesses": "224;39;77;113", "wc_questions": "4;53;45;60", "wc_review": "387;220;288;402", "wc_reply_reviewers": "0;0;0;29", "wc_reply_authors": "594;518;420;644", "reply_reviewers": "0;0;0;1", "reply_authors": "1;1;1;2", "rating_avg": [ 6.75, 1.299038105676658 ], "confidence_avg": [ 4.5, 0.5 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.82915619758885 ], "presentation_avg": [ 3.25, 0.82915619758885 ], "wc_summary_avg": [ 89.25, 24.262883175748097 ], "wc_strengths_avg": [ 81.25, 19.778460506318485 ], "wc_weaknesses_avg": [ 113.25, 69.08825877093734 ], "wc_questions_avg": [ 40.5, 21.73131381210073 ], "wc_review_avg": [ 324.25, 74.43915300431621 ], "wc_reply_reviewers_avg": [ 7.25, 12.55736835487436 ], "wc_reply_authors_avg": [ 544.0, 84.4866853415377 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.19245008972987526, "gs_citation": 6, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=13934198905050538246&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 2, "openreview": "https://openreview.net/forum?id=42lcaojZug", "pdf": "https://openreview.net/pdf?id=42lcaojZug", "email": "sjtu.edu.cn;sjtu.edu.cn;sjtu.edu.cn;sjtu.edu.cn;huawei.com;huawei.com;sjtu.edu.cn", "author_num": 7, "aff_unique_index": "0;0;0;0;1;1;0", "aff_unique_norm": "Shanghai Jiao Tong University;Huawei", "aff_unique_dep": ";Huawei Technologies", "aff_unique_url": "https://www.sjtu.edu.cn;https://www.huawei.com", "aff_unique_abbr": "SJTU;Huawei", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0;0", "aff_country_unique": "China" }, { "id": "43WKxTuJxu", "title": "Orthogonal Function Representations for Continuous Armed Bandits", "track": "main", "status": "Reject", "tldr": "", "abstract": "This paper addresses the continuous-armed bandit problem, which is a generalization of the standard bandit problem where the action space is a d\u2212dimensional\nhypercube $X = [\u22121, 1]^d$ and the reward is an s\u2212times differentiable function\n$f : \\mathcal X \u2192 \\mathbb R$. Traditionally, this problem is solved by assuming an implicit feature\nrepresentation in a Reproducing Kernel Hilbert Space (RKHS), where the objective\nfunction is linear in this transformation of $\\mathcal X$ . In addition to this additional intake,\nthis comes at the cost of overwhelming computational complexity. In contrast, we\npropose an explicit representation using an orthogonal feature map (Fourier, Legendre) to reduce the problem to a linear bandit with misspecification. 
As a result,\nwe develop two algorithms _OB-LinUCB_ and _OB-PE_, achieving state-of-the-art\nperformance in terms of regret and computational complexity.", "keywords": "Continuous armed bandit;Orthogonal functions;Linear bandits;Smoothness", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/1e1138329da248be4fb0c3134d81d3369f288b3b.pdf", "author": "Davide Maran;Marcello Restelli", "authorids": "~Davide_Maran1;~Marcello_Restelli1", "gender": "M;M", "homepage": "https://davidezfc.github.io/;http://home.deib.polimi.it/restelli/", "dblp": "320/3835;64/1011", "google_scholar": "https://scholar.google.it/citations?user=a8i0X8oAAAAJ;https://scholar.google.com.tw/citations?user=xdgxRiEAAAAJ", "orcid": ";0000-0002-6322-1076", "linkedin": "davide-maran/;", "or_profile": "~Davide_Maran1;~Marcello_Restelli1", "aff": "Polytechnic Institute of Milan;Politecnico di Milano", "aff_domain": "polimi.it;polimi.it", "position": "PhD student;Associate Professor", "bibtex": "@misc{\nmaran2024orthogonal,\ntitle={Orthogonal Function Representations for Continuous Armed Bandits},\nauthor={Davide Maran and Marcello Restelli},\nyear={2024},\nurl={https://openreview.net/forum?id=43WKxTuJxu}\n}", "github": "", "project": "", "reviewers": "DACT;hB5r;hchS;MY3R", "site": "https://openreview.net/forum?id=43WKxTuJxu", "pdf_size": 1833724, "rating": "5;5;5;6", "confidence": "3;3;3;3", "soundness": "2;3;2;4", "contribution": "2;2;2;3", "presentation": "2;3;2;3", "wc_summary": "69;110;65;79", "wc_strengths": "70;48;29;55", "wc_weaknesses": "211;226;239;61", "wc_questions": "151;223;84;89", "wc_review": "501;607;417;284", "wc_reply_reviewers": "106;74;66;58", "wc_reply_authors": "487;594;724;518", "reply_reviewers": "1;1;1;1", "reply_authors": "1;1;2;2", "rating_avg": [ 5.25, 0.4330127018922193 ], "confidence_avg": [ 3.0, 0.0 ], "soundness_avg": [ 2.75, 0.82915619758885 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 80.75, 17.640507362318125 ], "wc_strengths_avg": [ 50.5, 14.739402972983676 ], "wc_weaknesses_avg": [ 184.25, 71.84488499538433 ], "wc_questions_avg": [ 136.75, 56.35767472137224 ], "wc_review_avg": [ 452.25, 118.18920212946698 ], "wc_reply_reviewers_avg": [ 76.0, 18.2208671582886 ], "wc_reply_authors_avg": [ 580.75, 91.40944973032055 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:txoEUwjSWvIJ:scholar.google.com/&scioq=Orthogonal+Function+Representations+for+Continuous+Armed+Bandits&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1", "aff_unique_norm": "Polytechnic Institute of Milan;Politecnico di Milano", "aff_unique_dep": ";", "aff_unique_url": "https://www.polimi.it/;https://www.polimi.it", "aff_unique_abbr": "Politecnico di Milano;Polimi", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "Italy" }, { "title": "Understanding Expressivity of GNN in Rule Learning", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19480", "id": "43cYe4oogi", "author_site": "Haiquan Qiu, Yongqi Zhang, Yong Li, Quanming Yao", "tldr": "", "abstract": "Rule learning is critical to improving knowledge graph (KG) reasoning due to their ability to provide logical and interpretable explanations. 
Recently, Graph Neural Networks (GNNs) with tail entity scoring achieve the state-of-the-art performance on KG reasoning. However, the theoretical understandings for these GNNs are either lacking or focusing on single-relational graphs, leaving what the kind of rules these GNNs can learn an open problem. We propose to fill the above gap in this paper. Specifically, GNNs with tail entity scoring are unified into a common framework. Then, we analyze their expressivity by formally describing the rule structures they can learn and theoretically demonstrating their superiority. These results further inspire us to propose a novel labeling strategy to learn more rules in KG reasoning. Experimental results are consistent with our theoretical findings and verify the effectiveness of our proposed method. The code is publicly available at https://github.com/LARS-research/Rule-learning-expressivity.", "keywords": "Graph Neural Networks;KG reasoning;Link prediction;Rule learning;Expressivity", "primary_area": "learning on graphs and other geometries & topologies", "supplementary_material": "", "author": "Haiquan Qiu;Yongqi Zhang;Yong Li;quanming yao", "authorids": "~Haiquan_Qiu1;~Yongqi_Zhang2;~Yong_Li7;~quanming_yao1", "gender": "M;M;M;M", "homepage": ";https://yzhangee.github.io/;http://fi.ee.tsinghua.edu.cn/~liyong/;https://lars-group.github.io/", "dblp": "01/1435;;;158/1014", "google_scholar": "JoumqGMAAAAJ;https://scholar.google.com.hk/citations?user=nVk-7EAAAAAJ;https://scholar.google.com/citations?hl=en;https://scholar.google.com/schhp?hl=en", "orcid": "0000-0001-5202-4950;0000-0003-2085-7418;;", "linkedin": ";;;", "or_profile": "~Haiquan_Qiu1;~Yongqi_Zhang2;~Yong_Li7;~quanming_yao1", "aff": "Tsinghua University;4Paradigm. Inc;Tsinghua University;Department of Electronic Engineering", "aff_domain": "tsinghua.edu.cn;4paradigm.com;tsinghua.edu.cn;tsinghua.edu.cn", "position": "PhD student;Researcher;Full Professor;Assistant Professor", "bibtex": "@inproceedings{\nqiu2024understanding,\ntitle={Understanding Expressivity of {GNN} in Rule Learning},\nauthor={Haiquan Qiu and Yongqi Zhang and Yong Li and quanming yao},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=43cYe4oogi}\n}", "github": "", "project": "", "reviewers": "NwzR;S7Jh;zRzb;TfWh", "pdf_size": 924751, "rating": "5;6;6;8", "confidence": "3;3;3;3", "soundness": "3;3;3;3", "contribution": "2;3;3;3", "presentation": "2;3;3;3", "wc_summary": "63;117;92;85", "wc_strengths": "115;138;60;56", "wc_weaknesses": "685;104;51;1", "wc_questions": "43;53;11;63", "wc_review": "906;412;214;205", "wc_reply_reviewers": "60;12;0;0", "wc_reply_authors": "1770;768;109;198", "reply_reviewers": "1;1;0;0", "reply_authors": "5;2;1;1", "rating_avg": [ 6.25, 1.0897247358851685 ], "confidence_avg": [ 3.0, 0.0 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 89.25, 19.266226926930972 ], "wc_strengths_avg": [ 92.25, 35.23049105533444 ], "wc_weaknesses_avg": [ 210.25, 276.506216024161 ], "wc_questions_avg": [ 42.5, 19.512816301087856 ], "wc_review_avg": [ 434.25, 284.6527489767137 ], "wc_reply_reviewers_avg": [ 18.0, 24.73863375370596 ], "wc_reply_authors_avg": [ 711.25, 661.4950396639418 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 2.25, 1.6393596310755 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 3, 
"gs_cited_by_link": "https://scholar.google.com/scholar?cites=9819222418001393982&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=43cYe4oogi", "pdf": "https://openreview.net/pdf?id=43cYe4oogi", "email": "tsinghua.edu.cn;4paradigm.com;tsinghua.edu.cn;tsinghua.edu.cn", "author_num": 4, "aff_unique_index": "0;1;0;2", "aff_unique_norm": "Tsinghua University;4Paradigm;Institution Name Not Provided", "aff_unique_dep": ";;Department of Electronic Engineering", "aff_unique_url": "https://www.tsinghua.edu.cn;https://www.4paradigm.com/;", "aff_unique_abbr": "THU;;", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "China;" }, { "id": "43flsheS4s", "title": "Improving Robustness and Accuracy with Retrospective Online Adversarial Distillation", "track": "main", "status": "Reject", "tldr": "", "abstract": "Adversarial distillation (AD), transferring knowledge of a robust teacher model to a student model, has emerged as an advanced technique for improving robustness against adversarial attacks. However, AD in general suffers from the high computational complexity of pre-training the robust teacher, and the inherent trade-off between robustness and natural accuracy (i.e., accuracy on clean data). To address these issues, we propose retrospective online adversarial distillation (ROAD). ROAD exploits the student itself of the last epoch and a natural model (i.e., a model trained with clean data) as teachers, instead of a pre-trained robust teacher in the conventional AD. We revealed both theoretically and empirically that knowledge distillation from the student of the last epoch allows to penalize overly confident predictions on adversarial examples, leading to improved robustness and generalization. Also, the student and the natural model are trained together in a collaborative manner, which enables to improve natural accuracy of the student more effectively. 
We demonstrate by extensive experiments that ROAD achieved outstanding performance in both robustness and natural accuracy with substantially reduced training time and computation cost.", "keywords": "Adversarial Training;Adversarial Distillation;Knowledge Distillation", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/0749a3ea8221caa3779abfa552ee30856ee426b4.zip", "author": "Joongsu Kim;Junhyung Jo;Suha Kwak;Young-Joo Suh", "authorids": "~Joongsu_Kim2;~Junhyung_Jo1;~Suha_Kwak3;~Young-Joo_Suh1", "gender": ";M;M;M", "homepage": ";;https://suhakwak.github.io/;http://monet.postech.ac.kr/yjsuh/", "dblp": ";;65/6173;91/4495", "google_scholar": ";https://scholar.google.co.kr/citations?view_op=list_works;-gscDIEAAAAJ;https://scholar.google.com.tw/citations?user=MW-4uU4AAAAJ", "orcid": ";;;", "linkedin": ";;;", "or_profile": "~Joongsu_Kim2;~Junhyung_Jo1;~Suha_Kwak3;~Young-Joo_Suh1", "aff": ";Pohang University of Science and Technology;POSTECH;Pohang University of Science and Technology", "aff_domain": ";postech.edu;postech.ac.kr;postech.edu", "position": ";MS student;Associate Professor;Full Professor", "bibtex": "@misc{\nkim2024improving,\ntitle={Improving Robustness and Accuracy with Retrospective Online Adversarial Distillation},\nauthor={Joongsu Kim and Junhyung Jo and Suha Kwak and Young-Joo Suh},\nyear={2024},\nurl={https://openreview.net/forum?id=43flsheS4s}\n}", "github": "", "project": "", "reviewers": "m9Uu;FC1d;cBNA;zap7", "site": "https://openreview.net/forum?id=43flsheS4s", "pdf_size": 3313956, "rating": "3;5;5;6", "confidence": "5;5;4;4", "soundness": "2;3;3;3", "contribution": "2;2;3;3", "presentation": "3;3;1;3", "wc_summary": "90;50;102;75", "wc_strengths": "39;30;62;56", "wc_weaknesses": "376;104;300;169", "wc_questions": "282;2;86;60", "wc_review": "787;186;550;360", "wc_reply_reviewers": "296;59;0;0", "wc_reply_authors": "1285;684;728;559", "reply_reviewers": "1;1;0;0", "reply_authors": "3;1;1;1", "rating_avg": [ 4.75, 1.0897247358851685 ], "confidence_avg": [ 4.5, 0.5 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.5, 0.8660254037844386 ], "wc_summary_avg": [ 79.25, 19.40843888621648 ], "wc_strengths_avg": [ 46.75, 12.833062767710599 ], "wc_weaknesses_avg": [ 237.25, 106.77400198550207 ], "wc_questions_avg": [ 107.5, 105.23663810669743 ], "wc_review_avg": [ 470.75, 223.4069996665279 ], "wc_reply_reviewers_avg": [ 88.75, 122.05608342069641 ], "wc_reply_authors_avg": [ 814.0, 278.9094835246733 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.5, 0.8660254037844386 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.6882472016116854, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:XhI7sl2au9wJ:scholar.google.com/&scioq=Improving+Robustness+and+Accuracy+with+Retrospective+Online+Adversarial+Distillation&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;0;0", "aff_unique_norm": "Pohang University of Science and Technology", "aff_unique_dep": "", "aff_unique_url": "https://www.postech.ac.kr", "aff_unique_abbr": "POSTECH", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Pohang", "aff_country_unique_index": "0;0;0", "aff_country_unique": "South Korea" }, { "id": "468KWV14ll", "title": "Exploration and Anti-Exploration with Distributional Random Network Distillation", "track": "main", "status": "Reject", "tldr": "", "abstract": "Exploration remains a 
critical issue in deep reinforcement learning for an agent to attain high returns in unknown environments. Although the prevailing exploration Random Network Distillation (RND) algorithm has been demonstrated to be effective in numerous environments, it often needs more discriminative power in bonus allocation. This paper highlights the ''bonus inconsistency'' issue within RND, pinpointing its primary limitation. To address this issue, we introduce the Distributional RND (DRND), a derivative of the RND. DRND enhances the exploration process by distilling a distribution of random networks and implicitly incorporates pseudo counts to improve the precision of bonus allocation. This refinement encourages agents to engage in more extensive exploration. Our method effectively mitigates the inconsistency issue without introducing significant computational overhead. Both theoretical analysis and experimental results demonstrate the superiority of our approach over the original RND algorithm. Our method excels in challenging online exploration scenarios and effectively serves as an anti-exploration mechanism in D4RL offline tasks.", "keywords": "Reinforcement learning;exploration;anti-exploration", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/b2ceaa769851ff9b67a51b8489c83e58247d08bc.zip", "author": "Kai Yang;Jian Tao;Jiafei Lyu;Xiu Li", "authorids": "~Kai_Yang6;~Jian_Tao5;~Jiafei_Lyu1;~Xiu_Li1", "gender": "M;M;M;F", "homepage": "https://github.com/yk7333;https://orcid.org/0009-0007-8439-3161;;https://thusigsiclab.github.io/thu.github.io/introduction.html", "dblp": ";;278/1503;13/1206-1", "google_scholar": ";;bfgCMr8AAAAJ;https://scholar.google.com/citations?hl=zh-CN", "orcid": ";0009-0007-8439-3161;0000-0001-6616-417X;0000-0003-0403-1923", "linkedin": ";;;", "or_profile": "~Kai_Yang6;~Jian_Tao5;~Jiafei_Lyu1;~Xiu_Li1", "aff": "Tsinghua University;Chaocanshu;Tsinghua University;Tsinghua University", "aff_domain": "tsinghua.edu.cn;chaocanshu.ai;tsinghua.edu.cn;tsinghua.edu.cn", "position": "MS student;Intern;PhD student;Professor", "bibtex": "@misc{\nyang2024exploration,\ntitle={Exploration and Anti-Exploration with Distributional Random Network Distillation},\nauthor={Kai Yang and Jian Tao and Jiafei Lyu and Xiu Li},\nyear={2024},\nurl={https://openreview.net/forum?id=468KWV14ll}\n}", "github": "", "project": "", "reviewers": "4Wh1;u9ew;gfXh", "site": "https://openreview.net/forum?id=468KWV14ll", "pdf_size": 13044600, "rating": "6;6;6", "confidence": "3;2;3", "soundness": "3;2;3", "contribution": "3;2;3", "presentation": "3;3;2", "wc_summary": "70;43;113", "wc_strengths": "32;37;98", "wc_weaknesses": "55;253;343", "wc_questions": "46;153;82", "wc_review": "203;486;636", "wc_reply_reviewers": "0;48;493", "wc_reply_authors": "326;802;1282", "reply_reviewers": "0;2;3", "reply_authors": "2;4;6", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 2.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 75.33333333333333, 28.82514334550461 ], "wc_strengths_avg": [ 55.666666666666664, 30.00370347510824 ], "wc_weaknesses_avg": [ 217.0, 120.29962593458053 ], "wc_questions_avg": [ 93.66666666666667, 44.4547210341289 ], "wc_review_avg": [ 441.6666666666667, 179.52963234209804 ], "wc_reply_reviewers_avg": [ 180.33333333333334, 221.95545098560257 ], "wc_reply_authors_avg": [ 
803.3333333333334, 390.286504449687 ], "reply_reviewers_avg": [ 1.6666666666666667, 1.247219128924647 ], "reply_authors_avg": [ 4.0, 1.632993161855452 ], "replies_avg": [ 23, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 17, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=13786006434311853287&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 6, "aff_unique_index": "0;1;0;0", "aff_unique_norm": "Tsinghua University;Chaocanshu", "aff_unique_dep": ";", "aff_unique_url": "https://www.tsinghua.edu.cn;", "aff_unique_abbr": "THU;", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "China;" }, { "title": "OPTIMAL ROBUST MEMORIZATION WITH RELU NEURAL NETWORKS", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19479", "id": "47hDbAMLbc", "author_site": "Lijia Yu, XIAOSHAN GAO, Lijun Zhang", "tldr": "", "abstract": "Memorization with neural networks is to study the expressive power of neural networks to interpolate a finite classification data set, which is closely related to the generalizability of deep learning. However, the important problem of robust memorization has not been thoroughly studied. In this paper, several basic problems about robust memorization are solved. First, we prove that it is NP-hard to compute neural networks with certain simple structures, which are robust memorization. A network hypothesis space is called optimal robust memorization for a data set if it can achieve robust memorization for any budget less than half the separation bound of the data set. Second, we explicitly construct neural networks with O(N n) parameters for optimal robust memorization of any data set with dimension n and size N . We also give a lower bound for the width of networks to achieve optimal robust memorization. 
Finally, we explicitly construct neural networks with\nO(N n log n) parameters for optimal robust memorization of any binary classification data set by controlling the Lipschitz constant of the network.", "keywords": "Memorization;expressive power of network;optimal robust memorization;computation complexity;Lipschitz constant", "primary_area": "learning theory", "supplementary_material": "", "author": "Lijia Yu;Xiao-Shan Gao;Lijun Zhang", "authorids": "~Lijia_Yu2;~Xiao-Shan_Gao2;~Lijun_Zhang2", "gender": "M;M;M", "homepage": ";http://www.mmrc.iss.ac.cn/~xgao/;", "dblp": "175/8873.html;13/3109;76/4015-1", "google_scholar": ";_se7GmUAAAAJ;", "orcid": ";0000-0003-2021-9395;", "linkedin": ";;", "or_profile": "~Lijia_Yu2;~Xiao-Shan_Gao2;~Lijun_Zhang2", "aff": "Institute of Software, Chinese Academy of Sciences;Academy of Mathematics and Systems Science, Chinese Academy of Sciences, Chinese Academy of Sciences;Chinese Academy of Sciences, Chinese Academy of Sciences", "aff_domain": "ios.ac.cn;amss.ac.cn;ios.ac.cn", "position": "Postdoc;Full Professor;Full Professor", "bibtex": "@inproceedings{\nyu2024optimal,\ntitle={{OPTIMAL} {ROBUST} {MEMORIZATION} {WITH} {RELU} {NEURAL} {NETWORKS}},\nauthor={Lijia Yu and Xiao-Shan Gao and Lijun Zhang},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=47hDbAMLbc}\n}", "github": "", "project": "", "reviewers": "LzNK;Sknc;MXq8", "pdf_size": 556613, "rating": "5;5;8", "confidence": "4;3;3", "soundness": "2;2;4", "contribution": "2;3;3", "presentation": "3;1;4", "wc_summary": "83;113;174", "wc_strengths": "55;47;120", "wc_weaknesses": "237;18;130", "wc_questions": "34;20;129", "wc_review": "409;198;553", "wc_reply_reviewers": "0;27;114", "wc_reply_authors": "636;193;1272", "reply_reviewers": "0;1;2", "reply_authors": "1;2;3", "rating_avg": [ 6.0, 1.4142135623730951 ], "confidence_avg": [ 3.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.9428090415820634 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 1.247219128924647 ], "wc_summary_avg": [ 123.33333333333333, 37.86232369461172 ], "wc_strengths_avg": [ 74.0, 32.69046751985457 ], "wc_weaknesses_avg": [ 128.33333333333334, 89.4141425552406 ], "wc_questions_avg": [ 61.0, 48.42175819470692 ], "wc_review_avg": [ 386.6666666666667, 145.78599231598196 ], "wc_reply_reviewers_avg": [ 47.0, 48.641546028061235 ], "wc_reply_authors_avg": [ 700.3333333333334, 442.8425855262292 ], "reply_reviewers_avg": [ 1.0, 0.816496580927726 ], "reply_authors_avg": [ 2.0, 0.816496580927726 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.5, "gs_citation": 6, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=16558959214918652101&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=47hDbAMLbc", "pdf": "https://openreview.net/pdf?id=47hDbAMLbc", "email": "ios.ac.cn;amss.ac.cn;ios.ac.cn", "author_num": 3, "aff_unique_index": "0;0;0", "aff_unique_norm": "Chinese Academy of Sciences", "aff_unique_dep": "Institute of Software", "aff_unique_url": "http://www.ios.ac.cn", "aff_unique_abbr": "CAS", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "China" }, { "title": "Language Model Decoding as Direct Metrics Optimization", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19478", "id": 
"488A64eOf6", "author_site": "Haozhe Ji, Pei Ke, Hongning Wang, Minlie Huang", "tldr": "", "abstract": "Despite the remarkable advances in language modeling, current mainstream decoding methods still struggle to generate texts that align with human texts across different aspects. In particular, sampling-based methods produce less-repetitive texts which are often disjunctive in discourse, while search-based methods maintain topic coherence at the cost of increased repetition. Overall, these methods fall short in achieving holistic alignment across a broad range of aspects. In this work, we frame decoding from a language model as an optimization problem with the goal of strictly matching the expected performance with human texts measured by multiple metrics of desired aspects simultaneously. The resulting decoding distribution enjoys an analytical solution that scales the input language model distribution via a sequence-level energy function defined by these metrics. And most importantly, we prove that this induced distribution is guaranteed to improve the perplexity on human texts, which suggests a better approximation to the underlying distribution of human texts. To facilitate tractable sampling from this globally normalized distribution, we adopt the Sampling-Importance-Resampling technique. Experiments on various domains and model scales demonstrate the superiority of our method in metrics alignment with human texts and human evaluation over strong baselines.", "keywords": "language model;decoding algorithm;energy-based model", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/386a6d3b337b2bbacdf5441ce0b99bc70037d0a8.zip", "author": "Haozhe Ji;Pei Ke;Hongning Wang;Minlie Huang", "authorids": "~Haozhe_Ji2;~Pei_Ke2;~Hongning_Wang1;~Minlie_Huang1", "gender": "M;M;M;M", "homepage": "https://haozheji.github.io/;https://kepei1106.github.io/;http://www.cs.virginia.edu/~hw5x/;http://coai.cs.tsinghua.edu.cn/hml", "dblp": "222/9546;10/2179;05/6545;", "google_scholar": "EE5Z7mUAAAAJ;W_zPCtEAAAAJ;qkdvKNoAAAAJ;https://scholar.google.com/citations?hl=zh-CN", "orcid": ";;0000-0002-6524-9195;", "linkedin": "%E6%98%8A%E5%93%B2-%E8%AE%A1-69722313b/;;;", "or_profile": "~Haozhe_Ji2;~Pei_Ke2;~Hongning_Wang1;~Minlie_Huang1", "aff": "Tsinghua University;Tsinghua University;Tsinghua University;Tsinghua University", "aff_domain": "tsinghua.edu.cn;tsinghua.edu.cn;tsinghua.edu.cn;tsinghua.edu.cn", "position": "PhD student;Postdoc;Associate Professor;Full Professor", "bibtex": "@inproceedings{\nji2024language,\ntitle={Language Model Decoding as Direct Metrics Optimization},\nauthor={Haozhe Ji and Pei Ke and Hongning Wang and Minlie Huang},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=488A64eOf6}\n}", "github": "", "project": "", "reviewers": "iYh2;3A4S;MQ6q;aJdn", "pdf_size": 1549612, "rating": "5;6;6;8", "confidence": "3;4;3;3", "soundness": "3;3;3;4", "contribution": "2;3;3;3", "presentation": "3;3;3;4", "wc_summary": "59;110;51;93", "wc_strengths": "51;43;81;33", "wc_weaknesses": "91;180;113;24", "wc_questions": "5;168;2;42", "wc_review": "206;501;247;192", "wc_reply_reviewers": "309;14;0;99", "wc_reply_authors": "2232;1968;790;374", "reply_reviewers": "2;1;0;2", "reply_authors": "4;4;2;2", "rating_avg": [ 6.25, 1.0897247358851685 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], 
"contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 78.25, 24.180312239505923 ], "wc_strengths_avg": [ 52.0, 17.916472867168917 ], "wc_weaknesses_avg": [ 102.0, 55.70008976653449 ], "wc_questions_avg": [ 54.25, 67.53656417082527 ], "wc_review_avg": [ 286.5, 125.48007810007132 ], "wc_reply_reviewers_avg": [ 105.5, 123.44735720135931 ], "wc_reply_authors_avg": [ 1341.0, 778.73294523861 ], "reply_reviewers_avg": [ 1.25, 0.82915619758885 ], "reply_authors_avg": [ 3.0, 1.0 ], "replies_avg": [ 25, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.13245323570650439, "gs_citation": 7, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=4952793167999616763&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=488A64eOf6", "pdf": "https://openreview.net/pdf?id=488A64eOf6", "email": "tsinghua.edu.cn;tsinghua.edu.cn;tsinghua.edu.cn;tsinghua.edu.cn", "author_num": 4, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "Tsinghua University", "aff_unique_dep": "", "aff_unique_url": "https://www.tsinghua.edu.cn", "aff_unique_abbr": "THU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "China" }, { "id": "48Abxtv9Mi", "title": "Missing Data Imputation for Large-Scale Longitudinal Physical Activity Data", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Missing data is ubiquitous in wearable device data, which stems from the combination of user errors and hardware issues, hindering researchers who seek to monitor users' physical activities to understand health related behaviors and perform appropriate interventions. All of Us dataset collects one of the largest longitudinal physical activity data in the world. However, due to the remarkable variability of missingness patterns, only few works leverage it, which loses the extremely valuable potential to deliver vital transformative health impacts. In this work, we consider the problem of imputing missing step counts in the large-scale longitudinal physical activity data. Thus, we explore the All of Us dataset and extract a novel cohort of 100 qualified participants with more than 3 million step count instances from it. To address the issue of missingness, we introduce a sparse self-attention model which captures both absolute and relative time information within the local context window around the missing hourly block. Our results show (1) the curated cohort is subject to the variability of both activity and missingness patterns which is challenging to model, (2) our model outperforms a carefully-crafted set of baseline methods with the statistical significance, solidifying its position as a foundation model which could be used in fine-tuning approaches for the downstream tasks. 
Hopefully our filling method can benefit the further research by making such a large scale physical activity dataset easier to use.", "keywords": "missing data;time series;imputation;wearable;physical activity;large-scale;novel cohort;self-attention model;sparse", "primary_area": "applications to physical sciences (physics, chemistry, biology, etc.)", "supplementary_material": "", "author": "Hui Wei;Maxwell Xu;Colin Samplawski;James Matthew Rehg;Santosh Kumar;Benjamin Marlin", "authorids": "~Hui_Wei3;~Maxwell_Xu1;~Colin_Samplawski1;~James_Matthew_Rehg1;~Santosh_Kumar1;~Benjamin_Marlin1", "gender": "M;;;M;M;M", "homepage": "https://wll199566.github.io/davidhuiwei.github.io/;https://maxxu05.github.io/;;http://www.memphis.edu/cs/santosh-kumar/;https://groups.cs.umass.edu/marlin/;http://rehg.org/", "dblp": ";;;;03/7058.html;r/JMRehg", "google_scholar": ";https://scholar.google.com/citations?view_op=list_works;6ufrjW4AAAAJ;f0i_WNoAAAAJ;ey960FIAAAAJ;https://scholar.google.com.tw/citations?user=8kA3eDwAAAAJ", "orcid": ";;;0000-0002-9273-0291;0000-0002-2626-3410;0000-0003-1793-5462", "linkedin": ";;;santoshkumar4/;;", "or_profile": "~Hui_Wei3;~Maxwell_Xu1;~Colin_Samplawski1;~Santosh_Kumar1;~Benjamin_Marlin1;~James_Rehg1", "aff": "University of Massachusetts Amherst;University of Illinois, Urbana Champaign;Department of Computer Science, University of Massachusetts at Amherst;University of Memphis;University of Massachusetts at Amherst;University of Illinois, Urbana Champaign", "aff_domain": "cs.umass.edu;illinois.edu;cs.umass.edu;memphis.edu;umass.edu;illinois.edu", "position": "Researcher;PhD student;PhD student;Full Professor;Associate Professor;Full Professor", "bibtex": "@misc{\nwei2024missing,\ntitle={Missing Data Imputation for Large-Scale Longitudinal Physical Activity Data},\nauthor={Hui Wei and Maxwell Xu and Colin Samplawski and James Matthew Rehg and Santosh Kumar and Benjamin Marlin},\nyear={2024},\nurl={https://openreview.net/forum?id=48Abxtv9Mi}\n}", "github": "", "project": "", "reviewers": "", "site": "https://openreview.net/forum?id=48Abxtv9Mi", "pdf_size": 0, "rating": "", "confidence": "", "soundness": "", "contribution": "", "presentation": "", "wc_summary": "", "wc_strengths": "", "wc_weaknesses": "", "wc_questions": "", "wc_review": "", "wc_reply_reviewers": "", "wc_reply_authors": "", "reply_reviewers": "", "reply_authors": "", "rating_avg": [ 0, 0 ], "confidence_avg": [ 0, 0 ], "soundness_avg": [ 0, 0 ], "contribution_avg": [ 0, 0 ], "presentation_avg": [ 0, 0 ], "wc_summary_avg": [ 0, 0 ], "wc_strengths_avg": [ 0, 0 ], "wc_weaknesses_avg": [ 0, 0 ], "wc_questions_avg": [ 0, 0 ], "wc_review_avg": [ 0, 0 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 0, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:eGSw128SH30J:scholar.google.com/&scioq=Missing+Data+Imputation+for+Large-Scale+Longitudinal+Physical+Activity+Data&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1;0;2;0;1", "aff_unique_norm": "University of Massachusetts Amherst;University of Illinois Urbana-Champaign;University of Memphis", "aff_unique_dep": ";;", "aff_unique_url": "https://www.umass.edu;https://illinois.edu;https://www.memphis.edu", "aff_unique_abbr": "UMass Amherst;UIUC;UM", "aff_campus_unique_index": "0;1;0;0;1", "aff_campus_unique": "Amherst;Urbana-Champaign;", "aff_country_unique_index": 
"0;0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "48CXLrx7K3", "title": "Revealing Unintentional Information Leakage in Low-Dimensional Facial Portrait Representations", "track": "main", "status": "Reject", "tldr": "", "abstract": "We evaluate the information that can unintentionally leak into the low dimensional output of a neural network, by reconstructing an input image from a 40- or 32-element feature vector that intends to only describe abstract attributes of a facial portrait. The reconstruction uses blackbox-access to the image encoder which generates the feature vector. Other than previous work, we leverage recent knowledge about image generation and facial similarity, implementing a method that outperforms the current state-of-the-art. Our strategy uses a pretrained StyleGAN and a new loss function that compares the perceptual similarity of portraits by mapping them into the latent space of a FaceNet embedding. Additionally, we present a new technique that fuses the output of an ensemble, to deliberately generate specific aspects of the recreated image.", "keywords": "feature vector reconstruction;face recognition;privacy", "primary_area": "visualization or interpretation of learned representations", "supplementary_material": "", "author": "Kathleen Anderson;Thomas Martinetz", "authorids": "~Kathleen_Anderson1;~Thomas_Martinetz1", "gender": ";M", "homepage": "https://www.inb.uni-luebeck.de/en/staff/staff-list/wissenschaftliche-mitarbeiter/kathleen-anderson.html;https://www.inb.uni-luebeck.de/mitarbeiter/mitarbeiter/professoren/thomas-martinetz", "dblp": ";", "google_scholar": ";https://scholar.google.de/citations?user=0-tDtUIAAAAJ", "orcid": ";", "linkedin": ";thomas-martinetz-10573a6/", "or_profile": "~Kathleen_Anderson1;~Thomas_Martinetz1", "aff": "Universit\u00e4t zu L\u00fcbeck;Universit\u00e4t zu L\u00fcbeck", "aff_domain": "uni-luebeck.de;uni-luebeck.de", "position": "PhD student;Full Professor", "bibtex": "@misc{\nanderson2024revealing,\ntitle={Revealing Unintentional Information Leakage in Low-Dimensional Facial Portrait Representations},\nauthor={Kathleen Anderson and Thomas Martinetz},\nyear={2024},\nurl={https://openreview.net/forum?id=48CXLrx7K3}\n}", "github": "", "project": "", "reviewers": "nZtS;5Uwq;3kp1", "site": "https://openreview.net/forum?id=48CXLrx7K3", "pdf_size": 47938970, "rating": "3;5;8", "confidence": "3;4;4", "soundness": "1;2;2", "contribution": "3;2;2", "presentation": "2;2;2", "wc_summary": "107;94;41", "wc_strengths": "49;243;31", "wc_weaknesses": "312;305;67", "wc_questions": "39;56;195", "wc_review": "507;698;334", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "343;689;65", "reply_reviewers": "0;0;0", "reply_authors": "1;1;1", "rating_avg": [ 5.333333333333333, 2.0548046676563256 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 1.6666666666666667, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.0, 0.0 ], "wc_summary_avg": [ 80.66666666666667, 28.546258754675524 ], "wc_strengths_avg": [ 107.66666666666667, 95.97684906036223 ], "wc_weaknesses_avg": [ 228.0, 113.88005385784933 ], "wc_questions_avg": [ 96.66666666666667, 69.87767088912516 ], "wc_review_avg": [ 513.0, 148.66292969892214 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 365.6666666666667, 255.2506393505977 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 8, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 
0.8029550685469661, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:ckxSbqTKJNAJ:scholar.google.com/&scioq=Revealing+Unintentional+Information+Leakage+in+Low-Dimensional+Facial+Portrait+Representations&hl=en&as_sdt=0,5", "gs_version_total": 5, "aff_unique_index": "0;0", "aff_unique_norm": "University of L\u00fcbeck", "aff_unique_dep": "", "aff_unique_url": "https://www.uni-luebeck.de", "aff_unique_abbr": "UzL", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "Germany" }, { "id": "49CGs58v0J", "title": "Elevating Augmentation: Boosting Performance via Sub-Model Training", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Image classification has improved with the development of training techniques. However, these techniques often require careful parameter tuning to balance the strength of regularization, limiting their potential benefits. In this paper, we propose a novel way to use regularization called Augmenting Sub-model (AugSub). AugSub consists of two models: the main model and the sub-model. While the main model employs conventional training recipes, the sub-model leverages the benefit of additional regularization. AugSub achieves this by mitigating adverse effects through a relaxed loss function similar to self-distillation loss. We demonstrate the effectiveness of AugSub with three drop techniques: dropout, drop-path, and random masking. Our analysis shows that all AugSub improves performance, with the training loss converging even faster than regular training. Among the three, AugMask is identified as the most practical method due to its performance and cost efficiency. We further validate AugMask across diverse training recipes, including DeiT-III, ResNet, MAE fine-tuning, and Swin Transformer. The results show that AugMask consistently provides significant performance gain. AugSub provides a practical and effective solution for introducing additional regularization under various training recipes. 
The code will be publicly available.", "keywords": "Training recipe;drop regularization;random masking;self-distillation;supervised learning", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Byeongho Heo;Taekyung Kim;Sangdoo Yun;Dongyoon Han", "authorids": "~Byeongho_Heo1;~Taekyung_Kim4;~Sangdoo_Yun1;~Dongyoon_Han1", "gender": "M;Not Specified;M;M", "homepage": "https://sites.google.com/view/byeongho-heo/home;;https://sangdooyun.github.io/;https://dongyoonhan.github.io/", "dblp": "142/2705;58/1619-2;124/3009.html;151/8876", "google_scholar": "https://scholar.google.co.kr/citations?user=4_7rLDIAAAAJ;https://scholar.google.co.kr/citations?user=u-9bdkwAAAAJ;o0qtjzYAAAAJ;jcP7m1QAAAAJ", "orcid": ";;;0000-0002-9130-8195", "linkedin": "byeongho-heo-1a7756122/;taekyung-kim-76b074335/;;https://linkedin.com/in/dongyoon-han-04961a120/en", "or_profile": "~Byeongho_Heo1;~Taekyung_Kim4;~Sangdoo_Yun1;~Dongyoon_Han1", "aff": "NAVER AI Lab;NAVER AI Lab;NAVER;NAVER", "aff_domain": "navercorp.com;navercorp.com;navercorp.com;navercorp.com", "position": "Researcher;Research Scientist;Research Scientist;Research Scientist", "bibtex": "@misc{\nheo2024elevating,\ntitle={Elevating Augmentation: Boosting Performance via Sub-Model Training},\nauthor={Byeongho Heo and Taekyung Kim and Sangdoo Yun and Dongyoon Han},\nyear={2024},\nurl={https://openreview.net/forum?id=49CGs58v0J}\n}", "github": "", "project": "", "reviewers": "AdC8;FBYo;ZArF", "site": "https://openreview.net/forum?id=49CGs58v0J", "pdf_size": 564681, "rating": "3;5;6", "confidence": "4;4;4", "soundness": "2;2;3", "contribution": "2;2;2", "presentation": "2;3;3", "wc_summary": "63;54;70", "wc_strengths": "23;45;34", "wc_weaknesses": "214;156;128", "wc_questions": "35;5;2", "wc_review": "335;260;234", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 4.666666666666667, 1.247219128924647 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 62.333333333333336, 6.548960901462833 ], "wc_strengths_avg": [ 34.0, 8.981462390204987 ], "wc_weaknesses_avg": [ 166.0, 35.81433604950212 ], "wc_questions_avg": [ 14.0, 14.89966442575134 ], "wc_review_avg": [ 276.3333333333333, 42.82003684673281 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:1DQcn9Zlf_gJ:scholar.google.com/&scioq=Elevating+Augmentation:+Boosting+Performance+via+Sub-Model+Training&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "NAVER Corporation", "aff_unique_dep": "NAVER AI Lab", "aff_unique_url": "https://www.naver.com", "aff_unique_abbr": "NAVER", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "South Korea" }, { "id": "49N0ivEQHY", "title": "Towards Better Orthogonality Regularization with Disentangled Norm in Training Deep CNNs", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "In addressing feature redundancy and training instability in CNNs, orthogonality regularization has emerged as a 
promising approach. \nSpecifically, a variant termed kernel orthogonality regularization \nseeks to optimize models by minimizing the residual between kernel functions of convolutional filters and the identity matrix.\n\nContrary to methods that measure the kernel residual as a holistic entity, \nour approach introduces a tailored measure that disentangles diagonal and correlation components from the kernel matrix, \nthereby mitigating their mutual interference during training.\nModels equipped with this strict kernel orthogonality measure outperform existing methods in near-orthogonality. \nNotably, we observe test accuracy improvements for shallow architectures.\nHowever, as model depth increases, the efficacy of our strict kernel orthogonality approach diminishes.\n\nGiven the challenges of strict kernel orthogonality in deeper models and the inherent non-compliance of specific convolutional layers with the kernel orthogonality definition, we introduce the concept of a relaxation theory, wherein strict orthogonality is a special case. \nBy adopting this relaxed kernel orthogonality regularization, we observe enhanced model performance in deeper architectures, \nsuggesting it as a robust alternative to the strict counterpart.\n\nTo validate our approach's efficacy in achieving near-orthogonality and enhancing model performance, we conduct rigorous experiments with our kernel orthogonality regularization toolkit on ResNet and WideResNet in CIFAR-10 and CIFAR-100 datasets. \nWe observe state-of-the-art gains in model performance from the toolkit and obtain more robust models with expressive features. \nThese experiments demonstrate the efficacy of our toolkit while highlighting the often overlooked challenges in orthogonality regularization.", "keywords": "Orthogonality Regularization;Disentangled Norm", "primary_area": "metric learning, kernel learning, and sparse coding", "supplementary_material": "", "author": "Changhao Wu;zhang shenan;Fangsong Long;Ziliang Yin;Tuo Leng", "authorids": "~Changhao_Wu1;~zhang_shenan1;~Fangsong_Long1;~Ziliang_Yin1;~Tuo_Leng1", "gender": ";M;M;;M", "homepage": "https://changhaowu.github.io;https://github.com/Andrewmatilde;https://longfangsong.github.io/en/;https://github.com/crazcell;https://euclidesprobationem.github.io/index.html", "dblp": ";;;;", "google_scholar": ";;;;https://scholar.google.com/citations?hl=zh-CN", "orcid": ";;;;", "linkedin": ";;;;", "or_profile": "~Changhao_Wu1;~zhang_shenan1;~Fangsong_Long1;~Ziliang_Yin1;~Tuo_Leng1", "aff": ";;;;Shanghai University", "aff_domain": ";;;;shu.edu.cn", "position": ";;;;Associate Professor", "bibtex": "@misc{\nwu2024towards,\ntitle={Towards Better Orthogonality Regularization with Disentangled Norm in Training Deep {CNN}s},\nauthor={Changhao Wu and zhang shenan and Fangsong Long and Ziliang Yin and Tuo Leng},\nyear={2024},\nurl={https://openreview.net/forum?id=49N0ivEQHY}\n}", "github": "", "project": "", "reviewers": "RR7G;ok4a;M627", "site": "https://openreview.net/forum?id=49N0ivEQHY", "pdf_size": 396195, "rating": "3;3;5", "confidence": "4;4;4", "soundness": "3;1;2", "contribution": "2;1;2", "presentation": "3;1;1", "wc_summary": "61;339;129", "wc_strengths": "31;44;88", "wc_weaknesses": "94;1080;105", "wc_questions": "2;86;1", "wc_review": "188;1549;323", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "446;699;528", "reply_reviewers": "0;0;0", "reply_authors": "2;3;2", "rating_avg": [ 3.6666666666666665, 0.9428090415820634 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.0, 
0.816496580927726 ], "contribution_avg": [ 1.6666666666666667, 0.4714045207910317 ], "presentation_avg": [ 1.6666666666666667, 0.9428090415820634 ], "wc_summary_avg": [ 176.33333333333334, 118.32535184350347 ], "wc_strengths_avg": [ 54.333333333333336, 24.390344173235622 ], "wc_weaknesses_avg": [ 426.3333333333333, 462.233947500854 ], "wc_questions_avg": [ 29.666666666666668, 39.83577398380617 ], "wc_review_avg": [ 686.6666666666666, 612.247408233705 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 557.6666666666666, 105.39555124492789 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 2.3333333333333335, 0.4714045207910317 ], "replies_avg": [ 10, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=9426688353333722453&as_sdt=400005&sciodt=0,14&hl=en", "gs_version_total": 3, "aff_unique_index": "0", "aff_unique_norm": "Shanghai University", "aff_unique_dep": "", "aff_unique_url": "https://www.shu.edu.cn", "aff_unique_abbr": "SHU", "aff_country_unique_index": "0", "aff_country_unique": "China" }, { "id": "49Tn5mfTy5", "title": "Uncertainty Quantification Using a Codebook of Encoders", "track": "main", "status": "Reject", "tldr": "", "abstract": "Many machine learning applications are limited not by the accuracy of current models but by the inability of these models to assign confidence to their predictions \u2013 the models don\u2019t know what they don\u2019t know. Among methods that do provide uncertainty estimates, there remains a tradeoff between reliable yet expensive methods (e.g., deep ensembles) and lightweight alternatives that can be miscalibrated. In this paper, we propose a lightweight uncertainty quantification method with performance comparable to deep ensembles across a range of tasks and metrics. The key idea behind our approach is to revise and augment prior information bottleneck methods with a codebook to obtain a compressed representation of all inputs seen during training. Uncertainty over a new example can then be quantified by its distance from this codebook. The resulting method, the Uncertainty Aware Information Bottleneck (UA-IB), requires only a single forward pass to provide uncertainty estimates. 
Our experiments show that UA-IB can achieve better Out-of-Distribution (OOD) detection and calibration than prior methods, including those based on the standard information bottleneck.", "keywords": "uncertainty quantification;out-of-distribution detection;information theory;information bottleneck;variational information bottleneck;clustering;deterministic uncertainty methods;bregman divergence;rate-distortion theory;compression;quantization", "primary_area": "probabilistic methods (Bayesian methods, variational inference, sampling, UQ, etc.)", "supplementary_material": "/attachment/26d1a3cbace49625185ee1426b424c0d0cceff72.zip", "author": "Ifigeneia Apostolopoulou;Benjamin Eysenbach;Frank Nielsen;Artur Dubrawski", "authorids": "~Ifigeneia_Apostolopoulou1;~Benjamin_Eysenbach1;~Frank_Nielsen1;~Artur_Dubrawski2", "gender": ";M;M;M", "homepage": ";https://ben-eysenbach.github.io/;https://franknielsen.github.io/;https://www.autonlab.org", "dblp": "145/9415.html;192/1863;http://dblp.uni-trier.de/pers/hd/n/Nielsen:Frank;76/48", "google_scholar": "xiJGHuwAAAAJ;DRnOvU8AAAAJ;c-cuO9cAAAAJ;O3gezzcAAAAJ", "orcid": ";0009-0000-7136-6307;0000-0001-5728-0726;0000-0002-2372-0831", "linkedin": ";benjamin-eysenbach-a7235775/;;artur-dubrawski-33a2a87/", "or_profile": "~Ifigeneia_Apostolopoulou1;~Benjamin_Eysenbach1;~Frank_Nielsen1;~Artur_Dubrawski2", "aff": "Carnegie Mellon University;Princeton University;Sony Computer Science Laboratories Inc (Tokyo);Carnegie Mellon University", "aff_domain": "cmu.edu;princeton.edu;sonycsl.co.jp;cmu.edu", "position": "PhD student;Assistant Professor;Fellow;Research Professor", "bibtex": "@misc{\napostolopoulou2024uncertainty,\ntitle={Uncertainty Quantification Using a Codebook of Encoders},\nauthor={Ifigeneia Apostolopoulou and Benjamin Eysenbach and Frank Nielsen and Artur Dubrawski},\nyear={2024},\nurl={https://openreview.net/forum?id=49Tn5mfTy5}\n}", "github": "", "project": "", "reviewers": "rmmd;fXda;nABa;81b3", "site": "https://openreview.net/forum?id=49Tn5mfTy5", "pdf_size": 769799, "rating": "1;5;6;8", "confidence": "5;3;4;3", "soundness": "2;2;3;3", "contribution": "1;2;2;2", "presentation": "2;2;3;3", "wc_summary": "68;71;62;45", "wc_strengths": "43;39;74;141", "wc_weaknesses": "226;46;501;238", "wc_questions": "114;93;192;116", "wc_review": "451;249;829;540", "wc_reply_reviewers": "886;218;317;95", "wc_reply_authors": "1466;1117;1243;630", "reply_reviewers": "2;1;2;1", "reply_authors": "4;3;4;1", "rating_avg": [ 5.0, 2.5495097567963922 ], "confidence_avg": [ 3.75, 0.82915619758885 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 61.5, 10.062305898749054 ], "wc_strengths_avg": [ 74.25, 40.84957160118084 ], "wc_weaknesses_avg": [ 252.75, 162.25500762688344 ], "wc_questions_avg": [ 128.75, 37.6123317543595 ], "wc_review_avg": [ 517.25, 208.59814836186825 ], "wc_reply_reviewers_avg": [ 379.0, 303.096519280575 ], "wc_reply_authors_avg": [ 1114.0, 306.1086408450438 ], "reply_reviewers_avg": [ 1.5, 0.5 ], "reply_authors_avg": [ 3.0, 1.224744871391589 ], "replies_avg": [ 24, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.8278373543847156, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:FgwwTZyP_8UJ:scholar.google.com/&scioq=Uncertainty+Quantification+Using+a+Codebook+of+Encoders&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1;2;0", "aff_unique_norm": "Carnegie Mellon University;Princeton University;Sony Computer 
Science Laboratories Inc", "aff_unique_dep": ";;", "aff_unique_url": "https://www.cmu.edu;https://www.princeton.edu;https://www.sony.net/", "aff_unique_abbr": "CMU;Princeton;Sony CSL", "aff_campus_unique_index": "1", "aff_campus_unique": ";Tokyo", "aff_country_unique_index": "0;0;1;0", "aff_country_unique": "United States;Japan" }, { "id": "49ZYkhEGmv", "title": "Scalabale AI Safety via Doubly-Efficient Debate", "track": "main", "status": "Reject", "tldr": "", "abstract": "The emergence of pre-trained AI systems with powerful capabilities across a diverse and ever-increasing set of complex domains has raised a critical challenge for AI safety, as tasks can become too complicated for humans to judge directly. Irving et al. (2018) proposed a debate method in this direction with the goal of pitting the power of such AI models against each other until the problem of identifying (mis)-alignment is broken down into a manageable subtask. While the promise of this approach is clear, the original framework was based on the assumption that the honest strategy is able to simulate deterministic AI systems for an exponential number of steps, limiting its applicability. In this paper, we show how to address these challenges by designing a new set of debate protocols where the honest strategy can always succeed using a simulation of a polynomial number of steps, whilst being able to verify the alignment of stochastic AI systems, even when the dishonest strategy is allowed to use exponentially many simulation steps.", "keywords": "AI Safety;Interactive Proofs;Algorithms and Complexity Theory", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/e78f80ec774ae167a5329191d6cdbd1c4e29aa82.zip", "author": "Jonah Brown-Cohen;Geoffrey Irving;Georgios Piliouras", "authorids": "~Jonah_Brown-Cohen1;~Geoffrey_Irving2;~Georgios_Piliouras1", "gender": "M;M;", "homepage": "https://jonahbc.github.io/;https://naml.us;", "dblp": "157/1513;95/4978;62/1236", "google_scholar": "fRc3A80AAAAJ;TrdtzgwAAAAJ;", "orcid": ";;", "linkedin": ";geoffreyirving;", "or_profile": "~Jonah_Brown-Cohen1;~Geoffrey_Irving2;~Georgios_Piliouras1", "aff": "Google DeepMind;Google DeepMind;Singapore University of Technology and Design", "aff_domain": "deepmind.com;deepmind.com;sutd.edu.sg", "position": "Researcher;Safety Researcher;Associate Professor", "bibtex": "@misc{\nbrown-cohen2024scalabale,\ntitle={Scalabale {AI} Safety via Doubly-Efficient Debate},\nauthor={Jonah Brown-Cohen and Geoffrey Irving and Georgios Piliouras},\nyear={2024},\nurl={https://openreview.net/forum?id=49ZYkhEGmv}\n}", "github": "", "project": "", "reviewers": "a5ph;zvu9;TQe8;5QN9", "site": "https://openreview.net/forum?id=49ZYkhEGmv", "pdf_size": 378790, "rating": "6;6;6;8", "confidence": "2;3;2;2", "soundness": "3;3;3;3", "contribution": "3;3;3;3", "presentation": "3;4;3;3", "wc_summary": "139;154;34;29", "wc_strengths": "122;159;3;60", "wc_weaknesses": "121;130;4;191", "wc_questions": "38;53;90;314", "wc_review": "420;496;131;594", "wc_reply_reviewers": "0;17;0;0", "wc_reply_authors": "226;384;532;574", "reply_reviewers": "0;1;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 6.5, 0.8660254037844386 ], "confidence_avg": [ 2.25, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 89.0, 57.77110004145671 ], "wc_strengths_avg": [ 86.0, 59.56089321022645 ], "wc_weaknesses_avg": [ 111.5, 67.65537672646572 
], "wc_questions_avg": [ 123.75, 111.45935357788507 ], "wc_review_avg": [ 410.25, 172.6215151711976 ], "wc_reply_reviewers_avg": [ 4.25, 7.361215932167728 ], "wc_reply_authors_avg": [ 429.0, 136.81008734738825 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.3333333333333333, "gs_citation": 16, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=17236456443179009770&as_sdt=5,47&sciodt=0,47&hl=en", "gs_version_total": 9, "aff_unique_index": "0;0;1", "aff_unique_norm": "Google;Singapore University of Technology and Design", "aff_unique_dep": "Google DeepMind;", "aff_unique_url": "https://deepmind.com;https://www.sutd.edu.sg", "aff_unique_abbr": "DeepMind;SUTD", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;1", "aff_country_unique": "United Kingdom;Singapore" }, { "title": "LCOT: Linear Circular Optimal Transport", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19477", "id": "49z97Y9lMq", "author_site": "ROCIO DIAZ MARTIN, Ivan Medri, Yikun Bai, Xinran Liu, Kangbai Yan, Gustavo Rohde, Soheil Kolouri", "tldr": "", "abstract": "The optimal transport problem for measures supported on non-Euclidean spaces has recently gained ample interest in diverse applications involving representation learning. In this paper, we focus on circular probability measures, i.e., probability measures supported on the unit circle, and introduce a new computationally efficient metric for these measures, denoted as Linear Circular Optimal Transport (LCOT). The proposed metric comes with an explicit linear embedding that allows one to apply Machine Learning (ML) algorithms to the embedded measures and seamlessly modify the underlying metric for the ML algorithm to LCOT. We show that the proposed metric is rooted in the Circular Optimal Transport (COT) and can be considered the linearization of the COT metric with respect to a fixed reference measure. We provide a theoretical analysis of the proposed metric and derive the computational complexities for pairwise comparison of circular probability measures. 
Lastly, through a set of numerical experiments, we demonstrate the benefits of LCOT in learning representations from circular measures.", "keywords": "Optimal Transport;Circular Measure;Probability Metrics", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/33dbd9b75005fd214a8b1afb996888a6e7fc7377.zip", "author": "Rocio P Diaz Martin;Ivan Vladimir Medri;Yikun Bai;Xinran Liu;Kangbai Yan;Gustavo Rohde;Soheil Kolouri", "authorids": "~Rocio_P_Diaz_Martin1;~Ivan_Vladimir_Medri1;~Yikun_Bai2;~Xinran_Liu2;~Kangbai_Yan1;~Gustavo_Rohde1;~Soheil_Kolouri1", "gender": "M;M;;M;M;M;F", "homepage": ";;;https://www.linkedin.com/in/kangbai-yan-226829169/;https://www.imagedatascience.com/;https://skolouri.github.io/;", "dblp": ";273/3993.html;;;;143/9637;", "google_scholar": "https://scholar.google.com/citations?hl=en;zLm6JOAAAAAJ;ZHz5VScAAAAJ;;;yREBSy0AAAAJ;7RHakmMAAAAJ", "orcid": ";;;;;0000-0001-8495-5362;0000-0002-3732-6296", "linkedin": ";yikun-bai-b70050138/?trk=public_profile_browsemap;xinran-l-5777a0205/;;;skolouri/;", "or_profile": "~Ivan_Vladimir_Medri1;~Yikun_Bai2;~Xinran_Liu2;~Kangbai_Yan1;~Gustavo_Rohde1;~Soheil_Kolouri1;~ROCIO_DIAZ_MARTIN1", "aff": "Tennessee State University;Vanderbilt University;Vanderbilt University;Vanderbilt University;University of Virginia Main Campus;Vanderbilt University;Tufts University", "aff_domain": "tnstate.edu;vanderbilt.edu;vanderbilt.edu;vanderbilt.edu;;vanderbilt.edu;tufts.edu", "position": "Postdoc;Postdoc;PhD student;Undergrad student;;Assistant Professor;Postdoc", "bibtex": "@inproceedings{\nmartin2024lcot,\ntitle={{LCOT}: Linear Circular Optimal Transport},\nauthor={Rocio P Diaz Martin and Ivan Vladimir Medri and Yikun Bai and Xinran Liu and Kangbai Yan and Gustavo Rohde and Soheil Kolouri},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=49z97Y9lMq}\n}", "github": "", "project": "", "reviewers": "8oTS;Hihy;5tYi", "pdf_size": 10743012, "rating": "6;6;6", "confidence": "4;4;3", "soundness": "4;3;2", "contribution": "3;2;2", "presentation": "4;3;2", "wc_summary": "80;188;88", "wc_strengths": "73;65;49", "wc_weaknesses": "132;159;71", "wc_questions": "118;69;44", "wc_review": "403;481;252", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "477;411;543", "reply_reviewers": "0;0;0", "reply_authors": "1;1;1", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 3.0, 0.816496580927726 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 3.0, 0.816496580927726 ], "wc_summary_avg": [ 118.66666666666667, 49.13473539383541 ], "wc_strengths_avg": [ 62.333333333333336, 9.977753031397176 ], "wc_weaknesses_avg": [ 120.66666666666667, 36.80881536926839 ], "wc_questions_avg": [ 77.0, 30.735430152621365 ], "wc_review_avg": [ 378.6666666666667, 95.05904597786694 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 477.0, 53.88877434122992 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 8, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 4, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=18019738448181464318&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=49z97Y9lMq", "pdf": "https://openreview.net/pdf?id=49z97Y9lMq", "email": 
"tnstate.edu;vanderbilt.edu;vanderbilt.edu;vanderbilt.edu;;vanderbilt.edu;tufts.edu", "author_num": 7, "aff_unique_index": "0;1;1;1;2;1;3", "aff_unique_norm": "Tennessee State University;Vanderbilt University;University of Virginia;Tufts University", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.tnstate.edu;https://www.vanderbilt.edu;https://www.virginia.edu;https://www.tufts.edu", "aff_unique_abbr": "TSU;Vanderbilt;UVA;Tufts", "aff_campus_unique_index": "1", "aff_campus_unique": ";Main Campus", "aff_country_unique_index": "0;0;0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "4A5D1nsdtj", "title": "An Effective Universal Polynomial Basis for Spectral Graph Neural Networks", "track": "main", "status": "Reject", "tldr": "", "abstract": "Spectral Graph Neural Networks (GNNs), also referred to as *graph filters* have gained increasing prevalence for heterophily graphs. Optimal graph filters rely on Laplacian eigendecomposition for Fourier transform. In an attempt to avert the prohibitive computations, numerous polynomial filters by leveraging distinct polynomials have been proposed to approximate the desired graph filters. However, polynomials in the majority of polynomial filters are *predefined* and remain *fixed* across all graphs, failing to accommodate the diverse heterophily degrees across different graphs. To tackle this issue, we first investigate the correlation between polynomial bases of desired graph filters and the degrees of graph heterophily via a thorough theoretical analysis. Afterward, we develop an adaptive heterophily basis by incorporating graph heterophily degrees. Subsequently, we integrate this heterophily basis with the homophily basis, creating a universal polynomial basis *UniBasis*. In consequence, we devise a general polynomial filter *UniFilter*. 
Comprehensive experiments on both real-world and synthetic datasets with varying heterophily degrees significantly support the superiority of UniFilter, demonstrating the effectiveness and generality of UniBasis, as well as its promising capability as a new method for graph analysis.", "keywords": "Graph neural networks;Spectral graph filter", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/a4660f5e25d355e4c9c1eda9f45e004275b2a204.zip", "author": "Keke Huang;Pietro Lio", "authorids": "~Keke_Huang1;~Pietro_Lio1", "gender": "M;M", "homepage": "https://sites.google.com/view/kekehuang/;https://www.cst.cam.ac.uk/people/pl219", "dblp": ";l/PietroLio.html", "google_scholar": "https://scholar.google.com.sg/citations?user=OsceCbcAAAAJ;https://scholar.google.co.uk/citations?user=3YrWf7EAAAAJ", "orcid": "0000-0003-2190-7114;0000-0002-0540-5053", "linkedin": "keke-huang-4594b9135/?originalSubdomain=sg;", "or_profile": "~Keke_Huang1;~Pietro_Lio1", "aff": "National University of Singapore;University of Cambridge", "aff_domain": "nus.edu.sg;cam.ac.uk", "position": "Postdoc;Full Professor", "bibtex": "@misc{\nhuang2024an,\ntitle={An Effective Universal Polynomial Basis for Spectral Graph Neural Networks},\nauthor={Keke Huang and Pietro Lio},\nyear={2024},\nurl={https://openreview.net/forum?id=4A5D1nsdtj}\n}", "github": "", "project": "", "reviewers": "bWo5;NCEm;SYRx;vpd8", "site": "https://openreview.net/forum?id=4A5D1nsdtj", "pdf_size": 453004, "rating": "3;3;6;6", "confidence": "5;4;4;2", "soundness": "2;1;3;3", "contribution": "2;2;3;4", "presentation": "2;2;3;3", "wc_summary": "57;137;216;108", "wc_strengths": "40;47;9;80", "wc_weaknesses": "227;143;166;233", "wc_questions": "39;3;82;126", "wc_review": "363;330;473;547", "wc_reply_reviewers": "158;64;0;0", "wc_reply_authors": "1019;1153;1289;2040", "reply_reviewers": "2;1;0;0", "reply_authors": "3;3;3;4", "rating_avg": [ 4.5, 1.5 ], "confidence_avg": [ 3.75, 1.0897247358851685 ], "soundness_avg": [ 2.25, 0.82915619758885 ], "contribution_avg": [ 2.75, 0.82915619758885 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 129.5, 57.56952318718646 ], "wc_strengths_avg": [ 44.0, 25.228951623085727 ], "wc_weaknesses_avg": [ 192.25, 38.674119253061214 ], "wc_questions_avg": [ 62.5, 46.11127844681819 ], "wc_review_avg": [ 428.25, 86.62382755339318 ], "wc_reply_reviewers_avg": [ 55.5, 64.6896436842869 ], "wc_reply_authors_avg": [ 1375.25, 395.4872785564663 ], "reply_reviewers_avg": [ 0.75, 0.82915619758885 ], "reply_authors_avg": [ 3.25, 0.4330127018922193 ], "replies_avg": [ 25, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.6882472016116854, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=18007601608947293203&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "aff_unique_index": "0;1", "aff_unique_norm": "National University of Singapore;University of Cambridge", "aff_unique_dep": ";", "aff_unique_url": "https://www.nus.edu.sg;https://www.cam.ac.uk", "aff_unique_abbr": "NUS;Cambridge", "aff_campus_unique_index": "1", "aff_campus_unique": ";Cambridge", "aff_country_unique_index": "0;1", "aff_country_unique": "Singapore;United Kingdom" }, { "title": "Mixed-Type Tabular Data Synthesis with Score-based Diffusion in Latent Space", "status": "Oral", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19476", "id": "4Ay23yeuz0", "author_site": "Hengrui Zhang, Jiani Zhang, Zhengyuan Shen, Balasubramaniam 
Srinivasan, Xiao Qin, Christos Faloutsos, Huzefa Rangwala, George Karypis", "tldr": "", "abstract": "Recent advances in tabular data generation have greatly enhanced synthetic data quality. However, extending diffusion models to tabular data is challenging due to the intricately varied distributions and a blend of data types of tabular data. This paper introduces TabSyn, a methodology that synthesizes tabular data by leveraging a diffusion model within a variational autoencoder (VAE) crafted latent space. The key advantages of the proposed Tabsyn include (1) Generality: the ability to handle a broad spectrum of data types by converting them into a single unified space and explicitly capturing inter-column relations; (2) Quality: optimizing the distribution of latent embeddings to enhance the subsequent training of diffusion models, which helps generate high-quality synthetic data; (3) Speed: much fewer number of reverse steps and faster synthesis speed than existing diffusion-based methods. Extensive experiments on six datasets with five metrics demonstrate that Tabsyn outperforms existing methods. Specifically, it reduces the error rates by 86% and 67% for column-wise distribution and pair-wise column correlation estimations compared with the most competitive baselines. The code has been made available at https://github.com/amazon-science/tabsyn.", "keywords": "Tabular data;tabular generation;diffusion models", "primary_area": "generative models", "supplementary_material": "", "author": "Hengrui Zhang;Jiani Zhang;Zhengyuan Shen;Balasubramaniam Srinivasan;Xiao Qin;Christos Faloutsos;Huzefa Rangwala;George Karypis", "authorids": "~Hengrui_Zhang1;~Jiani_Zhang2;~Zhengyuan_Shen1;~Balasubramaniam_Srinivasan1;~Xiao_Qin3;~Christos_Faloutsos1;~Huzefa_Rangwala2;~George_Karypis1", "gender": "M;F;M;;M;M;M;M", "homepage": "https://hengruizhang98.github.io;https://jennyzhang0215.github.io/;;;https://web.cs.wpi.edu/~xqin/;https://www.cs.cmu.edu/~christos/;http://www.cs.gmu.edu/~rangwala;", "dblp": ";186/6870;;230/3792;199/4704-3;f/CFaloutsos;30/444;", "google_scholar": "iwffiD0AAAAJ;CBmDAOEAAAAJ;mX2LPRwAAAAJ;uM4EhgEAAAAJ;https://scholar.google.com/citations?hl=en;nd8lQQIAAAAJ;yWJ9BqEAAAAJ;ElqwScwAAAAJ", "orcid": "0009-0006-1330-0899;0000-0003-0074-6761;;;;0000-0003-2996-9790;;", "linkedin": ";;donshen16/;;;christos-faloutsos-43a7aa2/;;", "or_profile": "~Hengrui_Zhang1;~Jiani_Zhang2;~Zhengyuan_Shen1;~Balasubramaniam_Srinivasan1;~Xiao_Qin3;~Christos_Faloutsos1;~Huzefa_Rangwala2;~George_Karypis1", "aff": "University of Illinois, Chicago;AWS;Amazon;Amazon;Amazon;Carnegie Mellon University;Computer Science, George Mason University;University of Minnesota, Minneapolis", "aff_domain": "uic.edu;amazon.com;amazon.com;amazon.com;amazon.com;cmu.edu;cs.gmu.edu;umn.edu", "position": "PhD student;Researcher;Researcher;Senior Applied Scientist;Researcher;Full Professor;Full Professor;Full Professor", "bibtex": "@inproceedings{\nzhang2024mixedtype,\ntitle={Mixed-Type Tabular Data Synthesis with Score-based Diffusion in Latent Space},\nauthor={Hengrui Zhang and Jiani Zhang and Zhengyuan Shen and Balasubramaniam Srinivasan and Xiao Qin and Christos Faloutsos and Huzefa Rangwala and George Karypis},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=4Ay23yeuz0}\n}", "github": "", "project": "", "reviewers": "q7Xg;aVor;dVGm;Fs1y", "pdf_size": 1950574, "rating": "5;6;8;8", "confidence": "3;4;4;3", "soundness": "3;4;3;3", "contribution": 
"3;2;3;4", "presentation": "3;4;4;3", "wc_summary": "41;44;182;99", "wc_strengths": "31;25;92;128", "wc_weaknesses": "69;60;165;284", "wc_questions": "41;73;94;241", "wc_review": "182;202;533;752", "wc_reply_reviewers": "0;17;64;59", "wc_reply_authors": "804;833;1488;1619", "reply_reviewers": "0;1;2;1", "reply_authors": "3;3;2;3", "rating_avg": [ 6.75, 1.299038105676658 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 3.0, 0.7071067811865476 ], "presentation_avg": [ 3.5, 0.5 ], "wc_summary_avg": [ 91.5, 57.124863238348325 ], "wc_strengths_avg": [ 69.0, 42.98255460067491 ], "wc_weaknesses_avg": [ 144.5, 90.44473450676938 ], "wc_questions_avg": [ 112.25, 76.69216061632375 ], "wc_review_avg": [ 417.25, 238.2911821700501 ], "wc_reply_reviewers_avg": [ 35.0, 27.230497608380205 ], "wc_reply_authors_avg": [ 1186.0, 370.54891714859997 ], "reply_reviewers_avg": [ 1.0, 0.7071067811865476 ], "reply_authors_avg": [ 2.75, 0.4330127018922193 ], "replies_avg": [ 21, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": 0.19245008972987526, "gs_citation": 87, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=9946646751213130183&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=4Ay23yeuz0", "pdf": "https://openreview.net/pdf?id=4Ay23yeuz0", "email": "uic.edu;amazon.com;amazon.com;amazon.com;amazon.com;cmu.edu;cs.gmu.edu;umn.edu", "author_num": 8, "aff_unique_index": "0;1;1;1;1;2;3;4", "aff_unique_norm": "University of Illinois at Chicago;Amazon;Carnegie Mellon University;George Mason University;University of Minnesota", "aff_unique_dep": ";Amazon Web Services;;Computer Science;", "aff_unique_url": "https://www.uic.edu;https://aws.amazon.com;https://www.cmu.edu;https://www.gmu.edu;https://www.minnesota.edu", "aff_unique_abbr": "UIC;AWS;CMU;GMU;UMN", "aff_campus_unique_index": "0;2", "aff_campus_unique": "Chicago;;Minneapolis", "aff_country_unique_index": "0;0;0;0;0;0;0;0", "aff_country_unique": "United States" }, { "title": "Chameleon: Increasing Label-Only Membership Leakage with Adaptive Poisoning", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19475", "id": "4DoSULcfG6", "author_site": "Harsh Chaudhari, Giorgio Severi, Alina Oprea, Jonathan Ullman", "tldr": "", "abstract": "The integration of Machine Learning (ML) in numerous critical applications introduces a range of privacy concerns for individuals who provide their datasets for ML training purposes. One such privacy risk is Membership Inference (MI), in which an adversary seeks to determine whether a particular data point was included in the training dataset of a model. Current state-of-the-art MI approaches capitalize on access to the model\u2019s predicted confidence scores to successfully perform membership inference, and employ data poisoning to further enhance their effectiveness. \nIn this work, we focus on the less explored and more realistic label-only setting, where the model provides only the predicted label as output. We show that existing label-only attacks are ineffective at inferring membership in the low False Positive Rate (FPR) regime. 
To address this challenge, we propose a new attack Chameleon that leverages a novel data poisoning strategy and an efficient query selection method to achieve significantly more accurate membership inference than existing label-only attacks, especially for low FPRs.", "keywords": "Privacy Attack;Membership Inference;Data Poisoning", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "Harsh Chaudhari;Giorgio Severi;Alina Oprea;Jonathan Ullman", "authorids": "~Harsh_Chaudhari1;~Giorgio_Severi1;~Alina_Oprea2;~Jonathan_Ullman1", "gender": "M;;M;F", "homepage": ";http://severi.xyz;https://jonathan-ullman.github.io/;http://www.ccs.neu.edu/home/alina/", "dblp": "240/8222.html;221/4233.html;02/8164;35/3425", "google_scholar": "https://scholar.google.co.in/citations?user=w1lHWJ4AAAAJ;ClHeQx0AAAAJ;https://scholar.google.com.tw/citations?user=WfS41RAAAAAJ;https://scholar.google.com.tw/citations?user=16J3izoAAAAJ", "orcid": ";;;0000-0002-4979-5292", "linkedin": ";;;alina-oprea-9588bb1", "or_profile": "~Harsh_Chaudhari1;~Giorgio_Severi1;~Jonathan_Ullman1;~Alina_Oprea1", "aff": "Northeastern University;Northeastern University;Northeastern University;Northeastern University", "aff_domain": "northeastern.edu;northeastern.edu;northeastern.edu;northeastern.edu", "position": "PhD student;PhD student;Associate Professor;Associate Professor", "bibtex": "@inproceedings{\nchaudhari2024chameleon,\ntitle={Chameleon: Increasing Label-Only Membership Leakage with Adaptive Poisoning},\nauthor={Harsh Chaudhari and Giorgio Severi and Alina Oprea and Jonathan Ullman},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=4DoSULcfG6}\n}", "github": "", "project": "", "reviewers": "ECEy;uopX;JKci", "pdf_size": 1013106, "rating": "5;5;6", "confidence": "4;4;4", "soundness": "3;3;2", "contribution": "2;3;3", "presentation": "3;3;3", "wc_summary": "107;107;92", "wc_strengths": "30;68;20", "wc_weaknesses": "381;244;40", "wc_questions": "11;6;263", "wc_review": "529;425;415", "wc_reply_reviewers": "0;0;431", "wc_reply_authors": "646;396;1311", "reply_reviewers": "0;0;2", "reply_authors": "1;1;3", "rating_avg": [ 5.333333333333333, 0.4714045207910317 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 102.0, 7.0710678118654755 ], "wc_strengths_avg": [ 39.333333333333336, 20.677416559027765 ], "wc_weaknesses_avg": [ 221.66666666666666, 140.10551579276083 ], "wc_questions_avg": [ 93.33333333333333, 119.98981438253648 ], "wc_review_avg": [ 456.3333333333333, 51.545018080207214 ], "wc_reply_reviewers_avg": [ 143.66666666666666, 203.17534846093466 ], "wc_reply_authors_avg": [ 784.3333333333334, 386.1418852644136 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.9428090415820634 ], "reply_authors_avg": [ 1.6666666666666667, 0.9428090415820634 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 7, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=4654850171827019168&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=4DoSULcfG6", "pdf": "https://openreview.net/pdf?id=4DoSULcfG6", "email": "northeastern.edu;northeastern.edu;northeastern.edu;northeastern.edu", "author_num": 4, "aff_unique_index": "0;0;0;0", "aff_unique_norm": 
"Northeastern University", "aff_unique_dep": "", "aff_unique_url": "https://www.northeastern.edu", "aff_unique_abbr": "NEU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "id": "4FUa5dxiiA", "title": "Risk-Sensitive Variational Model-Based Policy Optimization", "track": "main", "status": "Reject", "tldr": "", "abstract": "RL-as-inference casts reinforcement learning (RL) as Bayesian inference in a probabilistic graphical model. While this framework allows efficient variational approximations it is known that model-based RL-as-inference learns optimistic dynamics and risk-seeking policies that can exhibit catastrophic behavior. By exploiting connections between the variational objective and a well-known risk-sensitive utility function we adaptively adjust policy risk based on the environment dynamics. Our method, $\\beta$-VMBPO, extends the variational model-based policy optimization (VMBPO) algorithm to perform dual descent on risk parameter $\\beta$. We provide a thorough theoretical analysis that fills gaps in the theory of model-based RL-as-inference by establishing a generalization of policy improvement, value iteration, and guarantees on policy determinism. Our experiments demonstrate that this risk-sensitive approach yields improvements in simple tabular and complex continuous tasks, such as the DeepMind Control Suite.", "keywords": "Reinforcement Learning;Variational Inference;Risk Sensitive RL;Probabilistic Inference", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/24e46d88030e1c2a3bfbbfa03d080eaefe3b39a0.zip", "author": "Alonso Granados;Jason Pacheco;Mohammadreza Ebrahimi", "authorids": "~Alonso_Granados1;~Jason_Pacheco1;~Mohammadreza_Ebrahimi2", "gender": "M;M;M", "homepage": ";http://www.pachecoj.com;https://star-ailab.github.io/", "dblp": "230/2003;126/1745;26/7531", "google_scholar": ";71ZEsnEAAAAJ;4DmURbEAAAAJ", "orcid": ";;0000-0003-1367-3338", "linkedin": ";;", "or_profile": "~Alonso_Granados1;~Jason_Pacheco1;~Mohammadreza_Ebrahimi2", "aff": "University of Arizona;University of Arizona;University of South Florida", "aff_domain": "arizona.edu;arizona.edu;usf.edu", "position": "PhD student;Assistant Professor;Assistant Professor", "bibtex": "@misc{\ngranados2024risksensitive,\ntitle={Risk-Sensitive Variational Model-Based Policy Optimization},\nauthor={Alonso Granados and Jason Pacheco and Mohammadreza Ebrahimi},\nyear={2024},\nurl={https://openreview.net/forum?id=4FUa5dxiiA}\n}", "github": "", "project": "", "reviewers": "wKFu;dkQy;9Tpq", "site": "https://openreview.net/forum?id=4FUa5dxiiA", "pdf_size": 1192745, "rating": "3;6;6", "confidence": "4;3;3", "soundness": "2;3;3", "contribution": "2;3;3", "presentation": "3;4;3", "wc_summary": "197;200;97", "wc_strengths": "56;83;28", "wc_weaknesses": "531;607;89", "wc_questions": "88;35;194", "wc_review": "872;925;408", "wc_reply_reviewers": "970;152;114", "wc_reply_authors": "708;390;404", "reply_reviewers": "2;1;1", "reply_authors": "2;2;1", "rating_avg": [ 5.0, 1.4142135623730951 ], "confidence_avg": [ 3.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 3.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 164.66666666666666, 47.86323107447813 ], "wc_strengths_avg": [ 55.666666666666664, 22.45489305746572 ], "wc_weaknesses_avg": [ 409.0, 228.39147678200837 ], 
"wc_questions_avg": [ 105.66666666666667, 66.1026138330063 ], "wc_review_avg": [ 735.0, 232.23407731568307 ], "wc_reply_reviewers_avg": [ 412.0, 394.87044288812837 ], "wc_reply_authors_avg": [ 500.6666666666667, 146.71817277427573 ], "reply_reviewers_avg": [ 1.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 1.6666666666666667, 0.4714045207910317 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -1.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:xRayuBBRm3sJ:scholar.google.com/&scioq=Risk-Sensitive+Variational+Model-Based+Policy+Optimization&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;1", "aff_unique_norm": "University of Arizona;University of South Florida", "aff_unique_dep": ";", "aff_unique_url": "https://www.arizona.edu;https://www.usf.edu", "aff_unique_abbr": "UA;USF", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "4GfEOQlBoc", "title": "Disentangling the Link Between Image Statistics and Human Perception", "track": "main", "status": "Reject", "tldr": "", "abstract": "In the 1950s, Barlow and Attneave hypothesised a link between biological vision and information maximisation. Following Shannon, information was defined using the probability of natural images. A number of physiological and psychophysical phenomena have been derived ever since from principles like info-max, efficient coding, or optimal denoising. However, it remains unclear how this link is expressed in mathematical terms from image probability. First, classical derivations were subjected to strong assumptions on the probability models and on the behaviour of the sensors. Moreover, the direct evaluation of the hypothesis was limited by the inability of the classical image models to deliver accurate estimates of the probability. In this work we directly evaluate image probabilities using an advanced generative model for natural images, and we analyse how probability-related factors can be combined to predict human perception via sensitivity of state-of-the-art subjective image quality metrics. We use information theory and regression analysis to find a combination of just two probability-related factors that achieves 0.8 correlation with subjective metrics. 
This probability-based sensitivity is psychophysically validated by reproducing the basic trends of the Contrast Sensitivity Function, its suprathreshold variation, and trends of the Weber-law and masking.", "keywords": "perception;vision science;probability", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/d6bfbb96859a9b4cb9c3a1b8396b2c59a62c79bf.pdf", "author": "Alexander Hepburn;Valero Laparra;Raul Santos-Rodriguez;Jesus Malo", "authorids": "~Alexander_Hepburn2;~Valero_Laparra1;~Raul_Santos-Rodriguez1;~Jesus_Malo1", "gender": "M;;;M", "homepage": ";https://www.uv.es/lapeva/;https://www.bristol.ac.uk/people/person/Raul-Santos-Rodriguez-1d708791-ea39-4078-89e6-c5c81b8c1a22/;http://isp.uv.es/excathedra.html", "dblp": ";;24/7253;31/4807", "google_scholar": "CzZTCN4AAAAJ;dNt_xikAAAAJ;U_ldrLcAAAAJ;https://scholar.google.es/citations?user=0pgrklEAAAAJ", "orcid": ";;0000-0001-9576-3905;0000-0002-5684-8591", "linkedin": ";;;", "or_profile": "~Alexander_Hepburn2;~Valero_Laparra1;~Raul_Santos-Rodriguez1;~Jesus_Malo1", "aff": "University of Bristol;Universitat de Val\u00e8ncia;University of Bristol;Universitat de Valencia", "aff_domain": "bristol.ac.uk;uv.es;bristol.ac.uk;uv.es", "position": "Postdoc;Postdoc;Full Professor;Full Professor", "bibtex": "@misc{\nhepburn2024disentangling,\ntitle={Disentangling the Link Between Image Statistics and Human Perception},\nauthor={Alexander Hepburn and Valero Laparra and Raul Santos-Rodriguez and Jesus Malo},\nyear={2024},\nurl={https://openreview.net/forum?id=4GfEOQlBoc}\n}", "github": "", "project": "", "reviewers": "Cqjc;6JJg;RwsQ;Y3LV", "site": "https://openreview.net/forum?id=4GfEOQlBoc", "pdf_size": 599460, "rating": "5;5;5;6", "confidence": "5;4;4;3", "soundness": "2;2;2;3", "contribution": "2;3;2;3", "presentation": "3;2;2;3", "wc_summary": "20;55;72;87", "wc_strengths": "23;53;33;16", "wc_weaknesses": "194;280;471;1", "wc_questions": "11;217;2;146", "wc_review": "248;605;578;250", "wc_reply_reviewers": "0;82;0;29", "wc_reply_authors": "990;687;1253;135", "reply_reviewers": "0;1;0;2", "reply_authors": "2;2;2;1", "rating_avg": [ 5.25, 0.4330127018922193 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 58.5, 24.944939366532843 ], "wc_strengths_avg": [ 31.25, 13.935117509371782 ], "wc_weaknesses_avg": [ 236.5, 168.92971911419258 ], "wc_questions_avg": [ 94.0, 91.08512502049936 ], "wc_review_avg": [ 420.25, 171.51730962209032 ], "wc_reply_reviewers_avg": [ 27.75, 33.48413803579241 ], "wc_reply_authors_avg": [ 766.25, 415.85657082701005 ], "reply_reviewers_avg": [ 0.75, 0.82915619758885 ], "reply_authors_avg": [ 1.75, 0.4330127018922193 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.816496580927726, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=17297146322820130188&as_sdt=400005&sciodt=0,14&hl=en", "gs_version_total": 8, "aff_unique_index": "0;1;0;2", "aff_unique_norm": "University of Bristol;Universitat de Val\u00e8ncia;University of Valencia", "aff_unique_dep": ";;", "aff_unique_url": "https://www.bristol.ac.uk;https://www.uv.es;https://www.uv.es", "aff_unique_abbr": "Bristol;UV;UV", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;0;1", "aff_country_unique": "United Kingdom;Spain" }, { "id": "4Hf5pbk74h", "title": 
"Improving classifier decision boundaries using nearest neighbors", "track": "main", "status": "Reject", "tldr": "", "abstract": "In this paper, we show that neural networks are not learning optimal decision boundaries. Decision boundaries go through areas of low training data density. They are impacted by few training samples which can easily lead to overfitting. We show that performing a weighted average of the prediction of a sample and its nearest neighbors' (computed in latent space) leads to a variety of minor favorable outcomes. In our evaluation, we employ various self-trained and pre-trained convolutional neural networks to show that our approach improves (i) resistance to label noise, (ii) robustness against adversarial attacks, (iii) classification accuracy, and to some degree even (iv) interpretability. While improvements are not necessarily large in all four areas, our approach is conceptually simple, i.e., improvements come without any modification to network architecture, training procedure or dataset. Furthermore, they are in stark contrast to prior works that often require trade-offs among the four objectives or provides only non-actionable insights.", "keywords": "decision boundary;computer vision;CNN;kNN", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/cb301cd78d038d8bfd16492018cc1be5ece42e0c.zip", "author": "Johannes Schneider", "authorids": "~Johannes_Schneider2", "gender": "", "homepage": "", "dblp": "31/4013-2", "google_scholar": "hgXFYMUAAAAJ", "orcid": "", "linkedin": "", "or_profile": "~Johannes_Schneider2", "aff": "Universit\u00e4t Liechtenstein", "aff_domain": "uni.li", "position": "Associate Professor", "bibtex": "@misc{\nschneider2024improving,\ntitle={Improving classifier decision boundaries using nearest neighbors},\nauthor={Johannes Schneider},\nyear={2024},\nurl={https://openreview.net/forum?id=4Hf5pbk74h}\n}", "github": "", "project": "", "reviewers": "RTTt;H15T;N6Bu", "site": "https://openreview.net/forum?id=4Hf5pbk74h", "pdf_size": 722593, "rating": "1;3;3", "confidence": "4;4;4", "soundness": "2;2;2", "contribution": "1;2;2", "presentation": "1;2;2", "wc_summary": "33;52;136", "wc_strengths": "37;33;109", "wc_weaknesses": "287;1270;111", "wc_questions": "31;7;671", "wc_review": "388;1362;1027", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "313;22;22", "reply_reviewers": "0;0;0", "reply_authors": "1;1;1", "rating_avg": [ 2.3333333333333335, 0.9428090415820634 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 1.6666666666666667, 0.4714045207910317 ], "presentation_avg": [ 1.6666666666666667, 0.4714045207910317 ], "wc_summary_avg": [ 73.66666666666667, 44.75364665464579 ], "wc_strengths_avg": [ 59.666666666666664, 34.92213560989012 ], "wc_weaknesses_avg": [ 556.0, 509.9614364505091 ], "wc_questions_avg": [ 236.33333333333334, 307.51187872268537 ], "wc_review_avg": [ 925.6666666666666, 404.03822701433694 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 119.0, 137.17871555019022 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 8, 0 ], "authors#_avg": [ 1, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:zLNUHp3DI7oJ:scholar.google.com/&scioq=Improving+classifier+decision+boundaries+using+nearest+neighbors&hl=en&as_sdt=0,33", "gs_version_total": 3, "aff_unique_index": "0", "aff_unique_norm": 
"Universit\u00e4t Liechtenstein", "aff_unique_dep": "", "aff_unique_url": "https://www.unili.ch", "aff_unique_abbr": "Uni Li", "aff_country_unique_index": "0", "aff_country_unique": "Liechtenstein" }, { "id": "4Hv5DLTJLF", "title": "Consensus Optimization at Representation: Improving Personalized Federated Learning via Data-Centric Regularization", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Federated learning is a large scale machine learning training paradigm where data is distributed across clients, and can be highly heterogeneous from one client to another. To ensure personalization in client models, and at the same time to ensure that the local models have enough commonality (i.e., prevent ``client-drift''), it has been recently proposed to cast the federated learning problem as a consensus optimization problem, where local models are trained on local data, but are forced to be similar via a regularization term. In this paper we propose an improved federated learning algorithm, where we ensure consensus optimization at the representation part of each local client, and not on whole local models. This algorithm naturally takes into account that today's deep networks are often partitioned into a feature extraction part (representation) and a prediction part. Our algorithm ensures greater flexibility compared to previous works on exact shared representation in highly heterogeneous settings, as it has been seen that the representation part can differ substantially with data distribution. Our method is quite stable to noise, and can be made differentially private with strong privacy guarantee without much loss of accuracy. We provide a complete convergence analysis of our algorithm under general nonconvex loss functions, and validate its good performance experimentally in standard datasets.", "keywords": "Personalized federated learning;Consensus optimization;Representation learning;Variance reduction", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/d4f6b12bb772b062a6a40c7698cec4367fef0c88.pdf", "author": "Heng Zhu;Arya Mazumdar", "authorids": "~Heng_Zhu1;~Arya_Mazumdar1", "gender": "M;M", "homepage": ";http://www.cs.umass.edu/~arya", "dblp": "01/7106;77/6050", "google_scholar": ";https://scholar.google.com.tw/citations?user=9tjQU1EAAAAJ", "orcid": "0000-0002-0230-672X;", "linkedin": ";", "or_profile": "~Heng_Zhu1;~Arya_Mazumdar1", "aff": "University of California, San Diego;University of California, San Diego", "aff_domain": "ucsd.edu;ucsd.edu", "position": "PhD student;Associate Professor", "bibtex": "@misc{\nzhu2024consensus,\ntitle={Consensus Optimization at Representation: Improving Personalized Federated Learning via Data-Centric Regularization},\nauthor={Heng Zhu and Arya Mazumdar},\nyear={2024},\nurl={https://openreview.net/forum?id=4Hv5DLTJLF}\n}", "github": "", "project": "", "reviewers": "QkUY;EJeM;qMXj;R9Ht", "site": "https://openreview.net/forum?id=4Hv5DLTJLF", "pdf_size": 470136, "rating": "3;3;5;5", "confidence": "4;4;3;3", "soundness": "2;2;4;3", "contribution": "2;2;2;3", "presentation": "2;3;3;3", "wc_summary": "45;84;94;35", "wc_strengths": "22;44;50;25", "wc_weaknesses": "348;634;142;76", "wc_questions": "553;100;389;63", "wc_review": "968;862;675;199", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 
2.75, 0.82915619758885 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 64.5, 25.004999500099974 ], "wc_strengths_avg": [ 35.25, 11.986972094736853 ], "wc_weaknesses_avg": [ 300.0, 217.3706511928416 ], "wc_questions_avg": [ 276.25, 203.61897627677044 ], "wc_review_avg": [ 676.0, 294.6989989803155 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -1.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:Z2icTKDWILkJ:scholar.google.com/&scioq=Consensus+Optimization+at+Representation:+Improving+Personalized+Federated+Learning+via+Data-Centric+Regularization&hl=en&as_sdt=0,5", "gs_version_total": 2, "aff_unique_index": "0;0", "aff_unique_norm": "University of California, San Diego", "aff_unique_dep": "", "aff_unique_url": "https://www.ucsd.edu", "aff_unique_abbr": "UCSD", "aff_campus_unique_index": "0;0", "aff_campus_unique": "San Diego", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "title": "One For All: Towards Training One Graph Model For All Classification Tasks", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19474", "id": "4IT2pgc9v6", "author_site": "Hao Liu, Jiarui Feng, Lecheng Kong, Ningyue Liang, Dacheng Tao, Yixin Chen, Muhan Zhang", "tldr": "", "abstract": "Designing a single model to address multiple tasks has been a long-standing objective in artificial intelligence. Recently, large language models have demonstrated exceptional capability in solving different tasks within the language domain. However, a unified model for various graph tasks remains underexplored, primarily due to the challenges unique to the graph learning domain. First, graph data from different areas carry distinct attributes and follow different distributions. Such discrepancy makes it hard to represent graphs in a single representation space. Second, tasks on graphs diversify into node, link, and graph tasks, requiring distinct embedding strategies. Finally, an appropriate graph prompting paradigm for in-context learning is unclear. We propose **One for All (OFA)**, the first general framework that can use a single graph model to address the above challenges. Specifically, OFA proposes text-attributed graphs to unify different graph data by describing nodes and edges with natural language and uses language models to encode the diverse and possibly cross-domain text attributes to feature vectors in the same embedding space. Furthermore, OFA introduces the concept of nodes-of-interest to standardize different tasks with a single task representation. For in-context learning on graphs, OFA introduces a novel graph prompting paradigm that appends prompting substructures to the input graph, which enables it to address varied tasks without fine-tuning. We train the OFA model using graph data from multiple domains (including citation networks, molecular graphs, knowledge graphs, etc.) simultaneously and evaluate its ability in supervised, few-shot, and zero-shot learning scenarios. 
OFA performs well across different tasks, making it the first general-purpose across-domains classification model on graphs.", "keywords": "Graph Neural Network;Large Language Model;In-context Learning", "primary_area": "learning on graphs and other geometries & topologies", "supplementary_material": "/attachment/30bf1403d2e456553faf2a34a7acf3f0b2f125c4.zip", "author": "Hao Liu;Jiarui Feng;Lecheng Kong;Ningyue Liang;Dacheng Tao;Yixin Chen;Muhan Zhang", "authorids": "~Hao_Liu25;~Jiarui_Feng1;~Lecheng_Kong1;~Ningyue_Liang1;~Dacheng_Tao1;~Yixin_Chen1;~Muhan_Zhang1", "gender": "F;M;M;M;;M;M", "homepage": "https://haoliu-cola.github.io/;https://jiaruifeng.github.io/;https://LechengKong.github.io/;https://github.com/NingyueLiang;;https://www.cse.wustl.edu/~yixin.chen/;https://muhanzhang.github.io/", "dblp": "09/3214-57;77/8797;319/5576;;;59/983;157/5518", "google_scholar": ";6CSGUR8AAAAJ;yk3-_EgAAAAJ;;;NByrsK0AAAAJ;https://scholar.google.com.hk/citations?user=OBBqkosAAAAJ", "orcid": ";0000-0002-3409-6819;0000-0001-9427-8799;;;;0000-0002-7680-6401", "linkedin": ";;;ningyue-liang-frank;;;jerry-muhan-zhang-a33a1777/", "or_profile": "~Hao_Liu25;~Jiarui_Feng1;~Lecheng_Kong1;~Ningyue_Liang1;~Dacheng_Tao1;~Yixin_Chen1;~Muhan_Zhang1", "aff": "Washington University in St. Louis;Washington University, Saint Louis;Amazon;Washington University, Saint Louis;;Washington University, Saint Louis;Peking University", "aff_domain": "wustl.edu;wustl.edu;amazon.com;wustl.edu;;wustl.edu;pku.edu.cn", "position": "PhD student;PhD student;Researcher;Undergrad student;;Full Professor;Assistant Professor", "bibtex": "@inproceedings{\nliu2024one,\ntitle={One For All: Towards Training One Graph Model For All Classification Tasks},\nauthor={Hao Liu and Jiarui Feng and Lecheng Kong and Ningyue Liang and Dacheng Tao and Yixin Chen and Muhan Zhang},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=4IT2pgc9v6}\n}", "github": "", "project": "", "reviewers": "A8Qx;RxxK;LMu3;WF3H", "pdf_size": 753506, "rating": "6;6;6;10", "confidence": "4;4;3;5", "soundness": "3;3;2;3", "contribution": "2;3;3;3", "presentation": "3;3;3;4", "wc_summary": "39;154;26;67", "wc_strengths": "44;24;42;44", "wc_weaknesses": "462;270;77;78", "wc_questions": "2;64;7;2", "wc_review": "547;512;152;191", "wc_reply_reviewers": "30;0;43;0", "wc_reply_authors": "1946;855;854;481", "reply_reviewers": "1;0;1;0", "reply_authors": "5;2;3;2", "rating_avg": [ 7.0, 1.7320508075688772 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 71.5, 49.882361612096915 ], "wc_strengths_avg": [ 38.5, 8.411301920630361 ], "wc_weaknesses_avg": [ 221.75, 159.42455112058494 ], "wc_questions_avg": [ 18.75, 26.20472285676763 ], "wc_review_avg": [ 350.5, 179.95624468186705 ], "wc_reply_reviewers_avg": [ 18.25, 18.819869818890883 ], "wc_reply_authors_avg": [ 1034.0, 548.177434778193 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 3.0, 1.224744871391589 ], "replies_avg": [ 21, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": 0.816496580927726, "gs_citation": 47, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=18088863771521081810&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=4IT2pgc9v6", "pdf": "https://openreview.net/pdf?id=4IT2pgc9v6", "email": 
"wustl.edu;wustl.edu;amazon.com;wustl.edu;;wustl.edu;pku.edu.cn", "author_num": 7, "aff_unique_index": "0;0;1;0;0;2", "aff_unique_norm": "Washington University in St. Louis;Amazon;Peking University", "aff_unique_dep": ";Amazon.com, Inc.;", "aff_unique_url": "https://wustl.edu;https://www.amazon.com;http://www.pku.edu.cn", "aff_unique_abbr": "WashU;Amazon;Peking U", "aff_campus_unique_index": "0;1;1;1", "aff_campus_unique": "St. Louis;Saint Louis;", "aff_country_unique_index": "0;0;0;0;0;1", "aff_country_unique": "United States;China" }, { "id": "4IxtmklIym", "title": "FruitBin: A tunable large-scale dataset for advancing 6D Pose estimation in fruit bin picking automation", "track": "main", "status": "Reject", "tldr": "", "abstract": "Bin picking is a ubiquitous application spanning across diverse industries, demanding automated solutions facilitated by robots. These automation systems hinge upon intricate components, including object instance-level segmentation and 6D pose estimation, which are pivotal for predicting future grasping and manipulation success. Contemporary computer vision approaches predominantly rely on deep learning methodologies and necessitate access to extensive instance-level datasets. However, prevailing datasets and benchmarks tend to be confined to oversimplified scenarios, such as those with singular objects on tables or low levels of object clustering. In this research, we introduce FruitBin. It emerges as an unparalleled resource, boasting an extensive collection of over a million images and 40 million instance-level 6D poses. Additionally FruitBin differs with other datasets whith its inclusive representation of a wide spectrum of challenges, encompassing symmetric and asymmetric fruits, objects with and without discernible texture, and diverse lighting conditions, all enriched with extended annotations and metadata. Leveraging the inherent challenges and the sheer scale of FruitBin, we highlight its potential as a versatile benchmarking tool that can be customized to suit various evaluation scenarios. As a demonstration of this adaptability, we have created two distinct types of benchmarks: one centered on novel scene generalization and another focusing on novel camera viewpoint generalization. Both benchmark types offer four levels of occlusion to facilitate the study of occlusion robustness. Notably, our study showcases the difficulty of FruitBin dataset, with two baseline 6D pose estimation models, one utilizing RGB images and the other RGB-D data, across these eight distinct benchmarks. FruitBin emerges as a pioneering dataset distinguishing itself by seamlessly integrating with robotic software. That enable direct testing of trained models in dynamic grasping tasks for the purpose of robot learning. Samples of the dataset with its associated code are provided in the supplementary materials. 
FruitBin promises to be a catalyst for advancing the field of robotics and automation, providing researchers and practitioners with a comprehensive resource to push the boundaries of 6D pose estimation in the context of fruit bin picking and beyond.", "keywords": "Datasets and Benchmarks;6D Pose estimation;Robotic;Bin Picking;Occlusion", "primary_area": "datasets and benchmarks", "supplementary_material": "/attachment/83a8bb39727c49cb6c38ef940d278d5b7dca8cef.zip", "author": "Guillaume Duret;Mahmoud ALI;NICOLAS CAZIN;Alexandre Chapin;Florence Zara;Emmanuel Dellandrea;Jan Peters;Liming Chen", "authorids": "~Guillaume_Duret1;~Mahmoud_ALI1;~NICOLAS_CAZIN1;~Alexandre_Chapin1;~Florence_Zara1;~Emmanuel_Dellandrea2;~Jan_Peters3;~Liming_Chen1", "gender": "M;M;M;M;F;M;M;M", "homepage": ";https://mahmoud-ali.netlify.app/;;https://liris.cnrs.fr/en/member-page/alexandre-chapin;https://perso.liris.cnrs.fr/fzara/Web/index.html;http://perso.ec-lyon.fr/emmanuel.dellandrea/;https://www.jan-peters.net;https://sites.google.com/view/limingchen/accueil", "dblp": ";260/9430;;;87/851;79/5140.html;p/JanPeters1;32/7029-2", "google_scholar": ";;;;https://scholar.google.fr/citations?hl=fr;https://scholar.google.fr/citations?user=lK9Pa0MAAAAJ;https://scholar.google.de/citations?user=-kIVAcAAAAAJ;VOPW5YYAAAAJ", "orcid": ";0009-0002-7658-0446;0000-0002-8382-7227;;0000-0002-0118-7204;;0000-0002-5266-8091;0000-0002-3654-9498", "linkedin": "guillaume-duret-41ab70169/;mahmoud-ali-5b1938b8/;nicolas-cazin-phd-a61b54172/;;;;janrpeters/;liming-chen-039455a/", "or_profile": "~Guillaume_Duret1;~Mahmoud_ALI1;~NICOLAS_CAZIN1;~Alexandre_Chapin1;~Florence_Zara1;~Emmanuel_Dellandrea2;~Jan_Peters3;~Liming_Chen1", "aff": "Ecole Centrale de Lyon;INRIA;;Ecole Centrale de Lyon;LIRIS, CNRS;Ecole Centrale de Lyon;TU Darmstadt;Ecole Centrale de Lyon", "aff_domain": "ec-lyon.fr;inria.fr;;ec-lyon.fr;liris.cnrs.fr;ec-lyon.fr;tu-darmstadt.de;ec-lyon.fr", "position": "PhD student;PhD student;;PhD student;Associate Professor;Associate Professor;Full Professor;Full Professor", "bibtex": "@misc{\nduret2024fruitbin,\ntitle={FruitBin: A tunable large-scale dataset for advancing 6D Pose estimation in fruit bin picking automation},\nauthor={Guillaume Duret and Mahmoud ALI and NICOLAS CAZIN and Alexandre Chapin and Florence Zara and Emmanuel Dellandrea and Jan Peters and Liming Chen},\nyear={2024},\nurl={https://openreview.net/forum?id=4IxtmklIym}\n}", "github": "", "project": "", "reviewers": "J2Gb;Ksan;bGzb;gFnj", "site": "https://openreview.net/forum?id=4IxtmklIym", "pdf_size": 35938534, "rating": "3;3;5;8", "confidence": "4;4;5;5", "soundness": "2;2;3;4", "contribution": "1;2;2;3", "presentation": "2;3;3;4", "wc_summary": "35;71;36;30", "wc_strengths": "22;83;18;41", "wc_weaknesses": "116;378;180;11", "wc_questions": "12;63;35;1", "wc_review": "185;595;269;83", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "439;884;724;223", "reply_reviewers": "0;0;0;0", "reply_authors": "1;2;1;1", "rating_avg": [ 4.75, 2.0463381929681126 ], "confidence_avg": [ 4.5, 0.5 ], "soundness_avg": [ 2.75, 0.82915619758885 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 43.0, 16.32482771731451 ], "wc_strengths_avg": [ 41.0, 25.758493744782516 ], "wc_weaknesses_avg": [ 171.25, 133.74859812349436 ], "wc_questions_avg": [ 27.75, 23.763154251908563 ], "wc_review_avg": [ 283.0, 191.79676743887003 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 567.5, 254.88085451834158 ], 
"reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": 0.8551861104941366, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:GPohUnboD54J:scholar.google.com/&scioq=FruitBin:+A+tunable+large-scale+dataset+for+advancing+6D+Pose+estimation+in+fruit+bin+picking+automation&hl=en&as_sdt=0,5", "gs_version_total": 4, "aff_unique_index": "0;1;0;2;0;3;0", "aff_unique_norm": "Ecole Centrale de Lyon;INRIA;CNRS;Technische Universit\u00e4t Darmstadt", "aff_unique_dep": ";;LIRIS;", "aff_unique_url": "https://www.ec-lyon.fr;https://www.inria.fr;https://www.cnrs.fr;https://www.tu-darmstadt.de", "aff_unique_abbr": "ECL;INRIA;CNRS;TU Darmstadt", "aff_campus_unique_index": "1", "aff_campus_unique": ";Darmstadt", "aff_country_unique_index": "0;0;0;0;0;1;0", "aff_country_unique": "France;Germany" }, { "title": "The Devil is in the Object Boundary: Towards Annotation-free Instance Segmentation using Foundation Models", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19473", "id": "4JbrdrHxYy", "author_site": "cheng shi, Sibei Yang", "tldr": "", "abstract": "Foundation models, pre-trained on a large amount of data have demonstrated impressive zero-shot capabilities in various downstream tasks. However, in object detection and instance segmentation, two fundamental computer vision tasks heavily reliant on extensive human annotations, foundation models such as SAM and DINO struggle to achieve satisfactory performance. \nIn this study, we reveal that the devil is in the object boundary, $\\textit{i.e.}$, these foundation models fail to discern boundaries between individual objects. \nFor the first time, we probe that CLIP, which has never accessed any instance-level annotations, can provide a highly beneficial and strong instance-level boundary prior in the clustering results of its particular intermediate layer. Following this surprising observation, we propose $\\textbf{\\textit{Zip}}$ which $\\textbf{Z}$ips up CL$\\textbf{ip}$ and SAM in a novel classification-first-then-discovery pipeline, enabling annotation-free, complex-scene-capable, open-vocabulary object detection and instance segmentation. \nOur Zip significantly boosts SAM's mask AP on COCO dataset by 12.5\\% and establishes state-of-the-art performance in various settings, including training-free, self-training, and label-efficient finetuning. Furthermore, annotation-free Zip even achieves comparable performance to the best-performing open-vocabulary object detecters using base annotations. 
Code is released at https://github.com/ChengShiest/Zip-Your-CLIP", "keywords": "object detection;annotation-free;instance segmentation;open-vocabulary;SAM;CLIP", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Cheng Shi;Sibei Yang", "authorids": "~Cheng_Shi4;~Sibei_Yang1", "gender": "M;F", "homepage": "https://github.com/ChengShiest;https://sibeiyang.github.io/", "dblp": ";215/4885", "google_scholar": "https://scholar.google.com/citations?view_op=list_works;user=4pg3rtYAAAAJ", "orcid": "0000-0002-6942-8481;", "linkedin": ";", "or_profile": "~Cheng_Shi4;~Sibei_Yang1", "aff": "ShanghaiTech University;ShanghaiTech University", "aff_domain": "shanghaitech.edu.cm;shanghaitech.edu.cn", "position": "MS student;Assistant Professor", "bibtex": "@inproceedings{\nshi2024the,\ntitle={The Devil is in the Object Boundary: Towards Annotation-free Instance Segmentation using Foundation Models},\nauthor={Cheng Shi and Sibei Yang},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=4JbrdrHxYy}\n}", "github": "", "project": "", "reviewers": "CLaV;11pM;5mwu;g6s6;WVZD", "pdf_size": 18169881, "rating": "5;5;6;6;8", "confidence": "4;4;4;4;4", "soundness": "4;2;3;3;4", "contribution": "4;2;3;3;4", "presentation": "4;2;3;3;3", "wc_summary": "108;50;98;54;58", "wc_strengths": "142;27;42;51;45", "wc_weaknesses": "195;270;154;154;46", "wc_questions": "27;70;96;327;335", "wc_review": "472;417;390;586;484", "wc_reply_reviewers": "0;0;0;61;98", "wc_reply_authors": "676;1701;1166;1405;1180", "reply_reviewers": "0;0;0;1;1", "reply_authors": "1;3;3;3;3", "rating_avg": [ 6.0, 1.0954451150103321 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 3.2, 0.7483314773547882 ], "contribution_avg": [ 3.2, 0.7483314773547882 ], "presentation_avg": [ 3.0, 0.6324555320336759 ], "wc_summary_avg": [ 73.6, 24.344198487524704 ], "wc_strengths_avg": [ 61.4, 41.06872289224489 ], "wc_weaknesses_avg": [ 163.8, 72.5545312161825 ], "wc_questions_avg": [ 171.0, 132.50962229211885 ], "wc_review_avg": [ 469.8, 67.62366449697916 ], "wc_reply_reviewers_avg": [ 31.8, 40.66644808684427 ], "wc_reply_authors_avg": [ 1225.6, 336.41676533728224 ], "reply_reviewers_avg": [ 0.4, 0.48989794855663565 ], "reply_authors_avg": [ 2.6, 0.8000000000000002 ], "replies_avg": [ 27, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 5, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=1971090372667658008&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=4JbrdrHxYy", "pdf": "https://openreview.net/pdf?id=4JbrdrHxYy", "email": "shanghaitech.edu.cm;shanghaitech.edu.cn", "author_num": 2, "aff_unique_index": "0;0", "aff_unique_norm": "ShanghaiTech University", "aff_unique_dep": "", "aff_unique_url": "https://www.shanghaitech.edu.cn", "aff_unique_abbr": "ShanghaiTech", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "China" }, { "id": "4JjSJyT15z", "title": "NaturalSigner: Diffusion Models are Natural Sign Language Generator", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Generating natural and expressive sign language pose sequences from text has important practical significance.\nHowever, current sign language generation (SLG) methods suffer from low quality and limited expressiveness.\nIn this work, we propose NaturalSigner, a 
classifier-free diffusion-based generative model designed specifically for SLG.\n Specifically, it consists of a mixed semantic encoder that enhances the semantic consistency and expressiveness of the generated sign language, which takes both text and gloss as input; and a novel sign language denoiser that generates natural sign language pose sequences according to the output of the semantic encoder.\nIn addition, to achieve more natural and high-quality SLG, we design a sign language prompting mechanism to facilitate in-context learning in the diffusion model and duration predictor.\n Experiments on two datasets show that NaturalSigner significantly outperforms the state-of-the-art methods in terms of semantic consistency, naturalness, and expressiveness.\n On the Phoenix-2014T dataset, compared with the previous best end-to-end SLG method, NaturalSigner improves the BLEU-4 score of the back translation metric by more than **40\\%** and reduces the Frechet Inception Distance (FID) by more than **12 times**.", "keywords": "Sign Language Generation;Deep Learning", "primary_area": "generative models", "supplementary_material": "/attachment/5cc75085b25919d113fa52a3f04582aa7bc125e2.zip", "author": "Aoxiong Yin;Jiahao Xun;Xize Cheng;Tao Jin;Shengyu Zhang;Zhou Zhao;Siliang Tang;Fei Wu", "authorids": "~Aoxiong_Yin1;~Jiahao_Xun1;~Xize_Cheng1;~Tao_Jin2;~Shengyu_Zhang2;~Zhou_Zhao3;~Siliang_Tang1;~Fei_Wu1", "gender": ";M;M;M;M;;M;M", "homepage": ";;https://exgc.github.io/;https://hugddygff.github.io/;https://shengyuzhang.github.io/;;https://person.zju.edu.cn/en/siliang;https://person.zju.edu.cn/wufei", "dblp": ";303/0655;334/2167;88/4850-4.html;47/3459-1;;44/5693;84/3254-1", "google_scholar": ";;https://scholar.google.com/citations?hl=zh-CN;;l4Dyt7EAAAAJ;;8e7H3PcAAAAJ;XJLn4MYAAAAJ", "orcid": ";0009-0000-6141-4125;0000-0001-9708-3225;0000-0003-3564-1628;0000-0002-0030-8289;;0000-0002-7356-9711;", "linkedin": ";;;;;;siliang-tang-4734272a/;", "or_profile": "~Aoxiong_Yin1;~Jiahao_Xun1;~Xize_Cheng1;~Tao_Jin2;~Shengyu_Zhang2;~Zhou_Zhao3;~Siliang_Tang1;~Fei_Wu1", "aff": ";Zhejiang University;Zhejiang University;Zhejiang University;Zhejiang University;;Zhejiang University;Zhejiang University", "aff_domain": ";zju.edu.cn;zju.edu.cn;zju.edu.cn;zju.edu.cn;;zju.edu.cn;zju.edu.cn", "position": ";MS student;PhD student;Assistant Professor;ZJU100 Young Professor;;Full Professor;Full Professor", "bibtex": "@misc{\nyin2024naturalsigner,\ntitle={NaturalSigner: Diffusion Models are Natural Sign Language Generator},\nauthor={Aoxiong Yin and Jiahao Xun and Xize Cheng and Tao Jin and Shengyu Zhang and Zhou Zhao and Siliang Tang and Fei Wu},\nyear={2024},\nurl={https://openreview.net/forum?id=4JjSJyT15z}\n}", "github": "", "project": "", "reviewers": "UZBd;BJCa;s9QL;9cnq", "site": "https://openreview.net/forum?id=4JjSJyT15z", "pdf_size": 1363283, "rating": "3;3;5;8", "confidence": "5;5;4;5", "soundness": "2;2;3;3", "contribution": "2;2;3;3", "presentation": "2;2;2;3", "wc_summary": "70;35;66;61", "wc_strengths": "31;36;53;108", "wc_weaknesses": "321;86;219;109", "wc_questions": "2;5;27;84", "wc_review": "424;162;365;362", "wc_reply_reviewers": "223;0;112;0", "wc_reply_authors": "1150;729;1353;535", "reply_reviewers": "1;0;1;0", "reply_authors": "3;2;3;1", "rating_avg": [ 4.75, 2.0463381929681126 ], "confidence_avg": [ 4.75, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 58.0, 13.656500283747663 ], 
"wc_strengths_avg": [ 57.0, 30.553232234904378 ], "wc_weaknesses_avg": [ 183.75, 93.83862477679433 ], "wc_questions_avg": [ 29.5, 32.912763481664676 ], "wc_review_avg": [ 328.25, 99.11703940292001 ], "wc_reply_reviewers_avg": [ 83.75, 92.48885067941973 ], "wc_reply_authors_avg": [ 941.75, 325.2701761612952 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 2.25, 0.82915619758885 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": -0.07053456158585983, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:ZHwXzOEg9YIJ:scholar.google.com/&scioq=NaturalSigner:+Diffusion+Models+are+Natural+Sign+Language+Generator&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;0;0;0;0", "aff_unique_norm": "Zhejiang University", "aff_unique_dep": "", "aff_unique_url": "https://www.zju.edu.cn", "aff_unique_abbr": "ZJU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "China" }, { "id": "4JtwtT4nYC", "title": "Multi-Task Reinforcement Learning with Shared-Unique Features and Task-Aware Prioritized Experience Replay", "track": "main", "status": "Reject", "tldr": "", "abstract": "Multi-task reinforcement learning (MTRL) has emerged as a challenging problem to reduce the computational cost of reinforcement learning and leverage shared features among tasks to improve the performance of individual tasks. \nHowever, a key challenge lies in determining which features should be shared across tasks and how to preserve the unique features that differentiate each task. This challenge often leads to the problem of task performance imbalance, where certain tasks may dominate the learning process while others are neglected. \nIn this paper, we propose a novel approach called shared-unique features along with task-aware prioritized experience replay to improve training stability and leverage shared and unique features effectively. \nWe incorporate a simple yet effective task-specific embeddings to preserve the unique features of each task to mitigate the potential problem of task performance imbalance. \nAdditionally, we introduce task-aware settings to the prioritized experience replay (PER) algorithm to accommodate multi-task training and enhancing training stability. \nOur approach achieves state-of-the-art average success rates on the Meta-World benchmark, while maintaining stable performance across all tasks, avoiding task performance imbalance issues. The results demonstrate the effectiveness of our method in addressing the challenges of MTRL.", "keywords": "Multi-task reinforcement learning;Experience replay;Shared-unique features", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Po-Shao Lin;Jia-Fong Yeh;Yi-Ting Chen;Winston H. 
Hsu", "authorids": "~Po-Shao_Lin2;~Jia-Fong_Yeh1;~Yi-Ting_Chen2;~Winston_H._Hsu2", "gender": ";M;M;M", "homepage": "https://www.cmlab.csie.ntu.edu.tw/~jiafongyeh/;https://sites.google.com/site/yitingchen0524/;https://github.com/Tonylin1998;https://winstonhsu.info/", "dblp": "198/7831;12/5268-1;;16/5668.html", "google_scholar": "kS-oZ20AAAAJ;8tRH7RMAAAAJ;;https://scholar.google.com.tw/citations?user=NOvDH3QAAAAJ", "orcid": ";;;0000-0002-3330-0638", "linkedin": ";;;", "or_profile": "~Jia-Fong_Yeh1;~Yi-Ting_Chen2;~\u67cf\u52ad_\u67971;~Winston_Hsu1", "aff": "Sony Group Corporation;National Yang Ming Chiao Tung University;;National Taiwan University", "aff_domain": "sony.com;nycu.edu.tw;;ntu.edu.tw", "position": "Intern;Assistant Professor;;Professor", "bibtex": "@misc{\nlin2024multitask,\ntitle={Multi-Task Reinforcement Learning with Shared-Unique Features and Task-Aware Prioritized Experience Replay},\nauthor={Po-Shao Lin and Jia-Fong Yeh and Yi-Ting Chen and Winston H. Hsu},\nyear={2024},\nurl={https://openreview.net/forum?id=4JtwtT4nYC}\n}", "github": "", "project": "", "reviewers": "89dx;MxpY;7qsQ", "site": "https://openreview.net/forum?id=4JtwtT4nYC", "pdf_size": 765199, "rating": "3;3;3", "confidence": "4;4;4", "soundness": "3;2;2", "contribution": "2;2;2", "presentation": "3;1;2", "wc_summary": "88;155;54", "wc_strengths": "112;48;30", "wc_weaknesses": "163;320;259", "wc_questions": "35;31;34", "wc_review": "398;554;377", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 3.0, 0.0 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.0, 0.816496580927726 ], "wc_summary_avg": [ 99.0, 41.960298696108765 ], "wc_strengths_avg": [ 63.333333333333336, 35.188381921057726 ], "wc_weaknesses_avg": [ 247.33333333333334, 64.62369706401996 ], "wc_questions_avg": [ 33.333333333333336, 1.699673171197595 ], "wc_review_avg": [ 443.0, 78.95568377260753 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:xvq29vV_NhAJ:scholar.google.com/&scioq=Multi-Task+Reinforcement+Learning+with+Shared-Unique+Features+and+Task-Aware+Prioritized+Experience+Replay&hl=en&as_sdt=0,23", "gs_version_total": 0, "aff_unique_index": "0;1;2", "aff_unique_norm": "Sony Group Corporation;National Yang Ming Chiao Tung University;National Taiwan University", "aff_unique_dep": ";;", "aff_unique_url": "https://www.sony.com;https://www.nycu.edu.tw;https://www.ntu.edu.tw", "aff_unique_abbr": "Sony;NYCU;NTU", "aff_campus_unique_index": "1;1", "aff_campus_unique": ";Taiwan", "aff_country_unique_index": "0;1;1", "aff_country_unique": "Japan;China" }, { "title": "Neurosymbolic Grounding for Compositional World Models", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19472", "id": "4KZpDGD4Nh", "author_site": "Atharva Sehgal, Arya Grayeli, Jennifer Sun, Swarat Chaudhuri", "tldr": "", "abstract": "We introduce Cosmos, a framework for object-centric world modeling that is designed for compositional generalization (CompGen), i.e., high performance on unseen input scenes obtained through the composition of known visual \"atoms.\" The central insight behind Cosmos is the use of a novel form 
of neurosymbolic grounding. Specifically, the framework introduces two new tools: (i) neurosymbolic scene encodings, which represent each entity in a scene using a real vector computed using a neural encoder, as well as a vector of composable symbols describing attributes of the entity, and (ii) a neurosymbolic attention mechanism that binds these entities to learned rules of interaction. Cosmos is end-to-end differentiable; also, unlike traditional neurosymbolic methods that require representations to be manually mapped to symbols, it computes an entity's symbolic attributes using vision-language foundation models. Through an evaluation that considers two different forms of CompGen on an established blocks-pushing domain, we show that the framework establishes a new state-of-the-art for CompGen in world modeling. Artifacts are available at: https://trishullab.github.io/cosmos-web/", "keywords": "neurosymbolic learning;machine learning;world modeling;compositional generalization", "primary_area": "neurosymbolic & hybrid AI systems (physics-informed, logic & formal reasoning, etc.)", "supplementary_material": "/attachment/821493eb5c04dce714ca9b717b1be29b91ca9837.zip", "author": "Atharva Sehgal;Arya Grayeli;Jennifer J. Sun;Swarat Chaudhuri", "authorids": "~Atharva_Sehgal1;~Arya_Grayeli1;~Jennifer_J._Sun1;~Swarat_Chaudhuri1", "gender": "M;M;M;F", "homepage": "https://www.atharvas.net;;http://www.cs.utexas.edu/~swarat;https://jenjsun.com/", "dblp": ";;37/6100;232/1563", "google_scholar": ";;9j6RBYQAAAAJ;", "orcid": ";;0000-0002-6859-1391;", "linkedin": "atharvas/;aryagrayeli/;swarat-chaudhuri-609b3092/;jennifer-sun-224778a3/", "or_profile": "~Atharva_Sehgal1;~Arya_Grayeli1;~Swarat_Chaudhuri1;~Jennifer_Jianing_Sun1", "aff": "University of Texas at Austin;University of Texas at Austin;University of Texas at Austin;Google", "aff_domain": "utexas.edu;utexas.edu;utexas.edu;google.com", "position": "PhD student;Undergrad student;Full Professor;Researcher", "bibtex": "@inproceedings{\nsehgal2024neurosymbolic,\ntitle={Neurosymbolic Grounding for Compositional World Models},\nauthor={Atharva Sehgal and Arya Grayeli and Jennifer J. 
Sun and Swarat Chaudhuri},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=4KZpDGD4Nh}\n}", "github": "", "project": "", "reviewers": "QCEm;CQ89;5cti", "pdf_size": 1745886, "rating": "6;6;6", "confidence": "4;4;2", "soundness": "3;3;2", "contribution": "2;2;3", "presentation": "3;3;3", "wc_summary": "62;71;27", "wc_strengths": "64;78;44", "wc_weaknesses": "310;457;109", "wc_questions": "41;21;5", "wc_review": "477;627;185", "wc_reply_reviewers": "66;23;26", "wc_reply_authors": "1438;1728;912", "reply_reviewers": "1;1;1", "reply_authors": "3;3;2", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 3.3333333333333335, 0.9428090415820634 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 53.333333333333336, 18.979521127315678 ], "wc_strengths_avg": [ 62.0, 13.9522996909709 ], "wc_weaknesses_avg": [ 292.0, 142.63940549511554 ], "wc_questions_avg": [ 22.333333333333332, 14.72714802291635 ], "wc_review_avg": [ 429.6666666666667, 183.52353769718175 ], "wc_reply_reviewers_avg": [ 38.333333333333336, 19.601587237318874 ], "wc_reply_authors_avg": [ 1359.3333333333333, 337.7428344498551 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 2.6666666666666665, 0.4714045207910317 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 7, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=18138122186326119791&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=4KZpDGD4Nh", "pdf": "https://openreview.net/pdf?id=4KZpDGD4Nh", "email": "utexas.edu;utexas.edu;utexas.edu;google.com", "author_num": 4, "aff_unique_index": "0;0;0;1", "aff_unique_norm": "University of Texas at Austin;Google", "aff_unique_dep": ";Google", "aff_unique_url": "https://www.utexas.edu;https://www.google.com", "aff_unique_abbr": "UT Austin;Google", "aff_campus_unique_index": "0;0;0;1", "aff_campus_unique": "Austin;Mountain View", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "title": "Curiosity-driven Red-teaming for Large Language Models", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19471", "id": "4KqkizXgXU", "author_site": "Zhang-Wei Hong, Idan Shenfeld, Johnson (Tsun-Hsuan) Wang, Yung-Sung Chuang, Aldo Pareja, James R Glass, Akash Srivastava, Pulkit Agrawal", "tldr": "", "abstract": "Large language models (LLMs) hold great potential for many natural language applications but risk generating incorrect or toxic content. To probe when an LLM generates unwanted content, the current paradigm is to recruit a $\\textit{red team}$ of human testers to design input prompts (i.e., test cases) that elicit undesirable responses from LLMs. \nHowever, relying solely on human testers is expensive and time-consuming. Recent works automate red teaming by training a separate red team LLM with reinforcement learning (RL) to generate test cases that maximize the chance of eliciting undesirable responses from the target LLM. 
However, current RL methods are only able to generate a small number of effective test cases resulting in a low coverage of the span of prompts that elicit undesirable responses from the target LLM.\nTo overcome this limitation, we draw a connection between the problem of increasing the coverage of generated test cases and the well-studied approach of curiosity-driven exploration that optimizes for novelty. \nOur method of curiosity-driven red teaming (CRT) achieves greater coverage of test cases while mantaining or increasing their effectiveness compared to existing methods.\nOur method, CRT successfully provokes toxic responses from LLaMA2 model that has been heavily fine-tuned using human preferences to avoid toxic outputs. Code is available at https://github.com/Improbable-AI/curiosity_redteam.", "keywords": "Curiosity-driven exploration;Reinforcement learning;Language model", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/da3812c3dc922578aa3779e75911bd941e9e9d13.zip", "author": "Zhang-Wei Hong;Idan Shenfeld;Tsun-Hsuan Wang;Yung-Sung Chuang;Aldo Pareja;James R. Glass;Akash Srivastava;Pulkit Agrawal", "authorids": "~Zhang-Wei_Hong1;~Idan_Shenfeld1;~Tsun-Hsuan_Wang2;~Yung-Sung_Chuang1;~Aldo_Pareja1;~James_R._Glass1;~Akash_Srivastava1;~Pulkit_Agrawal1", "gender": "M;M;M;M;M;;M;M", "homepage": ";https://www.linkedin.com/in/idan-shenfeld/;https://zswang666.github.io/;https://people.csail.mit.edu/yungsung/;https://mitibmwatsonailab.mit.edu/people/aldo-pareja/;;http://akashgit.github.io;https://people.eecs.berkeley.edu/~pulkitag/", "dblp": "198/0600;;217/1809.html;64/3095;;;24/9528;149/2672", "google_scholar": "GZkyN4cAAAAJ;;xE3WSuYAAAAJ;3ar1DOwAAAAJ;;;https://scholar.google.co.uk/citations?user=2h6SZeEAAAAJ;UpZmJI0AAAAJ", "orcid": ";;;0000-0002-1723-5063;;;;", "linkedin": ";;;yschuang;;;https://uk.linkedin.com/in/akash-srivastava-aa97361b;", "or_profile": "~Zhang-Wei_Hong1;~Idan_Shenfeld1;~Tsun-Hsuan_Wang2;~Yung-Sung_Chuang1;~Aldo_Pareja1;~James_R._Glass1;~Akash_Srivastava1;~Pulkit_Agrawal1", "aff": "Massachusetts Institute of Technology;Massachusetts Institute of Technology;Liquid AI;Massachusetts Institute of Technology;Delft University of Technology;;International Business Machines;Massachusetts Institute of Technology", "aff_domain": "mit.edu;mit.edu;liquid.ai;mit.edu;tudelft.nl;;ibm.com;mit.edu", "position": "PhD student;PhD student;Researcher;PhD student;PhD student;;Principal Researcher;Assistant Professor", "bibtex": "@inproceedings{\nhong2024curiositydriven,\ntitle={Curiosity-driven Red-teaming for Large Language Models},\nauthor={Zhang-Wei Hong and Idan Shenfeld and Tsun-Hsuan Wang and Yung-Sung Chuang and Aldo Pareja and James R. 
Glass and Akash Srivastava and Pulkit Agrawal},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=4KqkizXgXU}\n}", "github": "", "project": "", "reviewers": "NqgB;TuLd;ZhdE;8YjF", "pdf_size": 721695, "rating": "8;8;8;8", "confidence": "3;3;3;4", "soundness": "3;4;3;3", "contribution": "3;3;3;3", "presentation": "3;4;4;3", "wc_summary": "107;69;108;65", "wc_strengths": "63;59;74;91", "wc_weaknesses": "52;101;141;78", "wc_questions": "46;124;82;1", "wc_review": "268;353;405;235", "wc_reply_reviewers": "0;21;99;19", "wc_reply_authors": "443;767;1145;194", "reply_reviewers": "0;1;2;1", "reply_authors": "2;2;2;1", "rating_avg": [ 8.0, 0.0 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 3.5, 0.5 ], "wc_summary_avg": [ 87.25, 20.30240133580262 ], "wc_strengths_avg": [ 71.75, 12.397076268217438 ], "wc_weaknesses_avg": [ 93.0, 32.687918257362305 ], "wc_questions_avg": [ 63.25, 45.31762902006238 ], "wc_review_avg": [ 315.25, 67.36607083688345 ], "wc_reply_reviewers_avg": [ 34.75, 37.989307706248084 ], "wc_reply_authors_avg": [ 637.25, 356.66817561986096 ], "reply_reviewers_avg": [ 1.0, 0.7071067811865476 ], "reply_authors_avg": [ 1.75, 0.4330127018922193 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 71, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14267068665623037182&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 9, "openreview": "https://openreview.net/forum?id=4KqkizXgXU", "pdf": "https://openreview.net/pdf?id=4KqkizXgXU", "email": "mit.edu;mit.edu;liquid.ai;mit.edu;tudelft.nl;;ibm.com;mit.edu", "author_num": 8, "aff_unique_index": "0;0;1;0;2;3;0", "aff_unique_norm": "Massachusetts Institute of Technology;Liquid AI;Delft University of Technology;International Business Machines Corporation", "aff_unique_dep": ";;;", "aff_unique_url": "https://web.mit.edu;;https://www.tudelft.nl;https://www.ibm.com", "aff_unique_abbr": "MIT;;TU Delft;IBM", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;1;0;2;0;0", "aff_country_unique": "United States;Unknown;Netherlands" }, { "title": "Chain-of-Table: Evolving Tables in the Reasoning Chain for Table Understanding", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19470", "id": "4L0xnS4GQM", "author_site": "Zilong Wang, Hao Zhang, Chun-Liang Li, Julian M Eisenschlos, Vincent Perot, Zifeng Wang, Lesly Miculicich, Yasuhisa Fujii, Jingbo Shang, Chen-Yu Lee, Tomas Pfister", "tldr": "", "abstract": "Table-based reasoning with large language models (LLMs) is a promising direction to tackle many table understanding tasks, such as table-based question answering and fact verification. Compared with generic reasoning, table-based reasoning requires the extraction of underlying semantics from both free-form questions and semi-structured tabular data. Chain-of-Thought and its similar approaches incorporate the reasoning chain in the form of textual context, but it is still an open question how to effectively leverage tabular data in the reasoning chain. We propose the Chain-of-Table framework, where tabular data is explicitly used in the reasoning chain as a proxy for intermediate thoughts. Specifically, we guide LLMs using in-context learning to iteratively generate operations and update the table to represent a tabular reasoning chain. 
LLMs can therefore dynamically plan the next operation based on the results of the previous ones. This continuous evolution of the table forms a chain, showing the reasoning process for a given tabular problem. The chain carries structured information of the intermediate results, enabling more accurate and reliable predictions. Chain-of-Table achieves new state-of-the-art performance on WikiTQ, FeTaQA, and TabFact benchmarks across multiple LLM choices.", "keywords": "Table Understanding;In-context Learning;Large Language Model", "primary_area": "generative models", "supplementary_material": "/attachment/e8fac55cc78468acf93bb210c449fc8e6fc3848a.zip", "author": "Zilong Wang;Hao Zhang;Chun-Liang Li;Julian Martin Eisenschlos;Vincent Perot;Zifeng Wang;Lesly Miculicich;Yasuhisa Fujii;Jingbo Shang;Chen-Yu Lee;Tomas Pfister", "authorids": "~Zilong_Wang1;~Hao_Zhang68;~Chun-Liang_Li1;~Julian_Martin_Eisenschlos1;~Vincent_Perot1;~Zifeng_Wang1;~Lesly_Miculicich1;~Yasuhisa_Fujii1;~Jingbo_Shang2;~Chen-Yu_Lee2;~Tomas_Pfister1", "gender": "M;;M;M;M;M;F;M;M;;M", "homepage": "https://zilongwang.me;https://www.lti.cs.cmu.edu/people/19123/hao-zhang;http://chunliangli.github.io;https://eisenjulian.github.io/;;https://kingspencer.github.io/;;;https://shangjingbo1226.github.io/;https://chl260.github.io/;http://tomas.pfister.fi", "dblp": "42/898-2;;;262/3990;227/2509;43/7716-2;;84/8914;151/3145.html;04/656;14/8360", "google_scholar": "S_wQccsAAAAJ;;https://scholar.google.com.tw/citations?user=vqHIt_sAAAAJ;2uAC2NQAAAAJ;RrANep4AAAAJ;https://scholar.google.co.il/citations?user=N1uBekcAAAAJ;https://scholar.google.ch/citations?user=0JL8SrsAAAAJ;_o1nj0gAAAAJ;0SkFI4MAAAAJ;uWPUSEgAAAAJ;ahSpJOAAAAAJ", "orcid": "0000-0002-1614-0943;;;;;;;;;;0009-0004-4088-8718", "linkedin": ";;;eisenjulian/;vincentperot/;zifeng-wang-21b069b4/;lesly-miculicich-werlen;;;chenyulee260/;", "or_profile": "~Zilong_Wang1;~Hao_Zhang68;~Chun-Liang_Li1;~Julian_Martin_Eisenschlos1;~Vincent_Perot1;~Zifeng_Wang1;~Lesly_Miculicich1;~Yasuhisa_Fujii1;~Jingbo_Shang2;~Chen-Yu_Lee2;~Tomas_Pfister1", "aff": "University of California, San Diego;;Apple;Universidad Nacional de C\u00f3rdoba;Google;Google;Google;Google;University of California, San Diego;Google;Google", "aff_domain": "ucsd.edu;;apple.com;unc.edu.ar;google.com;google.com;google.com;google.com;ucsd.edu;google.com;google.com", "position": "PhD student;;Researcher;PhD student;Software Engineer;Research Scientist;Researcher;RS;Assistant Professor;Research Scientist;Head of Research @ Cloud AI", "bibtex": "@inproceedings{\nwang2024chainoftable,\ntitle={Chain-of-Table: Evolving Tables in the Reasoning Chain for Table Understanding},\nauthor={Zilong Wang and Hao Zhang and Chun-Liang Li and Julian Martin Eisenschlos and Vincent Perot and Zifeng Wang and Lesly Miculicich and Yasuhisa Fujii and Jingbo Shang and Chen-Yu Lee and Tomas Pfister},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=4L0xnS4GQM}\n}", "github": "", "project": "", "reviewers": "xr4a;eSFE;3YkD;4HBR", "pdf_size": 1425645, "rating": "5;5;6;6", "confidence": "3;4;3;3", "soundness": "3;3;3;3", "contribution": "2;2;3;4", "presentation": "3;3;3;3", "wc_summary": "78;96;46;68", "wc_strengths": "51;42;92;63", "wc_weaknesses": "200;138;115;53", "wc_questions": "26;53;7;140", "wc_review": "355;329;260;324", "wc_reply_reviewers": "0;0;0;11", "wc_reply_authors": "801;840;972;895", "reply_reviewers": "0;0;0;1", "reply_authors": "4;5;4;5", "rating_avg": [ 5.5, 0.5 ], 
"confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.75, 0.82915619758885 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 72.0, 18.05547008526779 ], "wc_strengths_avg": [ 62.0, 18.854707634964804 ], "wc_weaknesses_avg": [ 126.5, 52.60465758846834 ], "wc_questions_avg": [ 56.5, 50.904322016897545 ], "wc_review_avg": [ 317.0, 34.94996423460259 ], "wc_reply_reviewers_avg": [ 2.75, 4.763139720814412 ], "wc_reply_authors_avg": [ 877.0, 64.21448434738069 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 4.5, 0.5 ], "replies_avg": [ 25, 0 ], "authors#_avg": [ 11, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 107, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=13815199908318046768&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=4L0xnS4GQM", "pdf": "https://openreview.net/pdf?id=4L0xnS4GQM", "email": "ucsd.edu;;apple.com;unc.edu.ar;google.com;google.com;google.com;google.com;ucsd.edu;google.com;google.com", "author_num": 11, "aff_unique_index": "0;1;2;3;3;3;3;0;3;3", "aff_unique_norm": "University of California, San Diego;Apple;Universidad Nacional de C\u00f3rdoba;Google", "aff_unique_dep": ";Apple Inc.;;Google", "aff_unique_url": "https://www.ucsd.edu;https://www.apple.com;https://www.unc.edu.ar;https://www.google.com", "aff_unique_abbr": "UCSD;Apple;UNC;Google", "aff_campus_unique_index": "0;2;2;2;2;0;2;2", "aff_campus_unique": "San Diego;;Mountain View", "aff_country_unique_index": "0;0;1;0;0;0;0;0;0;0", "aff_country_unique": "United States;Argentina" }, { "title": "Deep Reinforcement Learning for Modelling Protein Complexes", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19469", "id": "4MsfQ2H0lP", "author_site": "Ziqi Gao, Tao Feng, Jiaxuan You, Chenyi Zi, Yan Zhou, Chen Zhang, Jia Li", "tldr": "", "abstract": "Structure prediction of large protein complexes (a.k.a., protein multimer mod-\nelling, PMM) can be achieved through the one-by-one assembly using provided\ndimer structures and predicted docking paths. However, existing PMM methods\nstruggle with vast search spaces and generalization challenges: (1) The assembly\nof a N -chain multimer can be depicted using graph structured data, with each\nchain represented as a node and assembly actions as edges. Thus the assembly\ngraph can be arbitrary acyclic undirected connected graph, leading to the com-\nbinatorial optimization space of N^(N \u22122) for the PMM problem. (2) Knowledge\ntransfer in the PMM task is non-trivial. The gradually limited data availability as\nthe chain number increases necessitates PMM models that can generalize across\nmultimers of various chains. To address these challenges, we propose GAPN, a\nGenerative Adversarial Policy Network powered by domain-specific rewards and\nadversarial loss through policy gradient for automatic PMM prediction. Specifi-\ncally, GAPN learns to efficiently search through the immense assembly space and\noptimize the direct docking reward through policy gradient. Importantly, we de-\nsign a adversarial reward function to enhance the receptive field of our model. 
In\nthis way, GAPN will simultaneously focus on a specific batch of multimers and\nthe global assembly rules learned from multimers with varying chain numbers.\nEmpirically, we have achieved both significant accuracy (measured by RMSD\nand TM-Score) and efficiency improvements compared to leading complex mod-\neling software. GAPN outperforms the state-of-the-art method (MoLPC) with up\nto 27% improvement in TM-Score, with a speed-up of 600\u00d7.", "keywords": "protein complex structure prediction;docking path prediction;policy network;reinforcement learning", "primary_area": "applications to physical sciences (physics, chemistry, biology, etc.)", "supplementary_material": "", "author": "Ziqi Gao;Tao Feng;Jiaxuan You;Chenyi Zi;Yan Zhou;Chen Zhang;Jia Li", "authorids": "~Ziqi_Gao1;~Tao_Feng5;~Jiaxuan_You2;~Chenyi_Zi2;~Yan_Zhou10;~Chen_Zhang24;~Jia_Li4", "gender": ";M;M;M;M;M;M", "homepage": ";;;http://www.chuanglintech.com;https://facultyprofiles.hkust-gz.edu.cn/faculty-personal-page/ZHANG-Chen/chenzhang;https://sites.google.com/view/lijia;https://cs.stanford.edu/~jiaxuan/", "dblp": ";;;;94/4084-10;23/6950-9;192/4727", "google_scholar": "https://scholar.google.com.hk/citations?user=UHwNFy8AAAAJ;3xK6SlIAAAAJ;uGbNoaQAAAAJ;;https://scholar.google.ca/citations?user=AHEItGQAAAAJ;1gSbcYoAAAAJ;NDbMl7oAAAAJ", "orcid": ";;;;0000-0001-8706-1372;0000-0002-6362-4385;", "linkedin": ";;;;;;jiaxuan-you-5859b37b/", "or_profile": "~Ziqi_Gao1;~Tao_Feng5;~Chenyi_Zi2;~Yan_Zhou10;~Chen_Zhang24;~Jia_Li4;~Jiaxuan_You1", "aff": "Hong Kong University of Science and Technology;Department of Computer Science, University of Illinois at Urbana-Champaign;Hong Kong University of Science and Technology;;Hong Kong University of Science and Technology;Hong Kong University of Science and Technology (Guangzhou);NVIDIA", "aff_domain": "ust.hk;cs.illinois.edu;hkust.edu;;hkust-gz.edu.cn;ust.hk;nvidia.com", "position": "PhD student;PhD student;MS student;;Associate Professor;Assistant Professor;Researcher", "bibtex": "@inproceedings{\ngao2024deep,\ntitle={Deep Reinforcement Learning for Modelling Protein Complexes},\nauthor={Ziqi Gao and Tao Feng and Jiaxuan You and Chenyi Zi and Yan Zhou and Chen Zhang and Jia Li},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=4MsfQ2H0lP}\n}", "github": "", "project": "", "reviewers": "rNSL;554U;Sjm2;MBaj", "pdf_size": 6159313, "rating": "6;6;6;6", "confidence": "5;3;3;3", "soundness": "3;3;2;3", "contribution": "2;3;2;3", "presentation": "3;2;2;3", "wc_summary": "73;80;130;82", "wc_strengths": "37;24;108;117", "wc_weaknesses": "176;14;180;49", "wc_questions": "120;1;24;51", "wc_review": "406;119;442;299", "wc_reply_reviewers": "61;23;0;17", "wc_reply_authors": "1670;225;1103;1192", "reply_reviewers": "1;1;0;1", "reply_authors": "4;2;4;3", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 3.5, 0.8660254037844386 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 91.25, 22.620510604316607 ], "wc_strengths_avg": [ 71.5, 41.379342672401165 ], "wc_weaknesses_avg": [ 104.75, 74.3013290594455 ], "wc_questions_avg": [ 49.0, 44.64862819841165 ], "wc_review_avg": [ 316.5, 125.57169266996443 ], "wc_reply_reviewers_avg": [ 25.25, 22.29770167528483 ], "wc_reply_authors_avg": [ 1047.5, 521.52972110897 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 3.25, 0.82915619758885 ], "replies_avg": [ 23, 0 ], 
"authors#_avg": [ 7, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=16435311423968251503&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=4MsfQ2H0lP", "pdf": "https://openreview.net/pdf?id=4MsfQ2H0lP", "email": "ust.hk;cs.illinois.edu;hkust.edu;;hkust-gz.edu.cn;ust.hk;nvidia.com", "author_num": 7, "aff_unique_index": "0;1;0;0;0;2", "aff_unique_norm": "Hong Kong University of Science and Technology;University of Illinois Urbana-Champaign;NVIDIA", "aff_unique_dep": ";Department of Computer Science;NVIDIA Corporation", "aff_unique_url": "https://www.ust.hk;https://illinois.edu;https://www.nvidia.com", "aff_unique_abbr": "HKUST;UIUC;NVIDIA", "aff_campus_unique_index": "0;1;0;0;0", "aff_campus_unique": "Hong Kong SAR;Urbana-Champaign;", "aff_country_unique_index": "0;1;0;0;0;1", "aff_country_unique": "China;United States" }, { "id": "4MvHiijJL3", "title": "Model Explanation Disparities as a Fairness Diagnostic", "track": "main", "status": "Reject", "tldr": "", "abstract": "Recent works on fairness in machine learning have focused on quantifying and eliminating bias against protected subgroups, and extended these results to more complex subgroups beyond simple discrete classes, known as \"rich subgroups.\" Orthogonally, recent works in model interpretability develop local feature importance methods that, given a classifier $h$ and test point $x$, attribute influence for the prediction $h(x)$ to the individual features of $x$. This raises a natural question: Do local feature importance methods attribute different feature importance values on average in protected subgroups versus the whole population, and can we detect these disparities efficiently? In this paper, we formally introduce the notion of feature importance disparity (FID) in the context of rich subgroups, which could be used as a potential indicator of bias in the model or data generation process. We design an oracle-efficient algorithm to identify large FID subgroups and conduct a thorough empirical analysis auditing for these subgroups across $4$ datasets and $4$ common feature importance methods of broad interest to the machine learning community. 
Our algorithm finds (feature, subgroup) pairs that: (i) have subgroup feature importance that is often an order of magnitude different than the importance on the whole dataset (ii) generalize out of sample, and (iii) yield interesting discussions about potential bias inherent in these common datasets.", "keywords": "Explainability;Auditing;Rich Subgroups;Fairness", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/a93d04395392acfeed805fa286a9eb29d65d07f2.zip", "author": "Peter W Chang;Leor Fishman;Seth Neel", "authorids": "~Peter_W_Chang1;~Leor_Fishman1;~Seth_Neel2", "gender": "M;M;M", "homepage": ";;https://sethneel.com", "dblp": ";;188/6406", "google_scholar": ";;", "orcid": "0000-0003-3971-2630;;", "linkedin": "peter-chang-31718baa/;leor-f-63490785/;", "or_profile": "~Peter_W_Chang1;~Leor_Fishman1;~Seth_Neel1", "aff": "Harvard University;;Harvard University", "aff_domain": "harvard.edu;;harvard.edu", "position": "Researcher;;Assistant Professor", "bibtex": "@misc{\nchang2024model,\ntitle={Model Explanation Disparities as a Fairness Diagnostic},\nauthor={Peter W Chang and Leor Fishman and Seth Neel},\nyear={2024},\nurl={https://openreview.net/forum?id=4MvHiijJL3}\n}", "github": "", "project": "", "reviewers": "tQK6;nvHG;SE4V;ZZsY;5Fo2", "site": "https://openreview.net/forum?id=4MvHiijJL3", "pdf_size": 2289369, "rating": "3;5;5;6;8", "confidence": "4;2;2;3;4", "soundness": "2;2;3;3;3", "contribution": "2;2;2;3;3", "presentation": "3;2;2;3;3", "wc_summary": "97;64;90;63;156", "wc_strengths": "50;18;50;56;60", "wc_weaknesses": "132;63;320;58;177", "wc_questions": "228;37;5;49;199", "wc_review": "507;182;465;226;592", "wc_reply_reviewers": "0;0;0;0;0", "wc_reply_authors": "1246;757;641;354;667", "reply_reviewers": "0;0;0;0;0", "reply_authors": "2;1;1;1;1", "rating_avg": [ 5.4, 1.624807680927192 ], "confidence_avg": [ 3.0, 0.8944271909999159 ], "soundness_avg": [ 2.6, 0.4898979485566356 ], "contribution_avg": [ 2.4, 0.4898979485566356 ], "presentation_avg": [ 2.6, 0.4898979485566356 ], "wc_summary_avg": [ 94.0, 33.85262175962151 ], "wc_strengths_avg": [ 46.8, 14.891608375189028 ], "wc_weaknesses_avg": [ 150.0, 95.90203334653546 ], "wc_questions_avg": [ 103.6, 91.34024304762933 ], "wc_review_avg": [ 394.4, 161.35749130424654 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 733.0, 289.898602963174 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.2, 0.4000000000000001 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.13762047064079508, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10004785071373874203&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "Harvard University", "aff_unique_dep": "", "aff_unique_url": "https://www.harvard.edu", "aff_unique_abbr": "Harvard", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "id": "4N7v4w2r3b", "title": "Robustness Evaluation of Proxy Models against Adversarial Optimization", "track": "main", "status": "Reject", "tldr": "", "abstract": "Ensuring the robustness of neural network proxies to optimization pressure is crucial as machine learning applications expand across diverse domains. However, research on proxy robustness remains limited and largely unexplored. 
In this paper, we introduce a comprehensive benchmark for investigating the robustness of neural network proxies under various sources of optimization pressure in the text domain. Through extensive experiments using our benchmark, we uncover previously unknown properties of the proxy gaming problem and highlight serious issues with proxy reward models currently used to fine-tune or monitor large language models. Furthermore, we explore different approaches to enhance proxy robustness and demonstrate the potential of adversarial training to improve alignment between proxy and gold models. Our findings suggest that proxy robustness is a solvable problem that can be incrementally improved, laying the groundwork for future research in this important area.", "keywords": "proxy gaming;reward hacking;specification gaming;misspecification;robustness;adversarial robustness;adversarial attacks;alignment;ai safety", "primary_area": "datasets and benchmarks", "supplementary_material": "/attachment/c02cda3326c492710ad2b34cd7dde7da94f9636e.zip", "author": "Andy Zou;Long Phan;Nathaniel Li;Jun Shern Chan;Mantas Mazeika;Aidan O'Gara;Steven Basart;Jonathan Ng;Scott Emmons;J Zico Kolter;Matt Fredrikson;Dan Hendrycks", "authorids": "~Andy_Zou1;~Long_Phan1;~Nathaniel_Li1;~Jun_Shern_Chan1;~Mantas_Mazeika3;~Aidan_O'Gara1;~Steven_Basart1;~Jonathan_Ng1;~Scott_Emmons1;~J_Zico_Kolter1;~Matt_Fredrikson1;~Dan_Hendrycks1", "gender": ";M;M;M;M;;M;M;M;M;;M", "homepage": ";;https://nli0.github.io;https://junshern.github.io/;https://github.com/mmazeika;;http://stevenbas.art;;http://scottemmons.com/;https://cs.cmu.edu/~mfredrik;;http://www.zicokolter.com", "dblp": "274/2362;;;319/5188;215/4447;;245/2547;;180/5699;38/2612;182/2504;67/2526", "google_scholar": ";fVRQn4wAAAAJ;2XmBzbcAAAAJ;iUGazLcAAAAJ;;;MzKvJhAAAAAJ;;LoT0z6oAAAAJ;https://scholar.google.com.tw/citations?user=tMYCvLAAAAAJ;;UXh1I6UAAAAJ", "orcid": ";;;;;;;;0000-0002-7946-7046;;;", "linkedin": "andy-zou-09ba3616a/;long-phan-3110/;nli0/;chan-jun-shern/;;abogara/;xksteven/;jonathan-ng-7061a3162/;scott-emmons-5258005b/;;;", "or_profile": "~Andy_Zou1;~Long_Phan1;~Nathaniel_Li1;~Jun_Shern_Chan1;~Mantas_Mazeika3;~Aidan_O'Gara1;~Steven_Basart1;~Jonathan_Ng1;~Scott_Emmons1;~Matt_Fredrikson1;~Dan_Hendrycks1;~Zico_Kolter1", "aff": "Carnegie Mellon University;Center for AI Safety;University of California, Berkeley;OpenAI;University of Illinois, Urbana-Champaign;;Center for AI Safety ;;University of California, Berkeley;Carnegie Mellon University;Center for AI Safety;Carnegie Mellon University", "aff_domain": "andrew.cmu.edu;safe.ai;berkeley.edu;openai.com;uiuc.edu;;safe.ai;;berkeley.edu;cmu.edu;safe.ai;cmu.edu", "position": "PhD student;Research Engineer;Undergrad student;Researcher;PhD student;;Researcher;;PhD student;Associate Professor;Executive and Research Director;Full Professor", "bibtex": "@misc{\nzou2024robustness,\ntitle={Robustness Evaluation of Proxy Models against Adversarial Optimization},\nauthor={Andy Zou and Long Phan and Nathaniel Li and Jun Shern Chan and Mantas Mazeika and Aidan O'Gara and Steven Basart and Jonathan Ng and Scott Emmons and J Zico Kolter and Matt Fredrikson and Dan Hendrycks},\nyear={2024},\nurl={https://openreview.net/forum?id=4N7v4w2r3b}\n}", "github": "", "project": "", "reviewers": "8v7i;2dFK;k5g4;tXHZ", "site": "https://openreview.net/forum?id=4N7v4w2r3b", "pdf_size": 3685608, "rating": "5;5;5;6", "confidence": "3;3;3;3", "soundness": "3;2;3;3", "contribution": "2;2;3;4", "presentation": "2;2;2;3", "wc_summary": "100;77;57;69", 
"wc_strengths": "82;42;52;140", "wc_weaknesses": "251;422;139;196", "wc_questions": "18;6;158;13", "wc_review": "451;547;406;418", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "832;735;422;560", "reply_reviewers": "0;0;0;0", "reply_authors": "2;1;1;1", "rating_avg": [ 5.25, 0.4330127018922193 ], "confidence_avg": [ 3.0, 0.0 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.82915619758885 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 75.75, 15.706288549495072 ], "wc_strengths_avg": [ 79.0, 38.17066936798463 ], "wc_weaknesses_avg": [ 252.0, 105.83713903918606 ], "wc_questions_avg": [ 48.75, 63.21936016759423 ], "wc_review_avg": [ 455.5, 55.33760023709015 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 637.25, 157.94203841916186 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 12, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:er6z2Sned7cJ:scholar.google.com/&scioq=Robustness+Evaluation+of+Proxy+Models+against+Adversarial+Optimization&hl=en&as_sdt=0,44", "gs_version_total": 0, "aff_unique_index": "0;1;2;3;4;1;2;0;1;0", "aff_unique_norm": "Carnegie Mellon University;Center for AI Safety;University of California, Berkeley;OpenAI;University of Illinois", "aff_unique_dep": ";;;;", "aff_unique_url": "https://www.cmu.edu;https://www.centerforaisafety.org;https://www.berkeley.edu;https://openai.com;https://illinois.edu", "aff_unique_abbr": "CMU;;UC Berkeley;OpenAI;UIUC", "aff_campus_unique_index": "1;2;1", "aff_campus_unique": ";Berkeley;Urbana-Champaign", "aff_country_unique_index": "0;0;0;0;0;0;0;0;0;0", "aff_country_unique": "United States" }, { "title": "Weakly-supervised Audio Separation via Bi-modal Semantic Similarity", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19468", "id": "4N97bz1sP6", "author_site": "Tanvir Mahmud, Saeed Amizadeh, Kazuhito Koishida, Diana Marculescu", "tldr": "", "abstract": "Conditional sound separation in multi-source audio mixtures without having access to single source sound data during training is a long standing challenge. Existing mix-and-separate based methods suffer from significant performance drop with multi-source training mixtures due to the lack of supervision signal for single source separation cases during training. However, in the case of language-conditional audio separation, we do have access to corresponding text descriptions for each audio mixture in our training data, which can be seen as (rough) representations of the audio samples in the language modality. That raises the curious question of how to generate supervision signal for single-source audio extraction by leveraging the fact that single-source sounding language entities can be easily extracted from the text description. To this end, in this paper, we propose a generic bi-modal separation framework which can enhance the existing unsupervised frameworks to separate single-source signals in a target modality (i.e., audio) using the easily separable corresponding signals in the conditioning modality (i.e., language), without having access to single-source samples in the target modality during training. We empirically show that this is well within reach if we have access to a pretrained joint embedding model between the two modalities (i.e., CLAP). 
Furthermore, we propose to incorporate our framework into two fundamental scenarios to enhance separation performance. First, we show that our proposed methodology significantly improves the performance of purely unsupervised baselines by reducing the distribution shift between training and test samples. In particular, we show that our framework can achieve 71% boost in terms of Signal-to-Distortion Ratio (SDR) over the baseline, reaching 97.5% of the supervised learning performance. Second, we show that we can further improve the performance of the supervised learning itself by 17% if we augment it by our proposed weakly-supervised framework. Our framework achieves this by making large corpora of unsupervised data available to the supervised learning model as well as utilizing a natural, robust regularization mechanism through weak supervision from the language modality, and hence enabling a powerful semi-supervised framework for audio separation. Code is released at https://github.com/microsoft/BiModalAudioSeparation.", "keywords": "Audio-language learning;conditional audio separation;unsupervised learning;weakly supervised learning;semi-supervised learning", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/0bae6ad825e485b1284a1ff933e7b68d7a019c79.pdf", "author": "Tanvir Mahmud;Saeed Amizadeh;Kazuhito Koishida;Diana Marculescu", "authorids": "~Tanvir_Mahmud1;~Saeed_Amizadeh1;~Kazuhito_Koishida1;~Diana_Marculescu4", "gender": ";M;;", "homepage": "https://sites.google.com/view/tanvirmahmud;;https://asgweb-production.azurewebsites.net/applied-sciences/people/kazuhito-koishida;", "dblp": "255/3041;48/8399;;", "google_scholar": "4aZPxRsAAAAJ;eDn7hQUAAAAJ;;", "orcid": ";;;", "linkedin": ";saeed-amizadeh/;;", "or_profile": "~Tanvir_Mahmud1;~Saeed_Amizadeh1;~Kazuhito_Koishida1;~Diana_Marculescu4", "aff": "University of Texas at Austin;Microsoft;Microsoft Corporation;", "aff_domain": "utexas.edu;microsoft.com;microsoft.com;", "position": "PhD student;Researcher;Researcher;", "bibtex": "@inproceedings{\nmahmud2024weaklysupervised,\ntitle={Weakly-supervised Audio Separation via Bi-modal Semantic Similarity},\nauthor={Tanvir Mahmud and Saeed Amizadeh and Kazuhito Koishida and Diana Marculescu},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=4N97bz1sP6}\n}", "github": "", "project": "", "reviewers": "SLiU;ScdR;fPmw", "pdf_size": 11227543, "rating": "6;6;8", "confidence": "5;4;3", "soundness": "2;2;3", "contribution": "3;2;3", "presentation": "3;3;3", "wc_summary": "185;92;133", "wc_strengths": "134;78;60", "wc_weaknesses": "649;256;21", "wc_questions": "31;17;77", "wc_review": "999;443;291", "wc_reply_reviewers": "40;14;19", "wc_reply_authors": "867;768;729", "reply_reviewers": "1;1;1", "reply_authors": "3;2;2", "rating_avg": [ 6.666666666666667, 0.9428090415820634 ], "confidence_avg": [ 4.0, 0.816496580927726 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 136.66666666666666, 38.055515004033545 ], "wc_strengths_avg": [ 90.66666666666667, 31.510139461590594 ], "wc_weaknesses_avg": [ 308.6666666666667, 259.0705609588931 ], "wc_questions_avg": [ 41.666666666666664, 25.62984371565478 ], "wc_review_avg": [ 577.6666666666666, 304.3214674576139 ], "wc_reply_reviewers_avg": [ 24.333333333333332, 
11.264496832477201 ], "wc_reply_authors_avg": [ 788.0, 58.08614292583042 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 2.3333333333333335, 0.4714045207910317 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.8660254037844385, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10153359908957697598&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=4N97bz1sP6", "pdf": "https://openreview.net/pdf?id=4N97bz1sP6", "email": "utexas.edu;microsoft.com;microsoft.com;", "author_num": 4, "aff_unique_index": "0;1;1", "aff_unique_norm": "University of Texas at Austin;Microsoft", "aff_unique_dep": ";Microsoft Corporation", "aff_unique_url": "https://www.utexas.edu;https://www.microsoft.com", "aff_unique_abbr": "UT Austin;Microsoft", "aff_campus_unique_index": "0", "aff_campus_unique": "Austin;", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "title": "DAM: Towards a Foundation Model for Forecasting", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19467", "id": "4NhMhElWqP", "author_site": "Luke Darlow, Qiwen Deng, Ahmed Hassan, Martin Asenov, Rajkarn Singh, Artjom Joosen, Adam Barker, Amos Storkey", "tldr": "", "abstract": "It is challenging to scale time series forecasting models such that they forecast accurately for multiple distinct domains and datasets, all with potentially different underlying collection procedures (e.g., sample resolution), patterns (e.g., periodicity), and prediction requirements (e.g., reconstruction vs. forecasting). We call this general task universal forecasting. Existing methods usually assume that input data is regularly sampled, and they forecast to pre-determined horizons, resulting in failure to generalise outside of the scope of their training. We propose the DAM -- a neural model that takes randomly sampled histories and outputs an adjustable basis composition as a continuous function of time for forecasting to non-fixed horizons. It involves three key components: (1) a flexible approach for using randomly sampled histories from a long-tail distribution, that enables an efficient global perspective of the underlying temporal dynamics while retaining focus on the recent history; (2) a transformer backbone that is trained on these actively sampled histories to produce, as representational output, (3) the basis coefficients of a continuous function of time. We show that a single univariate DAM, trained on 25 time series datasets, either outperformed or closely matched existing SoTA models at multivariate long-term forecasting across 18 datasets, including 8 held-out for zero-shot transfer, even though these models were trained to specialise for each dataset-horizon combination. 
This single DAM excels at zero-shot transfer and very-long-term forecasting, performs well at imputation, is interpretable via basis function composition and attention, can be tuned for different inference-cost requirements, is robust to missing and irregularly sampled data by design.", "keywords": "Forecasting;time series;foundation model;transfer learning;imputation", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/b7f533f90084341c1ba61614bba4570106a95509.zip", "author": "Luke Nicholas Darlow;Qiwen Deng;Ahmed Hassan;Martin Asenov;Rajkarn Singh;Artjom Joosen;Adam Barker;Amos Storkey", "authorids": "~Luke_Nicholas_Darlow1;~Qiwen_Deng1;~Ahmed_Hassan7;~Martin_Asenov1;~Rajkarn_Singh1;~Artjom_Joosen1;~Adam_Barker1;~Amos_Storkey1", "gender": ";M;M;M;M;M;M;Not Specified", "homepage": ";;;https://masenov.com/;;https://www.linkedin.com/in/artjom-joosen-9774381b4;;http://homepages.inf.ed.ac.uk/amos/", "dblp": ";;;;149/5226;;24/1959;", "google_scholar": ";https://scholar.google.com/citations?hl=en;;zFULG8IAAAAJ;8IlCysUAAAAJ;2jepixkAAAAJ;;", "orcid": ";;;;;;;", "linkedin": ";https://www.linkedin.com/me?trk=p_mwlite_feed_updates-secondary_nav;ahmed-hassan-9399a8291/;;rajkarn/;;;", "or_profile": "~Luke_Nicholas_Darlow1;~Qiwen_Deng1;~Ahmed_Hassan7;~Martin_Asenov1;~Rajkarn_Singh1;~Artjom_Joosen1;~Adam_Barker1;~Amos_Storkey1", "aff": ";Huawei Technologies Ltd.;Huawei Technologies Ltd.;Huawei Technologies Ltd.;Huawei Technologies Research, UK.;Huawei Technologies Ltd.;University of St Andrews;University of Edinburgh", "aff_domain": ";huawei.com;huawei.com;huawei.com;huawei.com;huawei.com;st-andrews.ac.uk;ed.ac.uk", "position": ";Researcher;Researcher;Researcher;Researcher;Researcher;Full Professor;Full Professor", "bibtex": "@inproceedings{\ndarlow2024dam,\ntitle={{DAM}: Towards a Foundation Model for Forecasting},\nauthor={Luke Nicholas Darlow and Qiwen Deng and Ahmed Hassan and Martin Asenov and Rajkarn Singh and Artjom Joosen and Adam Barker and Amos Storkey},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=4NhMhElWqP}\n}", "github": "", "project": "", "reviewers": "sH5F;wavr;PhNp;yXbk", "pdf_size": 7798906, "rating": "6;6;8;8", "confidence": "4;4;5;4", "soundness": "3;3;3;3", "contribution": "2;3;4;3", "presentation": "3;2;3;3", "wc_summary": "82;97;224;178", "wc_strengths": "52;73;44;71", "wc_weaknesses": "49;355;200;96", "wc_questions": "13;120;120;61", "wc_review": "196;645;588;406", "wc_reply_reviewers": "0;247;596;0", "wc_reply_authors": "869;1915;3134;1328", "reply_reviewers": "0;2;4;0", "reply_authors": "2;6;6;4", "rating_avg": [ 7.0, 1.0 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 3.0, 0.7071067811865476 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 145.25, 58.31541391433315 ], "wc_strengths_avg": [ 60.0, 12.349089035228468 ], "wc_weaknesses_avg": [ 175.0, 117.4116689260484 ], "wc_questions_avg": [ 78.5, 44.83581157958446 ], "wc_review_avg": [ 458.75, 175.50979317405626 ], "wc_reply_reviewers_avg": [ 210.75, 244.2144293443776 ], "wc_reply_authors_avg": [ 1811.5, 848.7928192438953 ], "reply_reviewers_avg": [ 1.5, 1.6583123951777 ], "reply_authors_avg": [ 4.5, 1.6583123951777 ], "replies_avg": [ 34, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": 0.5773502691896257, "gs_citation": -1, "gs_cited_by_link": "", "gs_version_total": 
-1, "openreview": "https://openreview.net/forum?id=4NhMhElWqP", "pdf": "https://openreview.net/pdf?id=4NhMhElWqP", "email": ";huawei.com;huawei.com;huawei.com;huawei.com;huawei.com;st-andrews.ac.uk;ed.ac.uk", "author_num": 8, "aff_unique_index": "0;0;0;0;0;1;2", "aff_unique_norm": "Huawei;University of St Andrews;University of Edinburgh", "aff_unique_dep": "Huawei Technologies;;", "aff_unique_url": "https://www.huawei.com;https://www.st-andrews.ac.uk;https://www.ed.ac.uk", "aff_unique_abbr": "Huawei;St Andrews;Edinburgh", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;1;0;1;1", "aff_country_unique": "China;United Kingdom" }, { "id": "4P76wCt9N5", "title": "DAG-based Generative Regression", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Standard regression models address associations between targeted dependent variables and selected independent variables. This paper generalizes this by proposing DAG-based generative regression as a generative process in which the model learns the data generation mechanism from real data. DAG is explicitly involved in the generative process by using structural equation models to capture the data generation mechanisms among the data variables. We learn DAG by reconstructing the model to replicate the real data distribution. We have conducted experiments to measure the performance of our algorithm to show that the results outperform the state-of-the-art by a significantly large margin.", "keywords": "Generative regression modeling;DAG-learning;Generative adversarial learning;Causal discovery;Additive noise model", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Hristo Petkov;Feng Dong;Calum Robert MacLellan", "authorids": "~Hristo_Petkov1;~Feng_Dong2;~Calum_Robert_MacLellan1", "gender": "M;M;M", "homepage": "https://www.linkedin.com/in/hristo-petkov-628007215;https://www.strath.ac.uk/staff/dongfengprofessor/;", "dblp": ";;", "google_scholar": ";;", "orcid": ";;0000-0002-5262-8532", "linkedin": "hristo-petkov-628007215;;", "or_profile": "~Hristo_Petkov1;~Feng_Dong2;~Calum_Robert_MacLellan1", "aff": "University of Strathclyde;University of Strathclyde;", "aff_domain": "strath.ac.uk;strath.ac.uk;", "position": "PhD student;Full Professor;", "bibtex": "@misc{\npetkov2024dagbased,\ntitle={{DAG}-based Generative Regression},\nauthor={Hristo Petkov and Feng Dong and Calum Robert MacLellan},\nyear={2024},\nurl={https://openreview.net/forum?id=4P76wCt9N5}\n}", "github": "", "project": "", "reviewers": "ay5v;XSCR;F2tX;K8HK;sCo4", "site": "https://openreview.net/forum?id=4P76wCt9N5", "pdf_size": 897466, "rating": "3;3;3;3;3", "confidence": "3;5;3;4;4", "soundness": "3;2;2;1;2", "contribution": "2;1;2;1;2", "presentation": "2;3;2;1;2", "wc_summary": "71;45;37;87;39", "wc_strengths": "36;17;24;8;50", "wc_weaknesses": "89;67;29;755;43", "wc_questions": "134;11;41;2;38", "wc_review": "330;140;131;852;170", "wc_reply_reviewers": "0;0;0;0;0", "wc_reply_authors": "0;0;0;0;0", "reply_reviewers": "0;0;0;0;0", "reply_authors": "0;0;0;0;0", "rating_avg": [ 3.0, 0.0 ], "confidence_avg": [ 3.8, 0.7483314773547882 ], "soundness_avg": [ 2.0, 0.6324555320336759 ], "contribution_avg": [ 1.6, 0.4898979485566356 ], "presentation_avg": [ 2.0, 0.6324555320336759 ], "wc_summary_avg": [ 55.8, 19.78282083020518 ], "wc_strengths_avg": [ 27.0, 14.696938456699069 ], "wc_weaknesses_avg": [ 196.6, 279.95256741098126 ], "wc_questions_avg": [ 45.2, 46.88453902940712 ], 
"wc_review_avg": [ 324.6, 273.36393324650567 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:0L4cYs1e3LEJ:scholar.google.com/&scioq=DAG-based+Generative+Regression&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "University of Strathclyde", "aff_unique_dep": "", "aff_unique_url": "https://www.strath.ac.uk", "aff_unique_abbr": "Strathclyde", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "United Kingdom" }, { "id": "4P8itxA1oA", "title": "Set Features for Anomaly Detection", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "This paper proposes set features for detecting anomalies in samples that consist of unusual combinations of normal elements. Most methods, discover anomalies by detecting an unusual part of a sample. For example, state-of-the-art segmentation-based approaches, first classify each element of the sample (e.g., image patch) as normal or anomalous and then classify the entire sample as anomalous if it contains anomalous elements. However, such approaches do not extend well to scenarios where the anomalies are expressed by an unusual combination of normal elements. In this paper, we overcome this limitation by proposing set features that model each sample by the distribution of its elements. We compute the anomaly score of each sample using a simple density estimation method. Our simple-to-implement approach outperforms the state-of-the-art in image-level logical anomaly detection (+5.2%) and sequence-level time series anomaly detection (+2.4%).", "keywords": "Anomaly Detection;Logical Anomaly Detection;Set Anomaly Detection;Time-Series", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/dfcb40befec813ee2d6d02482222c8b5e0948ba3.zip", "author": "Niv Cohen;Issar Tzachor;Yedid Hoshen", "authorids": "~Niv_Cohen1;~Issar_Tzachor1;~Yedid_Hoshen3", "gender": "M;;M", "homepage": "https://www.cs.huji.ac.il/w~nivc/;;https://www.cs.huji.ac.il/~ydidh/", "dblp": "259/2291;;136/0280", "google_scholar": "https://scholar.google.co.il/citations?user=ZMdC3OQAAAAJ;;https://scholar.google.co.il/citations?user=6y1-qS4AAAAJ", "orcid": ";;", "linkedin": "niv-cohen-39b49521/;;", "or_profile": "~Niv_Cohen1;~Issar_Tzachor1;~Yedid_Hoshen3", "aff": "Hebrew University of Jerusalem;;Google", "aff_domain": "huji.ac.il;;google.com", "position": "PhD student;;Researcher", "bibtex": "@misc{\ncohen2024set,\ntitle={Set Features for Anomaly Detection},\nauthor={Niv Cohen and Issar Tzachor and Yedid Hoshen},\nyear={2024},\nurl={https://openreview.net/forum?id=4P8itxA1oA}\n}", "github": "", "project": "", "reviewers": "JUmH;if8q;Eqh9;Najr", "site": "https://openreview.net/forum?id=4P8itxA1oA", "pdf_size": 3383639, "rating": "3;3;5;5", "confidence": "5;5;4;5", "soundness": "2;1;3;2", "contribution": "2;2;2;2", "presentation": "3;3;2;1", "wc_summary": "53;58;76;49", "wc_strengths": "19;47;9;43", "wc_weaknesses": "206;261;210;196", "wc_questions": "8;23;81;57", "wc_review": "286;389;376;345", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "138;277;200;68", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 4.0, 1.0 ], 
"confidence_avg": [ 4.75, 0.4330127018922193 ], "soundness_avg": [ 2.0, 0.7071067811865476 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.25, 0.82915619758885 ], "wc_summary_avg": [ 59.0, 10.319883720275147 ], "wc_strengths_avg": [ 29.5, 15.960889699512368 ], "wc_weaknesses_avg": [ 218.25, 25.202926417382564 ], "wc_questions_avg": [ 42.25, 28.560243346302215 ], "wc_review_avg": [ 349.0, 39.73034105063786 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 170.75, 77.09531438420885 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 9, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=817268210022908330&as_sdt=5,47&sciodt=0,47&hl=en", "gs_version_total": 4, "aff_unique_index": "0;1", "aff_unique_norm": "Hebrew University of Jerusalem;Google", "aff_unique_dep": ";Google", "aff_unique_url": "https://www.huji.ac.il;https://www.google.com", "aff_unique_abbr": "HUJI;Google", "aff_campus_unique_index": "0;1", "aff_campus_unique": "Jerusalem;Mountain View", "aff_country_unique_index": "0;1", "aff_country_unique": "Israel;United States" }, { "id": "4PzxLPEGRn", "title": "OCAtari: Object-Centric Atari 2600 Reinforcement Learning Environments", "track": "main", "status": "Reject", "tldr": "", "abstract": "Cognitive science and psychology suggest that object-centric representations of complex scenes are a promising step towards enabling efficient abstract reasoning from low-level perceptual features. Yet, most deep reinforcement learning approaches rely on only pixel-based representations that do not capture the compositional properties of natural scenes. For this, we need environments and datasets that allow us to work and evaluate object-centric approaches. We present OCAtari, a set of environment that provides object-centric state representations of Atari games, the most-used evaluation framework for deep RL approaches. OCAtari also allows for RAM state manipulations of the games to change and create specific or even novel situations. 
Our source code is available at\nhttps://anonymous.4open.science/r/OCAtari-52B9 .", "keywords": "Object Centric;Reinforcement Learning;Framework;Environments;Object Detection;Object Discovery", "primary_area": "datasets and benchmarks", "supplementary_material": "", "author": "Quentin Delfosse;Jannis Bl\u00fcml;Bjarne Gregori;Sebastian Sztwiertnia;Kristian Kersting", "authorids": "~Quentin_Delfosse1;~Jannis_Bl\u00fcml1;~Bjarne_Gregori1;~Sebastian_Sztwiertnia1;~Kristian_Kersting1", "gender": "M;M;M;;M", "homepage": "https://quentindelfosse.me/;;https://github.com/BJenrajb;;http://www.ml.informatik.tu-darmstadt.de/", "dblp": "286/1466.html;;;297/9076.html;40/3793", "google_scholar": "k1E0FgIAAAAJ;;https://scholar.google.de/citations?hl=de;;QY-earAAAAAJ", "orcid": ";0000-0002-9400-0946;;;0000-0002-2873-9152", "linkedin": "quentin-delfosse-70b377150/;;;;", "or_profile": "~Quentin_Delfosse1;~Jannis_Bl\u00fcml1;~Bjarne_Gregori1;~Sebastian_Sztwiertnia1;~Kristian_Kersting1", "aff": "CS Department, TU Darmstadt, TU Darmstadt;Technische Universit\u00e4t Darmstadt;;Technische Universit\u00e4t Darmstadt;TU Darmstadt", "aff_domain": "cs.tu-darmstadt.de;tu-darmstadt.de;;tu-darmstadt.de;tu-darmstadt.de", "position": "PhD student;PhD student;;PhD student;Full Professor", "bibtex": "@misc{\ndelfosse2024ocatari,\ntitle={{OCA}tari: Object-Centric Atari 2600 Reinforcement Learning Environments},\nauthor={Quentin Delfosse and Jannis Bl{\\\"u}ml and Bjarne Gregori and Sebastian Sztwiertnia and Kristian Kersting},\nyear={2024},\nurl={https://openreview.net/forum?id=4PzxLPEGRn}\n}", "github": "", "project": "", "reviewers": "Lfyp;7uXz;BhyG;wGg4", "site": "https://openreview.net/forum?id=4PzxLPEGRn", "pdf_size": 1000480, "rating": "3;5;5;5", "confidence": "4;4;4;4", "soundness": "3;3;3;3", "contribution": "2;2;2;2", "presentation": "2;3;3;3", "wc_summary": "82;138;81;66", "wc_strengths": "102;45;23;69", "wc_weaknesses": "118;174;21;305", "wc_questions": "216;120;279;39", "wc_review": "518;477;404;479", "wc_reply_reviewers": "0;89;0;190", "wc_reply_authors": "961;479;349;553", "reply_reviewers": "0;1;0;1", "reply_authors": "2;1;1;1", "rating_avg": [ 4.5, 0.8660254037844386 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 91.75, 27.444261695297982 ], "wc_strengths_avg": [ 59.75, 29.32042803234632 ], "wc_weaknesses_avg": [ 154.5, 102.69493658404001 ], "wc_questions_avg": [ 163.5, 91.5 ], "wc_review_avg": [ 469.5, 41.19769411022904 ], "wc_reply_reviewers_avg": [ 69.75, 78.35934851694468 ], "wc_reply_authors_avg": [ 585.5, 228.76352419037437 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 15, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=959748260740375104&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "Technische Universit\u00e4t Darmstadt", "aff_unique_dep": "Computer Science Department", "aff_unique_url": "https://www.tu-darmstadt.de", "aff_unique_abbr": "TU Darmstadt", "aff_campus_unique_index": "1", "aff_campus_unique": ";Darmstadt", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "Germany" }, { "id": "4QaKdsh15T", "title": "An Embodied Generalist Agent in 3D World", "track": "main", "status": "Reject", "tldr": "", "abstract": "Leveraging massive knowledge and learning 
schemes from large language models (LLMs), recent machine learning models show notable successes in building generalist agents that exhibit the capability of general-purpose task solving in diverse domains, including natural language processing, computer vision, and robotics. However, a significant challenge remains as these models exhibit limited ability in understanding and interacting with the 3D world. We argue this limitation significantly hinders the current models from performing real-world tasks and further achieving general intelligence. To this end, we introduce an embodied multi-modal and multi-task generalist agent that excels in perceiving, grounding, reasoning, planning, and acting in the 3D world. Our proposed agent, referred to as LEO, is trained with shared LLM-based model architectures, objectives, and weights in two stages: (i) 3D vision-language alignment and (ii) 3D vision-language-action instruction tuning. To facilitate the training, we meticulously curate and generate an extensive dataset comprising object-level and scene-level multi-modal tasks with exceeding scale and complexity, necessitating a deep understanding of and interaction with the 3D world. Through rigorous experiments, we demonstrate LEO's remarkable proficiency across a wide spectrum of tasks, including 3D captioning, question answering, embodied reasoning, embodied navigation, and robotic manipulation. Our ablation results further provide valuable insights for the development of future embodied generalist agents.", "keywords": "embodied generalist agent;3D generalist agent;large language model;3D vision-language;vision-language-action;multi-modal instruction tuning", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/6bd0966288935d52a57036c358525c3de089d392.zip", "author": "Jiangyong Huang;Silong Yong;Xiaojian Ma;Xiongkun Linghu;Puhao Li;Yan Wang;Qing Li;Song-Chun Zhu;Baoxiong Jia;Siyuan Huang", "authorids": "~Jiangyong_Huang1;~Silong_Yong1;~Xiaojian_Ma1;~Xiongkun_Linghu1;~Puhao_Li1;~Yan_Wang30;~Qing_Li1;~Song-Chun_Zhu1;~Baoxiong_Jia1;~Siyuan_Huang2", "gender": ";M;;;M;M;M;M;M;M", "homepage": "https://huangjy-pku.github.io/;https://github.com/SilongYong;;;https://xiaoyao-li.github.io/;https://github.com/luckyWangYan;http://liqing-ustc.github.io/;https://zhusongchun.net/;https://buzz-beater.github.io/;https://siyuanhuang.com/", "dblp": "334/4572;;;;330/4121.html;;181/2689-3;10/10313;206/8738;62/885-1", "google_scholar": ";EitVAcwAAAAJ;;;https://scholar.google.at/citations?user=HTsO18AAAAAJ;;iwdFZBEAAAAJ;https://scholar.google.com.tw/citations?user=Al8dyb4AAAAJ;qIBUK6sAAAAJ;1NN7Ee8AAAAJ", "orcid": "0000-0001-9125-6893;;;0000-0002-4393-4386;0009-0003-2696-9346;;;;0000-0002-4968-3290;", "linkedin": ";;;;;;;;baoxiong-jia-2b6094122?trk=public_post-text;", "or_profile": "~Jiangyong_Huang1;~Silong_Yong1;~Xiaojian_Ma1;~Xiongkun_Linghu1;~Puhao_Li1;~Yan_Wang30;~Qing_Li1;~Song-Chun_Zhu1;~Baoxiong_Jia1;~Siyuan_Huang2", "aff": "Peking University;Carnegie Mellon University;;Beijing Institute for General Artificial Intelligence;Tsinghua University;;Beijing Institute for General Artificial Intelligence (BIGAI);Peking University;Beijing Institute for General Artificial Intelligence;Beijing Institute for General Artificial Intelligence", "aff_domain": "pku.edu.cn;andrew.cmu.edu;;bigai.ai;tsinghua.edu.cn;;bigai.ai;pku.edu.cn;bigai.ai;bigai.ai", "position": "PhD student;MS student;;Researcher;PhD student;;Researcher;Full Professor;Researcher;Researcher", "bibtex": 
"@misc{\nhuang2024an,\ntitle={An Embodied Generalist Agent in 3D World},\nauthor={Jiangyong Huang and Silong Yong and Xiaojian Ma and Xiongkun Linghu and Puhao Li and Yan Wang and Qing Li and Song-Chun Zhu and Baoxiong Jia and Siyuan Huang},\nyear={2024},\nurl={https://openreview.net/forum?id=4QaKdsh15T}\n}", "github": "", "project": "", "reviewers": "Vn42;bU9n;ADo8;foVx", "site": "https://openreview.net/forum?id=4QaKdsh15T", "pdf_size": 25507949, "rating": "3;5;5;8", "confidence": "4;3;4;4", "soundness": "2;2;2;4", "contribution": "2;3;2;4", "presentation": "2;4;2;4", "wc_summary": "97;120;103;40", "wc_strengths": "28;69;105;102", "wc_weaknesses": "395;249;646;51", "wc_questions": "174;100;96;18", "wc_review": "694;538;950;211", "wc_reply_reviewers": "690;0;0;0", "wc_reply_authors": "4894;1083;2839;580", "reply_reviewers": "3;0;0;0", "reply_authors": "9;3;6;1", "rating_avg": [ 5.25, 1.7853571071357126 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.8660254037844386 ], "contribution_avg": [ 2.75, 0.82915619758885 ], "presentation_avg": [ 3.0, 1.0 ], "wc_summary_avg": [ 90.0, 30.074906483645133 ], "wc_strengths_avg": [ 76.0, 31.10466202999158 ], "wc_weaknesses_avg": [ 335.25, 217.00964840301455 ], "wc_questions_avg": [ 97.0, 55.18151864528558 ], "wc_review_avg": [ 598.25, 267.6232192841271 ], "wc_reply_reviewers_avg": [ 172.5, 298.77876430563134 ], "wc_reply_authors_avg": [ 2349.0, 1691.8364282636783 ], "reply_reviewers_avg": [ 0.75, 1.299038105676658 ], "reply_authors_avg": [ 4.75, 3.031088913245535 ], "replies_avg": [ 29, 0 ], "authors#_avg": [ 10, 0 ], "corr_rating_confidence": 0.08084520834544431, "gs_citation": 143, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=8869821326961875122&as_sdt=5,34&sciodt=0,34&hl=en", "gs_version_total": 7, "aff_unique_index": "0;1;2;3;2;0;2;2", "aff_unique_norm": "Peking University;Carnegie Mellon University;Beijing Institute for General Artificial Intelligence;Tsinghua University", "aff_unique_dep": ";;;", "aff_unique_url": "http://www.pku.edu.cn;https://www.cmu.edu;http://www.bigaiai.org/;https://www.tsinghua.edu.cn", "aff_unique_abbr": "Peking U;CMU;BIGAI;THU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;0;0;0;0;0;0", "aff_country_unique": "China;United States" }, { "id": "4QtywskEyY", "title": "Teaching wiser, Learning smarter: Multi-stage Decoupled Relational Knowledge Distillation with Adaptive Stage Selection", "track": "main", "status": "Reject", "tldr": "", "abstract": "Due to the effectiveness of contrastive-learning-based knowledge distillation methods, there has been a renewed interest on relational knowledge distillation.\nHowever, these methods primarily rely on the transfer of angle-wise information between samples, using only the normalized penultimate layer's output as the knowledge base.\nOur experiments demonstrate that properly harnessing relational information derived from intermediate layers can further improve the effectiveness of distillation.\nMeanwhile, we found that simply adding distance-wise relational information to contrastive-learning-based methods negatively impacts distillation quality, revealing an implicit contention between angle-wise and distance-wise attributes.\nTherefore, we propose a ${\\bf{M}}$ulti-stage ${\\bf{D}}$ecoupled ${\\bf{R}}$elational (MDR) knowledge distillation framework equipped with an adaptive stage selection to identify the stages that maximize the efficacy of transferring the relational 
knowledge.\nFurthermore, our framework decouples angle-wise and distance-wise information to resolve their conflicts while still preserves complete relational knowledge, thereby resulting in an elevated transferring efficiency and distillation quality.\nTo evaluate the proposed method, we conduct extensive experiments on multiple image benchmarks ($\\textit{i.e.}$ CIFAR100, ImageNet and Pascal VOC), covering various tasks ($\\textit{i.e.}$ classification, few-shot learning, transfer learning and object detection). \nOur method exhibits superior performance under diverse scenarios, surpassing the state of the art by an average improvement of 1.08\\% on CIFAR-100 across extensively utilized teacher-student network pairs.", "keywords": "relation-based knowledge distillation;multi-stage;decouple;contrastive learning", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "JiaQi Wang;Lu Lu;Mingmin Chi;Jian Chen", "authorids": "~JiaQi_Wang7;~Lu_Lu7;~Mingmin_Chi2;~Jian_Chen12", "gender": ";M;F;M", "homepage": "https://github.com/NickiJQ;https://cn.aliyun.com;https://faculty.fudan.edu.cn/chimingmin/zh_CN/zdylm/644183/list/index.htm;http://lca.ece.utexas.edu/people/jchen", "dblp": ";;03/2079.html;", "google_scholar": ";;;", "orcid": ";0009-0008-6524-802X;0000-0003-2650-4146;", "linkedin": ";;;", "or_profile": "~JiaQi_Wang7;~Lu_Lu7;~Mingmin_Chi2;~Jian_Chen12", "aff": "Fudan University;Alibaba Group;Fudan University;Alibaba Group", "aff_domain": "fudan.edu.cn;alibaba-inc.com;fudan.edu.cn;alibaba-inc.com", "position": "MS student;Expert Software Engineer;Associate Professor;Researcher", "bibtex": "@misc{\nwang2024teaching,\ntitle={Teaching wiser, Learning smarter: Multi-stage Decoupled Relational Knowledge Distillation with Adaptive Stage Selection},\nauthor={JiaQi Wang and Lu Lu and Mingmin Chi and Jian Chen},\nyear={2024},\nurl={https://openreview.net/forum?id=4QtywskEyY}\n}", "github": "", "project": "", "reviewers": "zgd9;WUNU;qoFL;G2bH", "site": "https://openreview.net/forum?id=4QtywskEyY", "pdf_size": 4791349, "rating": "5;5;6;8", "confidence": "4;4;5;4", "soundness": "3;2;2;3", "contribution": "2;2;2;3", "presentation": "2;3;3;3", "wc_summary": "31;93;61;127", "wc_strengths": "79;45;14;55", "wc_weaknesses": "98;323;77;393", "wc_questions": "1;10;41;117", "wc_review": "209;471;193;692", "wc_reply_reviewers": "0;0;0;34", "wc_reply_authors": "495;638;382;434", "reply_reviewers": "0;0;0;1", "reply_authors": "1;1;1;1", "rating_avg": [ 6.0, 1.224744871391589 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 78.0, 35.79106033634656 ], "wc_strengths_avg": [ 48.25, 23.31710745354149 ], "wc_weaknesses_avg": [ 222.75, 137.69599667383218 ], "wc_questions_avg": [ 42.25, 45.63647116068463 ], "wc_review_avg": [ 391.25, 205.747873622062 ], "wc_reply_reviewers_avg": [ 8.5, 14.722431864335457 ], "wc_reply_authors_avg": [ 487.25, 95.7845890527281 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:TwaiuYAM8i4J:scholar.google.com/&scioq=Teaching+wiser,+Learning+smarter:+Multi-stage+Decoupled+Relational+Knowledge+Distillation+with+Adaptive+Stage+Selection&hl=en&as_sdt=0,44", 
"gs_version_total": 0, "aff_unique_index": "0;1;0;1", "aff_unique_norm": "Fudan University;Alibaba Group", "aff_unique_dep": ";", "aff_unique_url": "https://www.fudan.edu.cn;https://www.alibaba.com", "aff_unique_abbr": "Fudan;Alibaba", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "China" }, { "id": "4Qz9BT4mpM", "title": "Predicting the Performance of Foundation Models via Agreement-on-the-line", "track": "main", "status": "Reject", "tldr": "", "abstract": "Estimating out-of-distribution performance is critical to safely deploying machine learning models. Recently, Baek et al. showed that the phenomenon ``agreement-on-the-line'' can be a reliable method for predicting OOD accuracy of models in an ensemble consisting largely of CNNs trained from scratch. However, it is now increasingly common to lightly fine-tune foundation models, and it is unclear whether such fine-tuning is sufficient to produce enough diversity in models for such agreement-based methods to work properly. In this paper, we develop methods for reliably applying agreement-on-the-line-based performance estimation to fine-tuned foundation models. In particular, we first study the case of fine-tuning a single foundation model, where we extensively study how different types of randomness (linear head initialization, hyperparameter selection, data subsetting, and data shuffling) contribute to the agreement on the line of the resulting model sets; we find, somewhat surprisingly, that it is typically possible to obtain strong agreement via random initialization of the linear head alone. Next, we study how \\emph{multiple} foundation models, pretrained on different data sets but fine-tuned on the same task, may or may not produce agreement; we show, again rather surprisingly, that the diversity of such models is already sufficient and not too disparate for them to all lie on the same agreement lines. 
In total, these methods enable reliable and efficient estimation of OOD accuracy for fine-tuned foundation models, without leveraging any labeled OOD data.", "keywords": "robustness;OOD performance estimation;foundation model safety", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "Aman Mehra;Rahul Saxena;Taeyoun Kim;Christina Baek;J Zico Kolter;Aditi Raghunathan", "authorids": "~Aman_Mehra1;~Rahul_Saxena1;~Taeyoun_Kim1;~Christina_Baek2;~J_Zico_Kolter1;~Aditi_Raghunathan1", "gender": ";M;M;;F;M", "homepage": ";https://www.linkedin.com/in/rahul-saxena-cs/;https://danielkty.github.io;https://kebaek.github.io;https://www.cs.cmu.edu/~aditirag/;http://www.zicokolter.com", "dblp": ";;122/6365;202/7238;166/1409;67/2526", "google_scholar": ";;;;Ch9iRwQAAAAJ;UXh1I6UAAAAJ", "orcid": ";;;;;", "linkedin": "am-me/;;;;;", "or_profile": "~Aman_Mehra1;~Rahul_Saxena1;~Taeyoun_Kim1;~Christina_Baek2;~Aditi_Raghunathan1;~Zico_Kolter1", "aff": "Carnegie Mellon University;;School of Computer Science, Carnegie Mellon University;Carnegie Mellon University;Carnegie Mellon University;Carnegie Mellon University", "aff_domain": "andrew.cmu.edu;;cs.cmu.edu;cmu.edu;cmu.edu;cmu.edu", "position": "MS student;;MS student;PhD student;Assistant Professor;Full Professor", "bibtex": "@misc{\nmehra2024predicting,\ntitle={Predicting the Performance of Foundation Models via Agreement-on-the-line},\nauthor={Aman Mehra and Rahul Saxena and Taeyoun Kim and Christina Baek and J Zico Kolter and Aditi Raghunathan},\nyear={2024},\nurl={https://openreview.net/forum?id=4Qz9BT4mpM}\n}", "github": "", "project": "", "reviewers": "sUjj;47Ds;BrfQ;vvH6", "site": "https://openreview.net/forum?id=4Qz9BT4mpM", "pdf_size": 1808454, "rating": "5;6;6;6", "confidence": "4;3;4;3", "soundness": "3;3;3;2", "contribution": "3;2;3;3", "presentation": "3;3;3;3", "wc_summary": "166;306;100;97", "wc_strengths": "149;77;82;289", "wc_weaknesses": "409;226;207;439", "wc_questions": "95;106;32;152", "wc_review": "819;715;421;977", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "2126;1750;1818;2120", "reply_reviewers": "0;0;0;0", "reply_authors": "4;4;4;5", "rating_avg": [ 5.75, 0.4330127018922193 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 167.25, 84.721234056168 ], "wc_strengths_avg": [ 149.25, 85.54640553524152 ], "wc_weaknesses_avg": [ 320.25, 104.50687776409742 ], "wc_questions_avg": [ 96.25, 42.81573892857625 ], "wc_review_avg": [ 733.0, 202.85462775100794 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 1953.5, 171.209666783158 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 4.25, 0.4330127018922193 ], "replies_avg": [ 23, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 5, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5847648953960085500&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "aff_unique_index": "0;0;0;0;0", "aff_unique_norm": "Carnegie Mellon University", "aff_unique_dep": "", "aff_unique_url": "https://www.cmu.edu", "aff_unique_abbr": "CMU", "aff_campus_unique_index": "1", "aff_campus_unique": ";Pittsburgh", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "4SmhpF1nO4", "title": "Tabular Deep-SMOTE: A supervised autoencoder-based minority-oversampling technique for class-imbalanced tabular 
classification", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Class imbalance, present in many real-world tabular datasets, may cause machine-learning models to under-classify minority samples, which are often highly significant. This work proposes a new oversampling method called Tabular Deep-SMOTE (TD-SMOTE), which harnesses the class labels to improve synthetic sample generation via autoencoders. The method is based on oversampling in an alternative space shaped by a metric-learning loss. Such spaces tend to be more semantic and obtain higher class separation and density, which improves the quality of samples generated by linear interpolations over the observed minority samples. In addition, we propose a synthetic samples filtering scheme based on the decision boundary of a pre-trained tabular classifier to guarantee the quality of synthetic samples. Compared to common and leading oversampling methods, the method achieves improved classification performance in an extensive set of experiments that includes over 36 publicly available datasets.", "keywords": "supervised learning;tabular data;imbalanced datasets;classification;minority oversampling", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/2b92313bd939007a9d662a74245c38664934b7f8.zip", "author": "Daniel Lawton;Moshe Salhov;Ofir Lindenbaum;Amir Averbuch", "authorids": "~Daniel_Lawton1;~Moshe_Salhov1;~Ofir_Lindenbaum1;~Amir_Averbuch1", "gender": ";M;M;M", "homepage": ";;https://www.eng.biu.ac.il/lindeno/;http://www.cs.tau.ac.il/~amir1/", "dblp": ";;142/4140;", "google_scholar": ";oxtRoo8AAAAJ;https://scholar.google.co.il/citations?user=jXxk6gcAAAAJ;https://scholar.google.com.tw/citations?user=W5hdNOgAAAAJ", "orcid": ";;;0000-0002-3664-1489", "linkedin": ";;;", "or_profile": "~Daniel_Lawton1;~Moshe_Salhov1;~Ofir_Lindenbaum1;~Amir_Averbuch1", "aff": ";;Bar-Ilan University;Tel Aviv University", "aff_domain": ";;biu.ac.il;tau.ac.il", "position": ";;Assistant Professor;Full Professor", "bibtex": "@misc{\nlawton2024tabular,\ntitle={Tabular Deep-{SMOTE}: A supervised autoencoder-based minority-oversampling technique for class-imbalanced tabular classification},\nauthor={Daniel Lawton and Moshe Salhov and Ofir Lindenbaum and Amir Averbuch},\nyear={2024},\nurl={https://openreview.net/forum?id=4SmhpF1nO4}\n}", "github": "", "project": "", "reviewers": "KYqz;Uo1S;RWeJ;iTrN", "site": "https://openreview.net/forum?id=4SmhpF1nO4", "pdf_size": 2513016, "rating": "3;3;3;3", "confidence": "3;5;2;3", "soundness": "2;2;2;3", "contribution": "2;1;1;3", "presentation": "2;1;2;4", "wc_summary": "52;68;46;53", "wc_strengths": "19;7;10;47", "wc_weaknesses": "279;221;247;249", "wc_questions": "2;156;1;48", "wc_review": "352;452;304;397", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 3.0, 0.0 ], "confidence_avg": [ 3.25, 1.0897247358851685 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 1.75, 0.82915619758885 ], "presentation_avg": [ 2.25, 1.0897247358851685 ], "wc_summary_avg": [ 54.75, 8.104782538723663 ], "wc_strengths_avg": [ 20.75, 15.785673884886892 ], "wc_weaknesses_avg": [ 249.0, 20.54263858417414 ], "wc_questions_avg": [ 51.75, 63.1124987621311 ], "wc_review_avg": [ 376.25, 54.71916940159088 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], 
"authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:Js6F-3aYw4MJ:scholar.google.com/&scioq=Tabular+Deep-SMOTE:+A+supervised+autoencoder-based+minority-oversampling+technique+for+class-imbalanced+tabular+classification&hl=en&as_sdt=0,47", "gs_version_total": 0, "aff_unique_index": "0;1", "aff_unique_norm": "Bar-Ilan University;Tel Aviv University", "aff_unique_dep": ";", "aff_unique_url": "https://www.biu.ac.il;https://www.tau.ac.il", "aff_unique_abbr": "BIU;TAU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "Israel" }, { "id": "4SrzKsJocx", "title": "Simultaneous Dimensionality Reduction: A Data Efficient Approach for Multimodal Representations Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "Current experiments frequently produce high-dimensional, multimodal datasets\u2014such as those combining neural activity and animal behavior or gene expression and phenotypic profiling\u2014with the goal of extracting useful correlations between the modalities. Often, the first step in analyzing such datasets is dimensionality reduction. We explore two primary classes of approaches to dimensionality reduction: Independent Dimensionality Reduction (IDR) and Simultaneous Dimensionality Reduction (SDR). In IDR methods, of which Principal Components Analysis is a paradigmatic example, each modality is compressed independently, striving to retain as much variation within each modality as possible. In contrast, in SDR, one simultaneously compresses the modalities to maximize the covariation between the reduced descriptions while paying less attention to how much individual variation is preserved. Paradigmatic examples include Partial Least Squares and Canonical Correlations Analysis. Even though these dimensionality reduction methods are a staple of statistics, their relative accuracy and data set size requirements are poorly understood. We introduce a generative linear model to synthesize multimodal data with known variance and covariance structures to examine these questions. We assess the accuracy of the reconstruction of the covariance structures as a function of the number of samples, signal-to-noise ratio, and the number of varying and covarying signals in the data. Using numerical experiments, we demonstrate that SDR methods consistently outperform IDR methods and yield higher-quality, more succinct reduced-dimensional representations at smaller dataset sizes. Remarkably, regularized CCA can identify low-dimensional weak covarying structures even when the number of samples is much smaller than the dimensionality of the data, a challenge known to affect all dimensionality reduction methods. Our work corroborates and explains previous observations in the literature that SDR can be more effective in detecting covariation patterns in data. These findings suggest that SDR should be preferred to IDR in real-world data analysis when detecting covariation is more important than preserving variation.", "keywords": "Dimensionality reduction;Independent Dimensionality Reduction (IDR);Simultaneous Dimensionality Reduction (SDR);PCA;PLS;CCA;regularized CCA;Multimodal data analysis.", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Eslam Abdelaleem;Ahmed Roman;K. 
Michael Martini;Ilya Nemenman", "authorids": "~Eslam_Abdelaleem1;~Ahmed_Roman1;~K._Michael_Martini1;~Ilya_Nemenman1", "gender": ";M;M;Not Specified", "homepage": ";https://connects.catalyst.harvard.edu/Profiles/display/Person/210375;https://guava.physics.uiuc.edu/~martini/;https://physics.emory.edu/people/bios/nemenman-ilya.html", "dblp": ";;;83/5659.html", "google_scholar": ";vKAd0r4AAAAJ;ztH4760AAAAJ;https://scholar.google.com.tw/citations?user=enjXdH4AAAAJ", "orcid": "0009-0006-9429-3589;0000-0003-1845-9533;0000-0002-5946-1122;0000-0003-3024-4244", "linkedin": "eslamalaa/;ahmed-roman-2a8a7868/;;", "or_profile": "~Eslam_Abdelaleem1;~Ahmed_Roman1;~K._Michael_Martini1;~Ilya_Nemenman1", "aff": "Emory University;Harvard Medical School;Emory University;Emory University", "aff_domain": "emory.edu;hms.harvard.edu;emory.edu;emory.edu", "position": "PhD student;Postdoc;Postdoc;Full Professor", "bibtex": "@misc{\nabdelaleem2024simultaneous,\ntitle={Simultaneous Dimensionality Reduction: A Data Efficient Approach for Multimodal Representations Learning},\nauthor={Eslam Abdelaleem and Ahmed Roman and K. Michael Martini and Ilya Nemenman},\nyear={2024},\nurl={https://openreview.net/forum?id=4SrzKsJocx}\n}", "github": "", "project": "", "reviewers": "KsZw;7S2y;7ULi;di89;595z", "site": "https://openreview.net/forum?id=4SrzKsJocx", "pdf_size": 2253801, "rating": "3;3;3;5;5", "confidence": "4;4;4;2;4", "soundness": "2;2;3;3;3", "contribution": "2;1;1;2;2", "presentation": "2;3;3;3;3", "wc_summary": "49;78;19;73;93", "wc_strengths": "25;6;7;39;28", "wc_weaknesses": "89;262;150;127;61", "wc_questions": "395;13;9;4;177", "wc_review": "558;359;185;243;359", "wc_reply_reviewers": "0;288;48;0;45", "wc_reply_authors": "830;397;651;126;362", "reply_reviewers": "0;1;1;0;1", "reply_authors": "2;1;1;1;2", "rating_avg": [ 3.8, 0.9797958971132712 ], "confidence_avg": [ 3.6, 0.8 ], "soundness_avg": [ 2.6, 0.4898979485566356 ], "contribution_avg": [ 1.6, 0.4898979485566356 ], "presentation_avg": [ 2.8, 0.39999999999999997 ], "wc_summary_avg": [ 62.4, 25.904439773907484 ], "wc_strengths_avg": [ 21.0, 12.727922061357855 ], "wc_weaknesses_avg": [ 137.8, 69.23987290571813 ], "wc_questions_avg": [ 119.6, 152.38057619001182 ], "wc_review_avg": [ 340.8, 127.80985877466574 ], "wc_reply_reviewers_avg": [ 76.2, 107.92664175262752 ], "wc_reply_authors_avg": [ 473.2, 243.98311416981298 ], "reply_reviewers_avg": [ 0.6, 0.48989794855663565 ], "reply_authors_avg": [ 1.4, 0.4898979485566356 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.6123724356957946, "gs_citation": 4, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=13215423161228151904&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 5, "aff_unique_index": "0;1;0;0", "aff_unique_norm": "Emory University;Harvard University", "aff_unique_dep": ";Medical School", "aff_unique_url": "https://www.emory.edu;https://hms.harvard.edu", "aff_unique_abbr": "Emory;HMS", "aff_campus_unique_index": "1", "aff_campus_unique": ";Boston", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "title": "Rayleigh Quotient Graph Neural Networks for Graph-level Anomaly Detection", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19466", "id": "4UIBysXjVq", "author_site": "Xiangyu Dong, Xingyi Zhang, Sibo WANG", "tldr": "", "abstract": "Graph-level anomaly detection has gained significant attention as it finds applications in various domains, such as cancer diagnosis and enzyme prediction. 
However, existing methods fail to capture the spectral properties of graph anomalies, resulting in unexplainable framework design and unsatisfying performance. In this paper, we re-investigate the spectral differences between anomalous and normal graphs. Our main observation shows a significant disparity in the accumulated spectral energy between these two classes. Moreover, we prove that the accumulated spectral energy of the graph signal can be represented by its Rayleigh Quotient, indicating that the Rayleigh Quotient is a driving factor behind the anomalous properties of graphs. Motivated by this, we propose Rayleigh Quotient Graph Neural Network (RQGNN), the first spectral GNN that explores the inherent spectral features of anomalous graphs for graph-level anomaly detection. Specifically, we introduce a novel framework with two components: the Rayleigh Quotient learning component (RQL) and Chebyshev Wavelet GNN with RQ-pooling (CWGNN-RQ). RQL explicitly captures the Rayleigh Quotient of graphs and CWGNN-RQ implicitly explores the spectral space of graphs. Extensive experiments on 10 real-world datasets show that RQGNN outperforms the best rival by 6.74% in Macro-F1 score and 1.44% in AUC, demonstrating the effectiveness of our framework. Our code is available at https://github.com/xydong127/RQGNN.", "keywords": "Graph-level anomaly detection;Spectral GNN;Rayleigh Quotient", "primary_area": "learning on graphs and other geometries & topologies", "supplementary_material": "", "author": "Xiangyu Dong;Xingyi Zhang;Sibo Wang", "authorids": "~Xiangyu_Dong2;~Xingyi_Zhang1;~Sibo_Wang3", "gender": ";M;M", "homepage": "https://xydong127.github.io/;http://josiah96zhang.github.io/;https://www1.se.cuhk.edu.hk/~swang/", "dblp": "84/3152-2.html;93/1107-3;131/6529-1", "google_scholar": ";j_o_XDkAAAAJ;b2gLqsgAAAAJ", "orcid": "0009-0009-6312-8160;0000-0001-5203-5916;0000-0003-1892-6971", "linkedin": ";xingyi-zhang-769338204/;sibo-wang-b6a60941/?originalSubdomain=hk", "or_profile": "~Xiangyu_Dong2;~Xingyi_Zhang1;~Sibo_Wang3", "aff": "Chinese University of Hong Kong;The Chinese University of Hong Kong;The Chinese University of Hong Kong", "aff_domain": "cuhk.hk;cuhk.edu.hk;cuhk.edu.hk", "position": "PhD student;PhD student;Assistant Professor", "bibtex": "@inproceedings{\ndong2024rayleigh,\ntitle={Rayleigh Quotient Graph Neural Networks for Graph-level Anomaly Detection},\nauthor={Xiangyu Dong and Xingyi Zhang and Sibo Wang},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=4UIBysXjVq}\n}", "github": "", "project": "", "reviewers": "X1rz;oJCz;qWnD", "pdf_size": 622914, "rating": "6;6;6", "confidence": "4;4;4", "soundness": "2;3;2", "contribution": "2;3;2", "presentation": "2;3;3", "wc_summary": "105;54;96", "wc_strengths": "81;30;115", "wc_weaknesses": "253;194;174", "wc_questions": "41;29;145", "wc_review": "480;307;530", "wc_reply_reviewers": "295;0;0", "wc_reply_authors": "3861;1869;1718", "reply_reviewers": "3;0;0", "reply_authors": "7;4;4", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 85.0, 22.22611077089287 ], "wc_strengths_avg": [ 75.33333333333333, 34.93167935015754 ], "wc_weaknesses_avg": [ 207.0, 33.53605025441527 ], "wc_questions_avg": [ 71.66666666666667, 52.08539995899896 ], "wc_review_avg": 
[ 439.0, 95.54405615561161 ], "wc_reply_reviewers_avg": [ 98.33333333333333, 139.06433363335435 ], "wc_reply_authors_avg": [ 2482.6666666666665, 976.5764463448602 ], "reply_reviewers_avg": [ 1.0, 1.4142135623730951 ], "reply_authors_avg": [ 5.0, 1.4142135623730951 ], "replies_avg": [ 25, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 14, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12135700093364746008&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=4UIBysXjVq", "pdf": "https://openreview.net/pdf?id=4UIBysXjVq", "email": "cuhk.hk;cuhk.edu.hk;cuhk.edu.hk", "author_num": 3, "aff_unique_index": "0;0;0", "aff_unique_norm": "Chinese University of Hong Kong", "aff_unique_dep": "", "aff_unique_url": "https://www.cuhk.edu.hk", "aff_unique_abbr": "CUHK", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Hong Kong SAR", "aff_country_unique_index": "0;0;0", "aff_country_unique": "China" }, { "id": "4UP387Adir", "title": "Weakly Supervised Graph Contrastive Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "Graph Contrastive Learning (GCL) has recently gained popularity owing to its ability to learn efficient node representations in a self-supervised manner. These representations are typically used to train a downstream classifier. In several real-world datasets, it is difficult to acquire sufficient clean labels for classification and instead we have weak or noisy labels available. There is little known about the robustness of the node representations learnt by the current GCL methods in the presence of weak labels.\nMoreover, GCL has been successfully adapted to a supervised setting where class labels are used to contrast between pairs of nodes. \nCan weak labels similarly be leveraged to learn better node embeddings? In this paper, we first empirically study the robustness of current GCL node representations to weak supervision. Then, we introduce Weakly Supervised Graph Contrastive Learning, WSNet, a novel method that incorporates signals from weak labels for the contrastive learning objective. We evaluate WSNet on five benchmark graph datasets comparing its performance with state-of-the-art GCL and noisy-label learning methods. We show that WSNet outperforms all baselines particularly in the high noise setting. 
We conclude that although current GCL methods show great promise in the weak supervision paradigm, they are still limited in their capacity to deal with label noise and utilizing signals from weak labels is an effective way to improve their performance.", "keywords": "weak supervision;graph contrastive learning;noisy label learning;weakly supervised node classification", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Pratheeksha Nair;Reihaneh Rabbany", "authorids": "~Pratheeksha_Nair2;~Reihaneh_Rabbany1", "gender": "F;F", "homepage": "https://nair-p.github.io/;http://www.reirab.com/", "dblp": "233/1231;94/9024", "google_scholar": ";https://scholar.google.ca/citations?user=Foh_c-QAAAAJ", "orcid": ";", "linkedin": "pnair96/;", "or_profile": "~Pratheeksha_Nair2;~Reihaneh_Rabbany1", "aff": "McGill University;Montreal Institute for Learning Algorithms, University of Montreal, University of Montreal", "aff_domain": "mcgill.ca;mila.umontreal.ca", "position": "PhD student;Assistant Professor", "bibtex": "@misc{\nnair2024weakly,\ntitle={Weakly Supervised Graph Contrastive Learning},\nauthor={Pratheeksha Nair and Reihaneh Rabbany},\nyear={2024},\nurl={https://openreview.net/forum?id=4UP387Adir}\n}", "github": "", "project": "", "reviewers": "YxoE;oC5W;waBU;G4h6", "site": "https://openreview.net/forum?id=4UP387Adir", "pdf_size": 790235, "rating": "5;5;6;6", "confidence": "3;3;4;3", "soundness": "2;2;2;2", "contribution": "2;2;2;2", "presentation": "3;2;2;2", "wc_summary": "75;116;70;56", "wc_strengths": "45;39;72;23", "wc_weaknesses": "107;158;242;241", "wc_questions": "3;687;3;65", "wc_review": "230;1000;387;385", "wc_reply_reviewers": "128;22;282;18", "wc_reply_authors": "818;1504;939;1262", "reply_reviewers": "1;1;1;1", "reply_authors": "2;4;2;3", "rating_avg": [ 5.5, 0.5 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 79.25, 22.331312097590683 ], "wc_strengths_avg": [ 44.75, 17.66882848408462 ], "wc_weaknesses_avg": [ 187.0, 57.40644563113101 ], "wc_questions_avg": [ 189.5, 288.34484562759224 ], "wc_review_avg": [ 500.5, 295.33582579836127 ], "wc_reply_reviewers_avg": [ 112.5, 107.34407296166845 ], "wc_reply_authors_avg": [ 1130.75, 269.7789604472521 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 2.75, 0.82915619758885 ], "replies_avg": [ 24, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.5773502691896257, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:ER0Ktiwc88YJ:scholar.google.com/&scioq=Weakly+Supervised+Graph+Contrastive+Learning&hl=en&as_sdt=0,44", "gs_version_total": 0, "aff_unique_index": "0;1", "aff_unique_norm": "McGill University;University of Montreal", "aff_unique_dep": ";Montreal Institute for Learning Algorithms", "aff_unique_url": "https://www.mcgill.ca;https://www.umontreal.ca", "aff_unique_abbr": "McGill;UM", "aff_campus_unique_index": "1", "aff_campus_unique": ";Montreal", "aff_country_unique_index": "0;0", "aff_country_unique": "Canada" }, { "title": "Locality-Aware Graph Rewiring in GNNs", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19465", "id": "4Ua4hKiAJX", "author_site": "Federico Barbero, Ameya Velingker, Amin Saberi, Michael Bronstein, Francesco Di Giovanni", "tldr": "", "abstract": "Graph Neural Networks (GNNs) are popular models for 
machine learning on graphs that typically follow the message-passing paradigm, whereby the feature of a node is updated recursively upon aggregating information over its neighbors. While exchanging messages over the input graph endows GNNs with a strong inductive bias, it can also make GNNs susceptible to over-squashing, thereby preventing them from capturing long-range interactions in the given graph. To rectify this issue, graph rewiring techniques have been proposed as a means of improving information flow by altering the graph connectivity. In this work, we identify three desiderata for graph-rewiring: (i) reduce over-squashing, (ii) respect the locality of the graph, and \n(iii) preserve the sparsity of the graph. We highlight fundamental trade-offs that occur between spatial and spectral rewiring techniques; while the former often satisfy (i) and (ii) but not (iii), the latter generally satisfy (i) and (iii) at the expense of (ii). We propose a novel rewiring framework that satisfies all of (i)--(iii) through a locality-aware sequence of rewiring operations. We then discuss a specific instance of such rewiring framework and \nvalidate its effectiveness on several real-world benchmarks, showing that it either matches or significantly outperforms existing rewiring approaches.", "keywords": "Graph Neural Networks;Message Passing Neural Networks;Over-squashing;Graph Rewiring", "primary_area": "learning on graphs and other geometries & topologies", "supplementary_material": "/attachment/387291a37c07ba744d2e44457c8089aa6c05ad87.zip", "author": "Federico Barbero;Ameya Velingker;Amin Saberi;Michael M. Bronstein;Francesco Di Giovanni", "authorids": "~Federico_Barbero1;~Ameya_Velingker1;~Amin_Saberi1;~Michael_M._Bronstein1;~Francesco_Di_Giovanni1", "gender": ";M;;M;M", "homepage": "https://federicobarbero.com;http://www.ameyavelingker.com;https://www.stanford.edu/~saberi;http://www.inf.usi.ch/bronstein/;https://francescodgv.github.io/", "dblp": ";117/3666.html;28/4017;07/2668;", "google_scholar": "jpYtKMEAAAAJ;6dFFudUAAAAJ;;UU3N6-UAAAAJ;yzjjeqsAAAAJ", "orcid": ";;;;", "linkedin": ";ameya-velingker-5811b711;;mbronstein/;", "or_profile": "~Federico_Barbero1;~Ameya_Velingker1;~Amin_Saberi1;~Michael_M._Bronstein1;~Francesco_Di_Giovanni1", "aff": "University of Oxford;Google;Stanford University;University of Oxford;Valence Labs powered by recursion", "aff_domain": "ox.ac.uk;google.com;stanford.edu;ox.ac.uk;valencelabs.com", "position": "PhD student;Research Scientist;Full Professor;Full Professor;Researcher", "bibtex": "@inproceedings{\nbarbero2024localityaware,\ntitle={Locality-Aware Graph Rewiring in {GNN}s},\nauthor={Federico Barbero and Ameya Velingker and Amin Saberi and Michael M. 
Bronstein and Francesco Di Giovanni},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=4Ua4hKiAJX}\n}", "github": "", "project": "", "reviewers": "RVSP;KgxZ;EJ4V;XEwE", "pdf_size": 570762, "rating": "3;5;6;8", "confidence": "3;4;4;3", "soundness": "2;2;3;2", "contribution": "2;2;3;3", "presentation": "3;3;3;3", "wc_summary": "150;52;37;63", "wc_strengths": "16;134;62;46", "wc_weaknesses": "78;762;217;109", "wc_questions": "128;2;14;194", "wc_review": "372;950;330;412", "wc_reply_reviewers": "402;604;10;13", "wc_reply_authors": "1257;1706;760;439", "reply_reviewers": "2;3;1;1", "reply_authors": "3;5;2;1", "rating_avg": [ 5.5, 1.8027756377319946 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 75.5, 43.99147644714826 ], "wc_strengths_avg": [ 64.5, 43.39066719929529 ], "wc_weaknesses_avg": [ 291.5, 276.5 ], "wc_questions_avg": [ 84.5, 80.09213444527497 ], "wc_review_avg": [ 516.0, 252.24194734421155 ], "wc_reply_reviewers_avg": [ 257.25, 255.91929880335323 ], "wc_reply_authors_avg": [ 1040.5, 482.2460471585019 ], "reply_reviewers_avg": [ 1.75, 0.82915619758885 ], "reply_authors_avg": [ 2.75, 1.479019945774904 ], "replies_avg": [ 25, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 29, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14010768070887396527&as_sdt=80005&sciodt=0,11&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=4Ua4hKiAJX", "pdf": "https://openreview.net/pdf?id=4Ua4hKiAJX", "email": "ox.ac.uk;google.com;stanford.edu;ox.ac.uk;valencelabs.com", "author_num": 5, "aff_unique_index": "0;1;2;0;3", "aff_unique_norm": "University of Oxford;Google;Stanford University;Valence Labs", "aff_unique_dep": ";Google;;", "aff_unique_url": "https://www.ox.ac.uk;https://www.google.com;https://www.stanford.edu;", "aff_unique_abbr": "Oxford;Google;Stanford;", "aff_campus_unique_index": "1;2", "aff_campus_unique": ";Mountain View;Stanford", "aff_country_unique_index": "0;1;1;0", "aff_country_unique": "United Kingdom;United States;" }, { "title": "Coordinate-Aware Modulation for Neural Fields", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19464", "id": "4UiLqimGm5", "author_site": "Joo Chan Lee, Daniel Rho, Seungtae Nam, Jong Hwan Ko, Eunbyung Park", "tldr": "", "abstract": "Neural fields, mapping low-dimensional input coordinates to corresponding signals, have shown promising results in representing various signals. Numerous methodologies have been proposed, and techniques employing MLPs and grid representations have achieved substantial success. MLPs allow compact and high expressibility, yet often suffer from spectral bias and slow convergence speed. On the other hand, methods using grids are free from spectral bias and achieve fast training speed, however, at the expense of high spatial complexity. In this work, we propose a novel way for exploiting both MLPs and grid representations in neural fields. Unlike the prevalent methods that combine them sequentially (extract features from the grids first and feed them to the MLP), we inject spectral bias-free grid representations into the intermediate features in the MLP. 
More specifically, we suggest a Coordinate-Aware Modulation (CAM), which modulates the intermediate features using scale and shift parameters extracted from the grid representations. This can maintain the strengths of MLPs while mitigating any remaining potential biases, facilitating the rapid learning of high-frequency components. In addition, we empirically found that the feature normalizations, which have not been successful in neural filed literature, proved to be effective when applied in conjunction with the proposed CAM. Experimental results demonstrate that CAM enhances the performance of neural representation and improves learning stability across a range of signals. Especially in the novel view synthesis task, we achieved state-of-the-art performance with the least number of parameters and fast training speed for dynamic scenes and the best performance under 1MB memory for static scenes. CAM also outperforms the best-performing video compression methods using neural fields by a large margin. Our project page is available at https://maincold2.github.io/cam/.", "keywords": "Neural Fields;Neural Representation", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/406c3e16161fffc2b34f230764f866385cec0619.zip", "author": "Joo Chan Lee;Daniel Rho;Seungtae Nam;Jong Hwan Ko;Eunbyung Park", "authorids": "~Joo_Chan_Lee1;~Daniel_Rho1;~Seungtae_Nam1;~Jong_Hwan_Ko2;~Eunbyung_Park1", "gender": "M;M;M;;M", "homepage": ";;https://github.com/stnamjef;http://iris.skku.edu/;https://silverbottlep.github.io/", "dblp": "282/1951;311/4143;321/0019;168/6308;92/9727", "google_scholar": "WKCHKk8AAAAJ;nEC0wK4AAAAJ;8NKPmmwCmrAC;https://scholar.google.co.kr/citations?user=UN_OIs4AAAAJ;iPyuJmQAAAAJ", "orcid": ";;;0000-0003-4434-4318;", "linkedin": ";;;;eunbyung-park-286384b4/", "or_profile": "~Joo_Chan_Lee1;~Daniel_Rho1;~Seungtae_Nam1;~Jong_Hwan_Ko2;~Eunbyung_Park1", "aff": "Sungkyunkwan University;Korea Telecom Research;Sungkyunkwan University;Sungkyunkwan University;Sungkyunkwan University", "aff_domain": "skku.edu;kt.com;skku.edu;skku.edu;skku.edu", "position": "PhD student;Researcher;MS student;Associate Professor;Assistant Professor", "bibtex": "@inproceedings{\nlee2024coordinateaware,\ntitle={Coordinate-Aware Modulation for Neural Fields},\nauthor={Joo Chan Lee and Daniel Rho and Seungtae Nam and Jong Hwan Ko and Eunbyung Park},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=4UiLqimGm5}\n}", "github": "", "project": "", "reviewers": "kCkz;oV38;DCsj;7EJV", "pdf_size": 2840063, "rating": "6;6;8;8", "confidence": "2;3;4;1", "soundness": "3;3;3;4", "contribution": "3;3;3;4", "presentation": "3;4;3;4", "wc_summary": "71;113;156;45", "wc_strengths": "43;74;67;71", "wc_weaknesses": "20;220;313;64", "wc_questions": "13;2;109;4", "wc_review": "147;409;645;184", "wc_reply_reviewers": "33;0;72;0", "wc_reply_authors": "192;575;843;159", "reply_reviewers": "1;0;1;0", "reply_authors": "1;1;2;1", "rating_avg": [ 7.0, 1.0 ], "confidence_avg": [ 2.5, 1.118033988749895 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 3.25, 0.4330127018922193 ], "presentation_avg": [ 3.5, 0.5 ], "wc_summary_avg": [ 96.25, 42.174488734304774 ], "wc_strengths_avg": [ 63.75, 12.234684303242156 ], "wc_weaknesses_avg": [ 154.25, 117.99655715316443 ], "wc_questions_avg": [ 32.0, 44.64862819841165 ], "wc_review_avg": [ 346.25, 199.50861510220554 ], 
"wc_reply_reviewers_avg": [ 26.25, 29.65109610115619 ], "wc_reply_authors_avg": [ 442.25, 283.31905601282807 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 7, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5986837010442502038&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=4UiLqimGm5", "pdf": "https://openreview.net/pdf?id=4UiLqimGm5", "email": "skku.edu;kt.com;skku.edu;skku.edu;skku.edu", "author_num": 5, "aff_unique_index": "0;1;0;0;0", "aff_unique_norm": "Sungkyunkwan University;Korea Telecom", "aff_unique_dep": ";Research", "aff_unique_url": "https://www.skku.edu;https://www.kt.com", "aff_unique_abbr": "SKKU;KT", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "South Korea" }, { "title": "Towards Non-Asymptotic Convergence for Diffusion-Based Generative Models", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19463", "id": "4VGEeER6W9", "author_site": "Gen Li, Yuting Wei, Yuxin Chen, Yuejie Chi", "tldr": "", "abstract": "Diffusion models, which convert noise into new data instances by learning to reverse a Markov diffusion process, have become a cornerstone in contemporary generative modeling. While their practical power has now been widely recognized, the theoretical underpinnings remain far from mature. In this work, we develop a suite of non-asymptotic theory towards understanding the data generation process of diffusion models in discrete time, assuming access to $\\ell_2$-accurate estimates of the (Stein) score functions. For a popular deterministic sampler (based on the probability flow ODE), we establish a convergence rate proportional to $1/T$ (with $T$ the total number of steps), improving upon past results; for another mainstream stochastic sampler (i.e., a type of the denoising diffusion probabilistic model), we derive a convergence rate proportional to $1/\\sqrt{T}$, matching the state-of-the-art theory. Imposing only minimal assumptions on the target data distribution (e.g., no smoothness assumption is imposed), our results characterize how $\\ell_2$ score estimation errors affect the quality of the data generation process. 
In contrast to prior works, our theory is developed based on an elementary yet versatile non-asymptotic approach without resorting to toolboxes for SDEs and ODEs.", "keywords": "diffusion models;score-based generative modeling;non-asymptotic theory;reverse SDE;probability flow ODE;denoising diffusion probabilistic model", "primary_area": "learning theory", "supplementary_material": "", "author": "Gen Li;Yuting Wei;Yuxin Chen;Yuejie Chi", "authorids": "~Gen_Li2;~Yuting_Wei1;~Yuxin_Chen5;~Yuejie_Chi1", "gender": "M;F;M;", "homepage": ";https://yutingwei.github.io/;https://yuxinchen2020.github.io/;", "dblp": "28/538-5.html;184/3856;11/5123-2;", "google_scholar": "https://scholar.google.com/citations?view_op=list_works;fsbXdAYAAAAJ;RtNVud4AAAAJ;", "orcid": "0000-0002-3078-9191;;0000-0001-9256-5815;", "linkedin": ";;;", "or_profile": "~Gen_Li2;~Yuting_Wei1;~Yuxin_Chen5;~Yuejie_Chi1", "aff": "The Chinese University of Hong Kong;The Wharton School, University of Pennsylvania;University of Pennsylvania;", "aff_domain": "cuhk.edu.hk;wharton.upenn.edu;upenn.edu;", "position": "Assistant Professor;Assistant Professor;Associate Professor;", "bibtex": "@inproceedings{\nli2024towards,\ntitle={Towards Non-Asymptotic Convergence for Diffusion-Based Generative Models},\nauthor={Gen Li and Yuting Wei and Yuxin Chen and Yuejie Chi},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=4VGEeER6W9}\n}", "github": "", "project": "", "reviewers": "TgkF;nMDV;h2T8;ScYQ", "pdf_size": 308414, "rating": "6;8;8;8", "confidence": "3;2;4;5", "soundness": "4;3;3;4", "contribution": "3;3;2;4", "presentation": "3;3;2;3", "wc_summary": "133;155;116;81", "wc_strengths": "109;114;64;52", "wc_weaknesses": "56;182;137;128", "wc_questions": "123;142;60;3", "wc_review": "421;593;377;264", "wc_reply_reviewers": "24;74;73;0", "wc_reply_authors": "603;677;1134;468", "reply_reviewers": "1;1;1;0", "reply_authors": "2;2;3;1", "rating_avg": [ 7.5, 0.8660254037844386 ], "confidence_avg": [ 3.5, 1.118033988749895 ], "soundness_avg": [ 3.5, 0.5 ], "contribution_avg": [ 3.0, 0.7071067811865476 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 121.25, 27.040478915877213 ], "wc_strengths_avg": [ 84.75, 27.141987768032024 ], "wc_weaknesses_avg": [ 125.75, 45.168434774740646 ], "wc_questions_avg": [ 82.0, 54.78594710324902 ], "wc_review_avg": [ 413.75, 118.27800936776033 ], "wc_reply_reviewers_avg": [ 42.75, 31.901214710415026 ], "wc_reply_authors_avg": [ 720.5, 250.21840459886238 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 2.0, 0.7071067811865476 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.2581988897471611, "gs_citation": 31, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10749362722430110799&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=4VGEeER6W9", "pdf": "https://openreview.net/pdf?id=4VGEeER6W9", "email": "cuhk.edu.hk;wharton.upenn.edu;upenn.edu;", "author_num": 4, "aff_unique_index": "0;1;1", "aff_unique_norm": "Chinese University of Hong Kong;University of Pennsylvania", "aff_unique_dep": ";The Wharton School", "aff_unique_url": "https://www.cuhk.edu.hk;https://www.wharton.upenn.edu", "aff_unique_abbr": "CUHK;UPenn Wharton", "aff_campus_unique_index": "0", "aff_campus_unique": "Hong Kong SAR;", "aff_country_unique_index": "0;1;1", "aff_country_unique": "China;United States" }, { "title": "Stable 
Neural Stochastic Differential Equations in Analyzing Irregular Time Series Data", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19462", "id": "4VIgNuQ1pY", "author_site": "YongKyung Oh, Dongyoung Lim, Sungil Kim", "tldr": "", "abstract": "Irregular sampling intervals and missing values in real-world time series data present challenges for conventional methods that assume consistent intervals and complete data. Neural Ordinary Differential Equations (Neural ODEs) offer an alternative approach, utilizing neural networks combined with ODE solvers to learn continuous latent representations through parameterized vector fields. Neural Stochastic Differential Equations (Neural SDEs) extend Neural ODEs by incorporating a diffusion term, although this addition is not trivial, particularly when addressing irregular intervals and missing values. Consequently, careful design of drift and diffusion functions is crucial for maintaining stability and enhancing performance, while incautious choices can result in adverse properties such as the absence of strong solutions, stochastic destabilization, or unstable Euler discretizations, significantly affecting Neural SDEs' performance. In this study, we propose three stable classes of Neural SDEs: Langevin-type SDE, Linear Noise SDE, and Geometric SDE. Then, we rigorously demonstrate their robustness in maintaining excellent performance under distribution shift, while effectively preventing overfitting. To assess the effectiveness of our approach, we conduct extensive experiments on four benchmark datasets for interpolation, forecasting, and classification tasks, and analyze the robustness of our methods with 30 public datasets under different missing rates. Our results demonstrate the efficacy of the proposed method in handling real-world irregular time series data.", "keywords": "Neural Ordinary Differential Equations;Neural Stochastic Differential Equations;Irregular time series data", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "YongKyung Oh;Dongyoung Lim;Sungil Kim", "authorids": "~YongKyung_Oh1;~Dongyoung_Lim1;~Sungil_Kim1", "gender": ";M;M", "homepage": ";https://sites.google.com/view/dlim/;http://analytics.unist.ac.kr", "dblp": ";;", "google_scholar": ";;", "orcid": ";;", "linkedin": ";;", "or_profile": "~YongKyung_Oh1;~Dongyoung_Lim1;~Sungil_Kim1", "aff": ";Ulsan National Institute of Science and Technology;Ulsan National Institute of Science and Technology", "aff_domain": ";unist.ac.kr;unist.ac.kr", "position": ";Assistant Professor;Associate Professor", "bibtex": "@inproceedings{\noh2024stable,\ntitle={Stable Neural Stochastic Differential Equations in Analyzing Irregular Time Series Data},\nauthor={YongKyung Oh and Dongyoung Lim and Sungil Kim},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=4VIgNuQ1pY}\n}", "github": "", "project": "", "reviewers": "Q7tH;8YRs;gG9F", "pdf_size": 1326615, "rating": "6;6;8", "confidence": "3;3;4", "soundness": "3;3;3", "contribution": "3;3;3", "presentation": "3;3;3", "wc_summary": "62;88;146", "wc_strengths": "64;74;120", "wc_weaknesses": "64;163;178", "wc_questions": "168;85;84", "wc_review": "358;410;528", "wc_reply_reviewers": "15;12;48", "wc_reply_authors": "765;1175;360", "reply_reviewers": "1;1;1", "reply_authors": "1;2;1", "rating_avg": [ 6.666666666666667, 0.9428090415820634 ], "confidence_avg": [ 3.3333333333333335, 
0.4714045207910317 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 98.66666666666667, 35.11251755270318 ], "wc_strengths_avg": [ 86.0, 24.385788210895843 ], "wc_weaknesses_avg": [ 135.0, 50.57667446560717 ], "wc_questions_avg": [ 112.33333333333333, 39.36439451529206 ], "wc_review_avg": [ 432.0, 71.12430433168866 ], "wc_reply_reviewers_avg": [ 25.0, 16.30950643030009 ], "wc_reply_authors_avg": [ 766.6666666666666, 332.72444388045125 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 1.3333333333333333, 0.4714045207910317 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.9999999999999998, "gs_citation": 17, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14858899934737697192&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=4VIgNuQ1pY", "pdf": "https://openreview.net/pdf?id=4VIgNuQ1pY", "email": ";unist.ac.kr;unist.ac.kr", "author_num": 3, "aff_unique_index": "0;0", "aff_unique_norm": "Ulsan National Institute of Science and Technology", "aff_unique_dep": "", "aff_unique_url": "https://www.unist.ac.kr", "aff_unique_abbr": "UNIST", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "South Korea" }, { "title": "Unveiling the Unseen: Identifiable Clusters in Trained Depthwise Convolutional Kernels", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19461", "id": "4VgBjsOC8k", "author_site": "Zahra Babaiee, Peyman Kiasari, Daniela Rus, Radu Grosu", "tldr": "", "abstract": "Recent advances in depthwise-separable convolutional neural networks (DS-CNNs) have led to novel architectures, that surpass the performance of classical CNNs, by a considerable scalability and accuracy margin. This paper reveals another striking property of DS-CNN architectures: discernible and explainable patterns emerge in their trained depthwise convolutional kernels in all layers. Through an extensive analysis of millions of trained filters, with different sizes and from various models, we employed unsupervised clustering with autoencoders, to categorize these filters. Astonishingly, the patterns converged into a few main clusters, each resembling the difference of Gaussian (DoG) functions, and their first and second-order derivatives. Notably, we classify over 95\\% and 90\\% of the filters from state-of-the-art ConvNeXtV2 and ConvNeXt models, respectively. This finding is not merely a technological curiosity; it echoes the foundational models neuroscientists have long proposed for the vision systems of mammals. Our results thus deepen our understanding of the emergent properties of trained DS-CNNs and provide a bridge between artificial and biological visual processing systems. 
More broadly, they pave the way for more interpretable and biologically-inspired neural network designs in the future.", "keywords": "Depthwise Convolutions;Explainability;Neuroscience;Computer Vision;ConvNext", "primary_area": "visualization or interpretation of learned representations", "supplementary_material": "", "author": "Zahra Babaiee;Peyman Kiasari;Daniela Rus;Radu Grosu", "authorids": "~Zahra_Babaiee1;~Peyman_Kiasari1;~Daniela_Rus1;~Radu_Grosu1", "gender": "F;;F;M", "homepage": "https://informatics.tuwien.ac.at/people/zahra-babaiee;;https://www.csail.mit.edu/person/daniela-rus;https://ti.tuwien.ac.at/cps/people/grosu", "dblp": ";;r/DanielaRus;94/5421", "google_scholar": ";;https://scholar.google.com/citations?hl=en;1g_muAgAAAAJ", "orcid": ";;;0000-0001-5715-2142", "linkedin": "zahra-babaiee-5b4ba314b;;;", "or_profile": "~Zahra_Babaiee1;~Peyman_Kiasari1;~Daniela_Rus1;~Radu_Grosu1", "aff": "TU Wien Vienna University of Technology;;Massachusetts Institute of Technology;TU Wien Vienna University of Technology", "aff_domain": "tuwien.ac.at;;mit.edu;tuwien.ac.at", "position": "PhD student;;Full Professor;Full Professor", "bibtex": "@inproceedings{\nbabaiee2024unveiling,\ntitle={Unveiling the Unseen: Identifiable Clusters in Trained Depthwise Convolutional Kernels},\nauthor={Zahra Babaiee and Peyman Kiasari and Daniela Rus and Radu Grosu},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=4VgBjsOC8k}\n}", "github": "", "project": "", "reviewers": "hU9E;Jbbg;9rPz;GKik", "pdf_size": 23199154, "rating": "3;6;8;8", "confidence": "5;4;4;2", "soundness": "3;3;3;4", "contribution": "2;3;3;4", "presentation": "3;3;3;4", "wc_summary": "104;39;93;110", "wc_strengths": "36;137;73;219", "wc_weaknesses": "225;302;288;461", "wc_questions": "217;51;2;104", "wc_review": "582;529;456;894", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "876;755;482;865", "reply_reviewers": "0;0;0;0", "reply_authors": "2;1;1;2", "rating_avg": [ 6.25, 2.0463381929681126 ], "confidence_avg": [ 3.75, 1.0897247358851685 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 3.0, 0.7071067811865476 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 86.5, 28.09359357576029 ], "wc_strengths_avg": [ 116.25, 69.45997048660473 ], "wc_weaknesses_avg": [ 319.0, 86.96263565463043 ], "wc_questions_avg": [ 93.5, 79.90775932285925 ], "wc_review_avg": [ 615.25, 167.03798220764043 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 744.5, 158.76791237526555 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.7567450038061343, "gs_citation": 4, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=2784907143363510760&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=4VgBjsOC8k", "pdf": "https://openreview.net/pdf?id=4VgBjsOC8k", "email": "tuwien.ac.at;;mit.edu;tuwien.ac.at", "author_num": 4, "aff_unique_index": "0;1;0", "aff_unique_norm": "Vienna University of Technology;Massachusetts Institute of Technology", "aff_unique_dep": ";", "aff_unique_url": "https://www.tuwien.ac.at;https://web.mit.edu", "aff_unique_abbr": "TU Wien;MIT", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Vienna;", "aff_country_unique_index": "0;1;0", "aff_country_unique": "Austria;United States" }, { "id": "4WCqddG4Ep", "title": "Quantifying Classification 
Performance through Combinatorial Geometry and Localized Data Analysis", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Understanding the theoretical boundaries of a learning mechanism and ascertaining its fundamental capabilities remains a persistent challenge in machine learning. While the VC-dimension has been instrumental in quantifying a model's data-fitting abilities, its independence from data distribution sometimes limits its practicality. In this study, we address the problem of establishing realistic bounds on a model\u2019s classification power by harnessing the underlying combinatorial geometry of data using novel tools. We introduce conditions that rely on \\emph{local} computations performed on small data subsets to determine the \\emph{global} performance of classifiers. Specifically, by considering a dataset $\\{(X_i,y_i)\\}_{i=1}^{n}$, where $X_i\\in\\mathbb{R}^d$ is a feature vector and $y_i$ is the corresponding label, we establish optimal bounds on the training error (in terms of number of misclassifications) of a linear classifier based on the linear separability of local data subsets, each comprising of $(d + 2)$ data points. We also prove an optimal bound on the margin of Support Vector Machines (SVMs) in terms of performance of SVMs on $(d+2)$ sized subsets. Furthermore, we extend these results to a non-linear classifier employing hypersphere boundary separation. Our experimental results underscore the significance and applicability of these theoretical bounds in real-world machine learning scenarios. This research contributes valuable insights into assessing the classification potential of both linear and non-linear models for large datasets. By emphasizing local computations on subsets of data with fixed cardinality, it provides a foundation for informed and efficient decision-making in practical machine learning applications.", "keywords": "lower bound;geometrical insights;local data;classification performance;combinatorics;linear separation", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Christopher Lee;Mudassir Shabbir;Waseem Abbas", "authorids": "~Christopher_Lee10;~Mudassir_Shabbir1;~Waseem_Abbas2", "gender": "M;;", "homepage": ";;http://www.wabbas.com/", "dblp": ";78/7323;79/11046", "google_scholar": ";https://scholar.google.com.pk/citations?user=bRKvwRYAAAAJ;U9oBOmMAAAAJ", "orcid": "0000-0003-0477-7450;;", "linkedin": ";;", "or_profile": "~Christopher_Lee10;~Mudassir_Shabbir1;~Waseem_Abbas2", "aff": "University of Texas at Dallas;ITU of Punjab Lahore, Pakistan;The University of Texas at Dallas", "aff_domain": "utdallas.edu;itu.edu.pk;utdallas.edu", "position": "PhD student;Associate Professor;Assistant Professor", "bibtex": "@misc{\nlee2024quantifying,\ntitle={Quantifying Classification Performance through Combinatorial Geometry and Localized Data Analysis},\nauthor={Christopher Lee and Mudassir Shabbir and Waseem Abbas},\nyear={2024},\nurl={https://openreview.net/forum?id=4WCqddG4Ep}\n}", "github": "", "project": "", "reviewers": "re7m;RpW5;VSAx;VFVG;t2D4", "site": "https://openreview.net/forum?id=4WCqddG4Ep", "pdf_size": 612816, "rating": "3;5;5;5;6", "confidence": "4;3;4;5;3", "soundness": "4;3;4;4;2", "contribution": "1;2;2;3;3", "presentation": "3;2;4;3;2", "wc_summary": "86;53;153;62;72", "wc_strengths": "49;15;45;109;65", "wc_weaknesses": "395;75;104;303;70", "wc_questions": "2;20;1;226;2", "wc_review": "532;163;303;700;209", "wc_reply_reviewers": "0;0;0;0;0", 
"wc_reply_authors": "0;0;0;0;0", "reply_reviewers": "0;0;0;0;0", "reply_authors": "0;0;0;0;0", "rating_avg": [ 4.8, 0.9797958971132712 ], "confidence_avg": [ 3.8, 0.7483314773547882 ], "soundness_avg": [ 3.4, 0.8 ], "contribution_avg": [ 2.2, 0.7483314773547882 ], "presentation_avg": [ 2.8, 0.7483314773547882 ], "wc_summary_avg": [ 85.2, 35.628078814328454 ], "wc_strengths_avg": [ 56.6, 30.78701024783017 ], "wc_weaknesses_avg": [ 189.4, 134.02477382931858 ], "wc_questions_avg": [ 50.2, 88.18707388274089 ], "wc_review_avg": [ 381.4, 203.83974097314783 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.3273268353539886, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:XXbM6lowOY0J:scholar.google.com/&scioq=Quantifying+Classification+Performance+through+Combinatorial+Geometry+and+Localized+Data+Analysis&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;1;0", "aff_unique_norm": "University of Texas at Dallas;ITU of Punjab", "aff_unique_dep": ";", "aff_unique_url": "https://www.utdallas.edu;", "aff_unique_abbr": "UT Dallas;", "aff_campus_unique_index": "0;1;0", "aff_campus_unique": "Dallas;Lahore", "aff_country_unique_index": "0;1;0", "aff_country_unique": "United States;Pakistan" }, { "id": "4WKDwIaF7y", "title": "Lookahead Sharpness-Aware Minimization", "track": "main", "status": "Reject", "tldr": "", "abstract": "Sharpness-Aware Minimization (SAM), which performs gradient descent on adversarially perturbed weights, can improve generalization by\nidentifying flatter minima. However, recent studies have shown that SAM may suffer from convergence instability and oscillate around saddle points, resulting in slow convergence and inferior performance.\nTo address this problem, we propose the use of a lookahead mechanism in the methods of extra-gradient and optimistic gradient.\nBy examining the nature of SAM, we simplify the extrapolation procedure, resulting in a more efficient algorithm.\nTheoretical results show that the proposed method converge to a stationary point and escape saddle points faster. 
Experiments on standard benchmark datasets also verify that the proposed method outperforms the SOTAs, and converge more effectively to flat minima.", "keywords": "Deep Learning;Sharpness-Aware Minimization", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Runsheng Yu;Youzhi Zhang;James Kwok", "authorids": "~Runsheng_Yu2;~Youzhi_Zhang2;~James_Kwok1", "gender": "Not Specified;;", "homepage": "https://www.linkedin.com/in/runsheng-yu-560696127/;https://youzhi333.github.io/index.html;", "dblp": "210/2646.html?q=runsheng%20yu;131/9490-1;", "google_scholar": ";i2j5DmwAAAAJ;", "orcid": "0000-0003-0053-1234;0000-0002-2984-734X;", "linkedin": ";;", "or_profile": "~Runsheng_Yu2;~Youzhi_Zhang2;~James_Kwok1", "aff": "Hong Kong University of Science and Technology;Centre for Artificial Intelligence and Robotics, Hong Kong Institute of Science & Innovation, Chinese Academy of Sciences;", "aff_domain": "ust.hk;cair-cas.org.hk;", "position": "PhD student;Assistant Professor;", "bibtex": "@misc{\nyu2024lookahead,\ntitle={Lookahead Sharpness-Aware Minimization},\nauthor={Runsheng Yu and Youzhi Zhang and James Kwok},\nyear={2024},\nurl={https://openreview.net/forum?id=4WKDwIaF7y}\n}", "github": "", "project": "", "reviewers": "hY3b;1P81;gBpE;rtXV", "site": "https://openreview.net/forum?id=4WKDwIaF7y", "pdf_size": 4328500, "rating": "3;5;5;6", "confidence": "4;4;4;3", "soundness": "3;3;3;3", "contribution": "1;3;2;2", "presentation": "2;3;2;3", "wc_summary": "124;59;20;101", "wc_strengths": "14;100;11;63", "wc_weaknesses": "587;5;145;73", "wc_questions": "71;284;1;2", "wc_review": "796;448;177;239", "wc_reply_reviewers": "251;74;63;15", "wc_reply_authors": "3041;894;908;682", "reply_reviewers": "1;1;1;1", "reply_authors": "5;3;2;1", "rating_avg": [ 4.75, 1.0897247358851685 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 76.0, 39.85599076675927 ], "wc_strengths_avg": [ 47.0, 36.9120576505835 ], "wc_weaknesses_avg": [ 202.5, 227.44394913912308 ], "wc_questions_avg": [ 89.5, 115.82422026502056 ], "wc_review_avg": [ 415.0, 241.8005376338109 ], "wc_reply_reviewers_avg": [ 100.75, 89.5387485952311 ], "wc_reply_authors_avg": [ 1381.25, 962.4316534175297 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 2.75, 1.479019945774904 ], "replies_avg": [ 22, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.6622661785325219, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:gTAxBl5bXQYJ:scholar.google.com/&scioq=Lookahead+Sharpness-Aware+Minimization&hl=en&as_sdt=0,44", "gs_version_total": 0, "aff_unique_index": "0;1", "aff_unique_norm": "Hong Kong University of Science and Technology;Hong Kong Institute of Science & Innovation, Chinese Academy of Sciences", "aff_unique_dep": ";Centre for Artificial Intelligence and Robotics", "aff_unique_url": "https://www.ust.hk;", "aff_unique_abbr": "HKUST;", "aff_campus_unique_index": "0", "aff_campus_unique": "Hong Kong SAR;", "aff_country_unique_index": "0;0", "aff_country_unique": "China" }, { "title": "Learning from Sparse Offline Datasets via Conservative Density Estimation", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19460", "id": "4WM0OogPTx", "author_site": "Zhepeng Cen, Zuxin Liu, Zitong Wang, Yihang Yao, Henry Lam, DING ZHAO", "tldr": "", "abstract": 
"Offline reinforcement learning (RL) offers a promising direction for learning policies from pre-collected datasets without requiring further interactions with the environment. However, existing methods struggle to handle out-of-distribution (OOD) extrapolation errors, especially in sparse reward or scarce data settings. In this paper, we propose a novel training algorithm called Conservative Density Estimation (CDE), which addresses this challenge by explicitly imposing constraints on the state-action occupancy stationary distribution. CDE overcomes the limitations of existing approaches, such as the stationary distribution correction method, by addressing the support mismatch issue in marginal importance sampling. Our method achieves state-of-the-art performance on the D4RL benchmark. Notably, CDE consistently outperforms baselines in challenging tasks with sparse rewards or insufficient data, demonstrating the advantages of our approach in addressing the extrapolation error problem in offline RL.", "keywords": "offline reinforcement learning;stationary distribution correction estimation", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Zhepeng Cen;Zuxin Liu;Zitong Wang;Yihang Yao;Henry Lam;Ding Zhao", "authorids": "~Zhepeng_Cen1;~Zuxin_Liu1;~Zitong_Wang1;~Yihang_Yao1;~Henry_Lam1;~Ding_Zhao1", "gender": "M;M;M;;;", "homepage": "https://czp16.github.io/;https://www.zuxin.me;;https://yihangyao.github.io/;http://www.columbia.edu/~khl2114/;https://safeai-lab.github.io", "dblp": "254/6182;227/3137;;305/7045.html;35/9508;", "google_scholar": "M-X3Q-UAAAAJ;5ApCTCoAAAAJ;v6UwRlwAAAAJ;EPduTdwAAAAJ;Bnj50x0AAAAJ;z7tPc9IAAAAJ", "orcid": ";0000-0001-7412-5074;;;;", "linkedin": ";zuxin-liu/;;yihang-yao-3a7658249/;;", "or_profile": "~Zhepeng_Cen1;~Zuxin_Liu1;~Zitong_Wang1;~Yihang_Yao1;~Henry_Lam1;~Ding_Zhao1", "aff": "Carnegie Mellon University;Salesforce AI Research;Columbia University;Carnegie Mellon University;Columbia University;Carnegie Mellon University", "aff_domain": "andrew.cmu.edu;salesforce.com;columbia.edu;cmu.edu;columbia.edu;cmu.edu", "position": "PhD student;Researcher;PhD student;PhD student;Associate Professor;Associate Professor", "bibtex": "@inproceedings{\ncen2024learning,\ntitle={Learning from Sparse Offline Datasets via Conservative Density Estimation},\nauthor={Zhepeng Cen and Zuxin Liu and Zitong Wang and Yihang Yao and Henry Lam and Ding Zhao},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=4WM0OogPTx}\n}", "github": "", "project": "", "reviewers": "MKs2;HRnW;6pFf;voqr", "pdf_size": 2547850, "rating": "5;6;8;8", "confidence": "4;3;3;3", "soundness": "2;3;3;3", "contribution": "2;3;4;3", "presentation": "2;3;3;3", "wc_summary": "39;68;37;236", "wc_strengths": "35;129;86;38", "wc_weaknesses": "231;168;117;137", "wc_questions": "38;2;37;2", "wc_review": "343;367;277;413", "wc_reply_reviewers": "0;0;51;0", "wc_reply_authors": "1135;568;572;311", "reply_reviewers": "0;0;1;0", "reply_authors": "2;1;2;1", "rating_avg": [ 6.75, 1.299038105676658 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 3.0, 0.7071067811865476 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 95.0, 82.32557318354972 ], "wc_strengths_avg": [ 72.0, 38.632887544163715 ], "wc_weaknesses_avg": [ 163.25, 43.129891026989625 ], "wc_questions_avg": [ 19.75, 17.75352077758099 ], "wc_review_avg": [ 350.0, 
49.08156476723211 ], "wc_reply_reviewers_avg": [ 12.75, 22.083647796503186 ], "wc_reply_authors_avg": [ 646.5, 301.207984621922 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.7777777777777777, "gs_citation": 7, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12655561621720249093&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=4WM0OogPTx", "pdf": "https://openreview.net/pdf?id=4WM0OogPTx", "email": "andrew.cmu.edu;salesforce.com;columbia.edu;cmu.edu;columbia.edu;cmu.edu", "author_num": 6, "aff_unique_index": "0;1;2;0;2;0", "aff_unique_norm": "Carnegie Mellon University;Salesforce;Columbia University", "aff_unique_dep": ";Salesforce AI Research;", "aff_unique_url": "https://www.cmu.edu;https://www.salesforce.com;https://www.columbia.edu", "aff_unique_abbr": "CMU;Salesforce AI;Columbia", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "4WRoRL0YKR", "title": "Explainable Multi-Objective Model Selection for Time Series Forecasting", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Machine learning (ML) models exhibit miscellaneous properties, and deployment inevitably trades certain performance aspects against others. This is particularly valid for time series forecasting, where special characteristics such as seasonality impact how models perform. Since there is \u201cno free lunch\u201d, practitioners have to choose among available methods when assembling new learning systems. Benchmarks, meta-learning, and automated ML come to aid, but in many cases focus on predictive capabilities while ignoring other aspects such as complexity and resource consumption. This is especially concerning considering the popularity of deep neural networks (DNNs) for forecasting, as these models are widely conceived as computation-heavy black boxes. To alleviate these shortcomings, we propose X-PCR \u2013 a novel approach for explainable multi-objective model selection. It uses meta-learning to assess the suitability of any model in terms of (p)redictive error, (c)omplexity and (r)esource demand. By allowing users to prioritize the individual objectives in this trade-off, model recommendations become both controllable and understandable. We demonstrate the feasibility of our methodology in the task of forecasting time series with state-of-the-art DNNs. In total, we perform over 1000 experiments across 114 data sets, discuss the resulting efficiency landscape, and provide evidence of how X-PCR outperforms other selection approaches. 
On average, our approach only requires 20% of computation costs for recommending models with 85% of the best possible performance.", "keywords": "Meta-learning;Time Series Forecasting;Resource-aware ML;Explainability;Trustworthy AI", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "", "author": "Raphael Fischer;Amal Saadallah", "authorids": "~Raphael_Fischer1;~Amal_Saadallah1", "gender": "M;F", "homepage": "https://lamarr.cs.tu-dortmund.de/team/raphael-fischer;https://www-ai.cs.tu-dortmund.de/PERSONAL/saadallah.html", "dblp": "249/4056;242/4220.html", "google_scholar": "https://scholar.google.de/citations?user=zxTGb7AAAAAJ;UxU-Q-gAAAAJ", "orcid": "0000-0002-1808-5773;0000-0003-2976-7574", "linkedin": "raphael-fischer-3b1046208/;", "or_profile": "~Raphael_Fischer1;~Amal_Saadallah1", "aff": "TU Dortmund University;Technische Universit\u00e4t Dortmund", "aff_domain": "udo.edu;tu-dortmund.de", "position": "PhD student;Postdoc", "bibtex": "@misc{\nfischer2024explainable,\ntitle={Explainable Multi-Objective Model Selection for Time Series Forecasting},\nauthor={Raphael Fischer and Amal Saadallah},\nyear={2024},\nurl={https://openreview.net/forum?id=4WRoRL0YKR}\n}", "github": "", "project": "", "reviewers": "m8sj;4DT3;Sacq", "site": "https://openreview.net/forum?id=4WRoRL0YKR", "pdf_size": 753472, "rating": "3;3;5", "confidence": "4;3;3", "soundness": "1;2;2", "contribution": "1;1;2", "presentation": "2;2;2", "wc_summary": "76;96;57", "wc_strengths": "17;17;56", "wc_weaknesses": "339;111;72", "wc_questions": "85;70;72", "wc_review": "517;294;257", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "133;79;86", "reply_reviewers": "0;0;0", "reply_authors": "1;1;1", "rating_avg": [ 3.6666666666666665, 0.9428090415820634 ], "confidence_avg": [ 3.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 1.6666666666666667, 0.4714045207910317 ], "contribution_avg": [ 1.3333333333333333, 0.4714045207910317 ], "presentation_avg": [ 2.0, 0.0 ], "wc_summary_avg": [ 76.33333333333333, 15.923427883328248 ], "wc_strengths_avg": [ 30.0, 18.384776310850235 ], "wc_weaknesses_avg": [ 174.0, 117.75398082442904 ], "wc_questions_avg": [ 75.66666666666667, 6.649979114420002 ], "wc_review_avg": [ 356.0, 114.84192033689904 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 99.33333333333333, 23.976840677805924 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 6, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.5, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:jSpCvMouZPoJ:scholar.google.com/&scioq=Explainable+Multi-Objective+Model+Selection+for+Time+Series+Forecasting&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "Technische Universit\u00e4t Dortmund", "aff_unique_dep": "", "aff_unique_url": "https://www.tu-dortmund.de", "aff_unique_abbr": "TU Dortmund", "aff_campus_unique_index": "0", "aff_campus_unique": "Dortmund;", "aff_country_unique_index": "0;0", "aff_country_unique": "Germany" }, { "id": "4WZNdnwmhk", "title": "Parameter-Efficient Fine-Tuning via Partially Decomposable Loss Analysis and Sharing", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Large language model (LLM) has become a crucial tool for many machine learning research and applications. Due to the large parameter count of these models and the enormous amount of training data, large language models are usually strong at general tasks. 
For most applications, however, one would like a smaller, more parameter-efficient model that is specialized in a particular field. This motivates the design of fine-tuning, which tunes a pre-trained LLM for a few iterations on a dedicated dataset for specific tasks. If not handled correctly, the fine-tuning process would create another LLM that has a comparable number of parameters, significantly slowing downstream applications.\n\nOne of the most widely-known ideas for resolving this issue is the Low-Rank Adaptation (LoRA) framework, where one assumes the fine-tuning weights are low-rank, and therefore the number of parameters, together with the inference time, is drastically improved. While performing well in practice, the LoRA method is still a heuristic and lacks theoretical guarantees even though the loss function might inherit certain structures. Moreover, when fine-tuning multiple similar tasks in parallel, LoRA requires one to learn a pair of distinct low-rank matrices for each task, ignoring possible shared structure between tasks.\n\nIn this work, we design a framework that further reduces parameter count compared to LoRA and enables parameter sharing across different parallel fine-tuning tasks. When the number of parallel fine-tuning tasks grows larger, we cut the parameter count almost in half compared to LoRA. Moreover, we prove why our approach --- or, more generally, LoRA --- works for a large class of loss functions. We empirically verify the effectiveness of our method on various benchmark models and datasets, demonstrating a much improved parameter count while retaining performance similar to LoRA.", "keywords": "Fine-tuning;efficient training", "primary_area": "optimization", "supplementary_material": "", "author": "Raghavendra Addanki;Ritwik Sinha;Zhao Song;Yizhou Wang;Lichen Zhang", "authorids": "~Raghavendra_Addanki1;~Ritwik_Sinha1;~Zhao_Song3;~Yizhou_Wang3;~Lichen_Zhang2", "gender": "M;M;M;M;M", "homepage": "https://raddanki.github.io/;https://research.adobe.com/person/ritwik-sinha/;https://www.youtube.com/@zhaosong2031;https://wyzjack.github.io/;https://lczh.github.io/", "dblp": "218/5579;127/3163;76/4051-2;71/3387-6;00/6357-3", "google_scholar": "SUPaOhgAAAAJ;https://scholar.google.co.in/citations?user=4SDTMIQAAAAJ;yDZct7UAAAAJ;H4kqV1MAAAAJ;https://scholar.google.com/citations?view_op=list_works", "orcid": ";;;0000-0003-1601-9649;", "linkedin": ";;;yizhou-wang-786603155/;", "or_profile": "~Raghavendra_Addanki1;~Ritwik_Sinha1;~Zhao_Song3;~Yizhou_Wang3;~Lichen_Zhang2", "aff": "Adobe Systems;Adobe Systems;Adobe;Northeastern University;Amazon", "aff_domain": "adobe.com;adobe.com;adobe.com;northeastern.edu;amazon.com", "position": "Research Scientist;Researcher;Researcher;PhD student;Intern", "bibtex": "@misc{\naddanki2024parameterefficient,\ntitle={Parameter-Efficient Fine-Tuning via Partially Decomposable Loss Analysis and Sharing},\nauthor={Raghavendra Addanki and Ritwik Sinha and Zhao Song and Yizhou Wang and Lichen Zhang},\nyear={2024},\nurl={https://openreview.net/forum?id=4WZNdnwmhk}\n}", "github": "", "project": "", "reviewers": "rWs7;GVCH;Va7k", "site": "https://openreview.net/forum?id=4WZNdnwmhk", "pdf_size": 265640, "rating": "3;3;5", "confidence": "4;2;3", "soundness": "1;2;3", "contribution": "2;3;2", "presentation": "3;3;3", "wc_summary": "28;99;87", "wc_strengths": "29;85;79", "wc_weaknesses": "218;53;107", "wc_questions": "8;2;71", "wc_review": "283;239;344", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0",
"rating_avg": [ 3.6666666666666665, 0.9428090415820634 ], "confidence_avg": [ 3.0, 0.816496580927726 ], "soundness_avg": [ 2.0, 0.816496580927726 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 71.33333333333333, 31.030450993965413 ], "wc_strengths_avg": [ 64.33333333333333, 25.104227178350307 ], "wc_weaknesses_avg": [ 126.0, 68.68769904429759 ], "wc_questions_avg": [ 27.0, 31.20897306865447 ], "wc_review_avg": [ 288.6666666666667, 43.05293898859351 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 3, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:rwCji96uKrUJ:scholar.google.com/&scioq=Parameter-Efficient+Fine-Tuning+via+Partially+Decomposable+Loss+Analysis+and+Sharing&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;0;0;1;2", "aff_unique_norm": "Adobe;Northeastern University;Amazon", "aff_unique_dep": "Adobe Systems Incorporated;;Amazon.com, Inc.", "aff_unique_url": "https://www.adobe.com;https://www.northeastern.edu;https://www.amazon.com", "aff_unique_abbr": "Adobe;NEU;Amazon", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "United States" }, { "title": "Llemma: An Open Language Model for Mathematics", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19459", "id": "4WnqRR915j", "author_site": "Zhangir Azerbayev, Hailey Schoelkopf, Keiran Paster, Marco Dos Santos, Stephen McAleer, Qiaochu Jiang, Jia Deng, Stella R Biderman, Sean Welleck", "tldr": "", "abstract": "We present Llemma, a large language model for mathematics. We continue pretraining Code Llama on the Proof-Pile-2, a mixture of scientific papers, web data containing mathematics, and mathematical code, yielding Llemma. On the MATH benchmark Llemma outperforms all known openly released models, as well as the unreleased Minerva model suite on an equi-parameter basis. Moreover, Llemma is capable of tool use and formal theorem proving without any finetuning. We openly release all artifacts, including 7 billion and 34 billion parameter models, the Proof-Pile-2, and code to replicate our experiments.", "keywords": "reasoning;language models;pretraining", "primary_area": "generative models", "supplementary_material": "/attachment/1db90b39240173c73d9cf5a455dc8fb7ce342985.zip", "author": "Zhangir Azerbayev;Hailey Schoelkopf;Keiran Paster;Marco Dos Santos;Stephen Marcus McAleer;Albert Q. 
Jiang;Jia Deng;Stella Biderman;Sean Welleck", "authorids": "~Zhangir_Azerbayev1;~Hailey_Schoelkopf1;~Keiran_Paster1;~Marco_Dos_Santos1;~Stephen_Marcus_McAleer1;~Albert_Q._Jiang1;~Jia_Deng1;~Stella_Biderman1;~Sean_Welleck1", "gender": "M;F;M;M;M;;M;F;", "homepage": ";;http://keirp.com;;https://www.andrew.cmu.edu/user/smcaleer/;;;http://www.stellabiderman.com;", "dblp": ";;;;;;07/6526-1.html;239/5641;", "google_scholar": ";XLahYIYAAAAJ;;;iEFL4-YAAAAJ;;U3Eub-EAAAAJ;bO7H0DAAAAAJ;", "orcid": ";;;;;;;0000-0001-8228-1042;", "linkedin": "zhangir-azerbayev-314ab21b8/;;;dsantosmarco/;stephen-mcaleer/;;;stellabiderman;", "or_profile": "~Zhangir_Azerbayev1;~Hailey_Schoelkopf1;~Keiran_Paster1;~Marco_Dos_Santos1;~Stephen_Marcus_McAleer1;~Albert_Q._Jiang1;~Jia_Deng1;~Stella_Biderman1;~Sean_Welleck1", "aff": ";EleutherAI;University of Toronto;Sorbonne University;Carnegie Mellon University;;Princeton University;Booz Allen Hamilton;", "aff_domain": ";eleuther.ai;toronto.edu;sorbonne-universite.fr;cmu.edu;;princeton.edu;boozallen.com;", "position": ";Researcher;PhD student;MS student;Postdoc;;Associate Professor;Industry researcher;", "bibtex": "@inproceedings{\nazerbayev2024llemma,\ntitle={Llemma: An Open Language Model for Mathematics},\nauthor={Zhangir Azerbayev and Hailey Schoelkopf and Keiran Paster and Marco Dos Santos and Stephen Marcus McAleer and Albert Q. Jiang and Jia Deng and Stella Biderman and Sean Welleck},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=4WnqRR915j}\n}", "github": "", "project": "", "reviewers": "JQiP;HYfd;Ch2c", "pdf_size": 441862, "rating": "6;6;8", "confidence": "2;4;3", "soundness": "2;3;3", "contribution": "3;3;3", "presentation": "3;3;3", "wc_summary": "57;54;26", "wc_strengths": "56;37;53", "wc_weaknesses": "160;37;55", "wc_questions": "22;17;29", "wc_review": "295;145;163", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "488;592;390", "reply_reviewers": "0;0;0", "reply_authors": "1;1;1", "rating_avg": [ 6.666666666666667, 0.9428090415820634 ], "confidence_avg": [ 3.0, 0.816496580927726 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 45.666666666666664, 13.960261060914616 ], "wc_strengths_avg": [ 48.666666666666664, 8.339997335464536 ], "wc_weaknesses_avg": [ 84.0, 54.24020648928247 ], "wc_questions_avg": [ 22.666666666666668, 4.9216076867444665 ], "wc_review_avg": [ 201.0, 66.87301398920195 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 490.0, 82.47827996913288 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 9, 0 ], "authors#_avg": [ 9, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 320, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=8004581123322544769&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 8, "openreview": "https://openreview.net/forum?id=4WnqRR915j", "pdf": "https://openreview.net/pdf?id=4WnqRR915j", "email": ";eleuther.ai;toronto.edu;sorbonne-universite.fr;cmu.edu;;princeton.edu;boozallen.com;", "author_num": 9, "aff_unique_index": "0;1;2;3;4;5", "aff_unique_norm": "EleutherAI;University of Toronto;Sorbonne University;Carnegie Mellon University;Princeton University;Booz Allen Hamilton", "aff_unique_dep": ";;;;;", "aff_unique_url": "https://www.eleuther.ai;https://www.utoronto.ca;https://www.sorbonne.universite.fr;https://www.cmu.edu;https://www.princeton.edu;https://www.boozallen.com", 
"aff_unique_abbr": "EleutherAI;U of T;Sorbonne;CMU;Princeton;BAH", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;2;0;0;0", "aff_country_unique": "United States;Canada;France" }, { "id": "4XCfu7fTgw", "title": "Spectral Contrastive Regression", "track": "main", "status": "Reject", "tldr": "", "abstract": "While several techniques have been proposed to enhance the generalization of\ndeep learning models for classification problems, limited research has been con-\nducted on improving generalization for regression tasks. This is primarily due\nto the continuous nature of regression labels, which makes it challenging to di-\nrectly apply classification-based techniques to regression tasks. Conversely, exist-\ning regression methods overlook feature-level generalization and primarily focus\non data augmentation using linear interpolation, which may not be an effective\napproach for synthesizing data for regression. In this paper, we introduce a novel\ngeneralization method for regression tasks based on the metric learning assump-\ntion that the distance between features and labels should be proportional. Unlike\nprevious approaches that solely consider the scale prediction of this proportion and\ndisregard its variation among samples, we argue that this proportion is not constant\nand can be defined as a mapping function. Additionally, we propose minimizing\nthe error of this function and stabilizing its fluctuating behavior by smoothing\nout its variations. The t-SNE visualization of the embedding space demonstrates\nthat our proposed loss function generates a more discriminative pattern with re-\nduced variance. To enhance Out-of-Distribution (OOD) generalization, we lever-\nage the characteristics of the spectral norm (i.e., the sub-multiplicativity of the\nspectral norm of the feature matrix can be expressed as Frobenius norm of the\noutput), and align the maximum singular value of the feature matrices across dif-\nferent domains. Experimental results on the MPI3D benchmark dataset reveal\nthat aligning the spectral norms significantly improves the unstable performance\non OOD data. We conduct experiments on eight benchmark datasets for domain\ngeneralization in regression, and our method consistently outperforms state-of-\nthe-art approaches in the majority of cases. Our code is available in an anonymous\nrepository, and it will be made publicly available upon acceptance of the paper: https://github.com/workerasd/SCR", "keywords": "Metric Learning;Out-of-Distribution Generalization;In-Distribution Generalization;Regression", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Kaiyu Guo;Zijian Wang;Brian C. 
Lovell;Mahsa Baktashmotlagh", "authorids": "~Kaiyu_Guo2;~Zijian_Wang2;~Brian_C._Lovell1;~Mahsa_Baktashmotlagh1", "gender": "M;M;F;M", "homepage": ";;;https://staff.itee.uq.edu.au/lovell/", "dblp": "262/2952;03/4540-9;119/1507;09/2347", "google_scholar": "fC6KpI0AAAAJ;OfTXHvsAAAAJ;https://scholar.google.com.au/citations?user=3kaiBBYAAAAJ;https://scholar.google.com.au/citations?user=gXiGxcMAAAAJ", "orcid": "0000-0002-4187-2839;;;0000-0001-6722-1754", "linkedin": ";;;brian-lovell-0997594/", "or_profile": "~Kaiyu_Guo2;~Zijian_Wang2;~Mahsa_Baktashmotlagh1;~Brian_Lovell1", "aff": "University of Queensland;The University of Queensland;The University of Queensland;University of Queensland", "aff_domain": "uq.edu.au;uq.edu.au;uq.edu.au;uq.edu.au", "position": "PhD student;Postdoc;Assistant Professor;Professor", "bibtex": "@misc{\nguo2024spectral,\ntitle={Spectral Contrastive Regression},\nauthor={Kaiyu Guo and Zijian Wang and Brian C. Lovell and Mahsa Baktashmotlagh},\nyear={2024},\nurl={https://openreview.net/forum?id=4XCfu7fTgw}\n}", "github": "", "project": "", "reviewers": "xKM4;xHdj;Rgn5", "site": "https://openreview.net/forum?id=4XCfu7fTgw", "pdf_size": 5375266, "rating": "5;5;5", "confidence": "4;3;4", "soundness": "3;3;3", "contribution": "2;3;2", "presentation": "2;2;3", "wc_summary": "104;65;41", "wc_strengths": "11;72;47", "wc_weaknesses": "133;117;65", "wc_questions": "34;392;243", "wc_review": "282;646;396", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "744;395;973", "reply_reviewers": "0;0;0", "reply_authors": "2;1;3", "rating_avg": [ 5.0, 0.0 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 70.0, 25.96150997149434 ], "wc_strengths_avg": [ 43.333333333333336, 25.037749277618563 ], "wc_weaknesses_avg": [ 105.0, 29.028721409436322 ], "wc_questions_avg": [ 223.0, 146.83550887529444 ], "wc_review_avg": [ 441.3333333333333, 152.020466458376 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 704.0, 237.6566150282097 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 2.0, 0.816496580927726 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:dSDibI2Z_vMJ:scholar.google.com/&scioq=Spectral+Contrastive+Regression&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "University of Queensland", "aff_unique_dep": "", "aff_unique_url": "https://www.uq.edu.au", "aff_unique_abbr": "UQ", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "Australia" }, { "id": "4Y4hPWUppN", "title": "Key point is key in resolving the offline three-dimensional bin packing problem", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "In recent years, with the surge in deep learning and reinforcement learning, researchers have begun to explore the use of deep reinforcement learning to solve the offline three-dimensional bin packing problem. However, the valid action space in the offline three-dimensional bin packing problem is quite large, making it difficult for the model to converge as the number of boxes increases. Therefore, reducing the number of valid actions is crucial. 
In previous studies, many researchers have developed heuristic rules to reduce the number of effective actions. However, some of these heuristic rules drastically reduce the number of valid actions, potentially forgoing the optimal solution, while others do not sufficiently reduce the number of effective actions, making it still challenging for the model to converge when there are many boxes. In response to this, we propose a heuristic rule where boxes are placed only at certain specific locations, which we refer to as Key Points, while other locations are masked. This method integrates well with existing deep reinforcement learning models for solving the offline three-dimensional bin packing problem. We not only theoretically demonstrate the efficacy of this heuristic rule but also empirically show that when our method is combined with existing models, it can easily train with four times the number of boxes. The model converges ten times faster than before, and its performance also improves. Interestingly, even without retraining the model, using our method in the testing phase yields better results than the original method. We also compare our method to other heuristic rules. Experimental results show that our approach strikes a balance between convergence speed and performance.", "keywords": "deep reinforcement learning; three-dimensional offline packing;", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/a6379ff5d04f970d800bd7b1e295da271271eef3.zip", "author": "Xinyuan Tian;pengzhan qu;Hongsheng Qi", "authorids": "~Xinyuan_Tian1;~pengzhan_qu1;~Hongsheng_Qi1", "gender": ";;M", "homepage": ";;https://lenovo.com", "dblp": ";;", "google_scholar": ";;", "orcid": ";0000-0001-5910-3694;", "linkedin": ";;hong-sheng-qi-a542151/", "or_profile": "~Xinyuan_Tian1;~pengzhan_qu1;~Hongsheng_Qi1", "aff": ";Lenovo;Xi'an University of Electronic Science and Technology", "aff_domain": ";lenovo.com;xidian.edu.cn", "position": ";Principal Researcher;Lecturer", "bibtex": "@misc{\ntian2024key,\ntitle={Key point is key in resolving the offline three-dimensional bin packing problem},\nauthor={Xinyuan Tian and pengzhan qu and Hongsheng Qi},\nyear={2024},\nurl={https://openreview.net/forum?id=4Y4hPWUppN}\n}", "github": "", "project": "", "reviewers": "RRYs;TnxE;z1aJ", "site": "https://openreview.net/forum?id=4Y4hPWUppN", "pdf_size": 537850, "rating": "1;3;3", "confidence": "5;4;5", "soundness": "3;2;2", "contribution": "1;3;2", "presentation": "3;1;1", "wc_summary": "84;93;43", "wc_strengths": "37;25;34", "wc_weaknesses": "356;102;350", "wc_questions": "15;37;28", "wc_review": "492;257;455", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 2.3333333333333335, 0.9428090415820634 ], "confidence_avg": [ 4.666666666666667, 0.4714045207910317 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.816496580927726 ], "presentation_avg": [ 1.6666666666666667, 0.9428090415820634 ], "wc_summary_avg": [ 73.33333333333333, 21.761331658599286 ], "wc_strengths_avg": [ 32.0, 5.0990195135927845 ], "wc_weaknesses_avg": [ 269.3333333333333, 118.34788642904539 ], "wc_questions_avg": [ 26.666666666666668, 9.030811456096044 ], "wc_review_avg": [ 401.3333333333333, 103.1708399802106 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 3, 0 ], "authors#_avg": [
3, 0 ], "corr_rating_confidence": -0.4999999999999999, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:j_3GAMb_huUJ:scholar.google.com/&scioq=Key+point+is+key+in+resolving+the+offline+three-dimensional+bin+packing+problem&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;1", "aff_unique_norm": "Lenovo Group Limited;Xi'an University of Electronic Science and Technology", "aff_unique_dep": ";", "aff_unique_url": "https://www.lenovo.com;http://www.xidian.edu.cn/", "aff_unique_abbr": "Lenovo;Xidian University", "aff_campus_unique_index": "1", "aff_campus_unique": ";Xi'an", "aff_country_unique_index": "0;0", "aff_country_unique": "China" }, { "title": "NfgTransformer: Equivariant Representation Learning for Normal-form Games", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19458", "id": "4YESQqIys7", "author_site": "SIQI LIU, Luke Marris, Georgios Piliouras, Ian Gemp, Nicolas Heess", "tldr": "", "abstract": "Normal-form games (NFGs) are the fundamental model of *strategic interaction*. We study their representation using neural networks. We describe the inherent equivariance of NFGs --- any permutation of strategies describes an equivalent game --- as well as the challenges this poses for representation learning. We then propose the NfgTransformer architecture that leverages this equivariance, leading to state-of-the-art performance in a range of game-theoretic tasks including equilibrium-solving, deviation gain estimation and ranking, with a common approach to NFG representation. We show that the resulting model is interpretable and versatile, paving the way towards deep learning systems capable of game-theoretic reasoning when interacting with humans and with each other.", "keywords": "Game Theory;Deep Learning;Representation Learning;Nash Equilibrium", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/0b4fd48a1700b50096ccdbc85285c7722631b18e.pdf", "author": "Siqi Liu;Luke Marris;Georgios Piliouras;Ian Gemp;Nicolas Heess", "authorids": "~Siqi_Liu1;~Luke_Marris2;~Georgios_Piliouras1;~Ian_Gemp1;~Nicolas_Heess1", "gender": "M;;;M;", "homepage": "http://siqi.fr/;https://www.lukemarris.info/;;https://imgemp.github.io/;", "dblp": "60/9360-2.html;223/4422;62/1236;66/10996;76/9181", "google_scholar": "7U_OA0oAAAAJ;dvTeSX4AAAAJ;;5vo3MeEAAAAJ;79k7bGEAAAAJ", "orcid": "0000-0001-6381-4552;;;;", "linkedin": ";;;;", "or_profile": "~Siqi_Liu1;~Luke_Marris2;~Georgios_Piliouras1;~Ian_Gemp1;~Nicolas_Heess1", "aff": "Google;University College London;Singapore University of Technology and Design;Google DeepMind;Google DeepMind", "aff_domain": "google.com;ucl.ac.uk;sutd.edu.sg;google.com;google.com", "position": "Research Engineer;PhD student;Associate Professor;Research Scientist;Research Scientist", "bibtex": "@inproceedings{\nliu2024nfgtransformer,\ntitle={NfgTransformer: Equivariant Representation Learning for Normal-form Games},\nauthor={Siqi Liu and Luke Marris and Georgios Piliouras and Ian Gemp and Nicolas Heess},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=4YESQqIys7}\n}", "github": "", "project": "", "reviewers": "6Yok;s4as;6Avg;pter", "pdf_size": 858335, "rating": "3;5;8;8", "confidence": "4;4;4;3", "soundness": "2;2;4;2", "contribution": "1;2;4;1", "presentation": "1;3;3;1", "wc_summary": "56;62;94;29", "wc_strengths": "17;47;66;18", "wc_weaknesses": "417;205;82;1022", 
"wc_questions": "42;4;57;43", "wc_review": "532;318;299;1112", "wc_reply_reviewers": "0;61;170;1031", "wc_reply_authors": "678;1015;931;1960", "reply_reviewers": "0;1;1;5", "reply_authors": "2;3;5;7", "rating_avg": [ 6.0, 2.1213203435596424 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.8660254037844386 ], "contribution_avg": [ 2.0, 1.224744871391589 ], "presentation_avg": [ 2.0, 1.0 ], "wc_summary_avg": [ 60.25, 23.112496619794236 ], "wc_strengths_avg": [ 37.0, 20.627651344736268 ], "wc_weaknesses_avg": [ 431.5, 361.3699627805277 ], "wc_questions_avg": [ 36.5, 19.67866865415443 ], "wc_review_avg": [ 565.25, 328.6574014076056 ], "wc_reply_reviewers_avg": [ 315.5, 417.5586785111764 ], "wc_reply_authors_avg": [ 1146.0, 486.05709541163986 ], "reply_reviewers_avg": [ 1.75, 1.920286436967152 ], "reply_authors_avg": [ 4.25, 1.920286436967152 ], "replies_avg": [ 31, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.5443310539518174, "gs_citation": 7, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=16489762721706866882&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=4YESQqIys7", "pdf": "https://openreview.net/pdf?id=4YESQqIys7", "email": "google.com;ucl.ac.uk;sutd.edu.sg;google.com;google.com", "author_num": 5, "aff_unique_index": "0;1;2;0;0", "aff_unique_norm": "Google;University College London;Singapore University of Technology and Design", "aff_unique_dep": "Google;;", "aff_unique_url": "https://www.google.com;https://www.ucl.ac.uk;https://www.sutd.edu.sg", "aff_unique_abbr": "Google;UCL;SUTD", "aff_campus_unique_index": "0", "aff_campus_unique": "Mountain View;", "aff_country_unique_index": "0;1;2;1;1", "aff_country_unique": "United States;United Kingdom;Singapore" }, { "id": "4YK1e3Ehdy", "title": "Understanding Deep Neural Networks as Dynamical Systems: Insights into Training and Fine-tuning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "This paper offers an interpretation mechanism for understanding deep neural networks and their learning processes from a dynamical perspective. The aim is to uncover the relationship between the representational capacity of neural networks and the dynamical properties of their corresponding dynamical systems. To this end, we first interpret neural networks as dynamical systems by representing neural weight values as relationships among neuronal dynamics. Then, we model both neural network training and inference as the dynamical phenomena occurring within these systems. Built upon this framework, we introduce the concept of dynamical discrepancy, a macroscopic attribute that describes the dynamical states of neurons. Taking the generalization capability of neural models as a starting point, we launch a hypothesis: the dynamical discrepancy of neuromorphic-dynamical systems correlates with the representational capacity of neural models. We conduct dynamics-based conversions on neural structures such as ResNet, ViT, and LLaMA to investigate this hypothesis on MNIST, ImageNet, SQuAD, and IMDB. The experimental fact reveals that the relationship between these neural models' dynamical discrepancy and representational capacity aligns perfectly with our theoretical conjecture. 
Building upon these findings, we introduce a universal analytical approach tailored for neural models.", "keywords": "Interpretation;Dynamical system;Expressive ability", "primary_area": "visualization or interpretation of learned representations", "supplementary_material": "/attachment/d72b32b38ab46172343f42424475889c9e12d1c9.zip", "author": "Shufan Shen;Zhengqi Pei;Shuhui Wang;Qingming Huang", "authorids": "~Shufan_Shen1;~Zhengqi_Pei1;~Shuhui_Wang1;~Qingming_Huang1", "gender": "M;M;M;", "homepage": ";;https://vipl.ict.ac.cn/people/shwang/;https://qmhuang-ucas.github.io/", "dblp": "277/0707;223/2296;37/2537;68/4388", "google_scholar": "https://scholar.google.com/citations?hl=zh-CN;Qs5zacQAAAAJ;h-JxBSYAAAAJ;https://scholar.google.com.hk/citations?user=J1vMnRgAAAAJ", "orcid": ";;0000-0002-5931-0527;", "linkedin": ";;;", "or_profile": "~Shufan_Shen1;~Zhengqi_Pei1;~Shuhui_Wang1;~Qingming_Huang2", "aff": "Institute of Computing Technology, Chinese Academy of Sciences;University of Chinese Academy of Sciences;Institute of Computing Technology, Chinese Academy of Sciences;University of Chinese Academy of Sciences", "aff_domain": "ict.ac.cn;ucas.ac.cn;ict.ac.cn;ucas.ac.cn", "position": "PhD student;MS student;Full Professor;Full Professor", "bibtex": "@misc{\nshen2024understanding,\ntitle={Understanding Deep Neural Networks as Dynamical Systems: Insights into Training and Fine-tuning},\nauthor={Shufan Shen and Zhengqi Pei and Shuhui Wang and Qingming Huang},\nyear={2024},\nurl={https://openreview.net/forum?id=4YK1e3Ehdy}\n}", "github": "", "project": "", "reviewers": "DroU;K7Rz;YDs9;diZv;DpVF", "site": "https://openreview.net/forum?id=4YK1e3Ehdy", "pdf_size": 5740253, "rating": "1;1;3;3;5", "confidence": "2;5;3;4;3", "soundness": "2;1;2;2;2", "contribution": "2;1;2;1;2", "presentation": "1;1;1;1;2", "wc_summary": "32;67;53;97;65", "wc_strengths": "17;12;24;35;127", "wc_weaknesses": "202;281;236;165;79", "wc_questions": "12;7;20;185;50", "wc_review": "263;367;333;482;321", "wc_reply_reviewers": "0;0;0;0;0", "wc_reply_authors": "0;0;0;0;0", "reply_reviewers": "0;0;0;0;0", "reply_authors": "0;0;0;0;0", "rating_avg": [ 2.6, 1.4966629547095767 ], "confidence_avg": [ 3.4, 1.019803902718557 ], "soundness_avg": [ 1.8, 0.4000000000000001 ], "contribution_avg": [ 1.6, 0.4898979485566356 ], "presentation_avg": [ 1.2, 0.4 ], "wc_summary_avg": [ 62.8, 21.15088650624366 ], "wc_strengths_avg": [ 43.0, 42.703629822299646 ], "wc_weaknesses_avg": [ 192.6, 68.488247166941 ], "wc_questions_avg": [ 54.8, 66.78742396589345 ], "wc_review_avg": [ 353.2, 72.60964123310347 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.1572427255082878, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:zFkJi5lbB04J:scholar.google.com/&scioq=Understanding+Deep+Neural+Networks+as+Dynamical+Systems:+Insights+into+Training+and+Fine-tuning&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1;0;1", "aff_unique_norm": "Chinese Academy of Sciences;University of Chinese Academy of Sciences", "aff_unique_dep": "Institute of Computing Technology;", "aff_unique_url": "http://www.ict.ac.cn;http://www.ucas.ac.cn", "aff_unique_abbr": "CAS;UCAS", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "China" }, { "id": "4YgfwJBJeQ", "title": "StructChart: Perception, Structuring, 
Reasoning for Visual Chart Understanding", "track": "main", "status": "Reject", "tldr": "", "abstract": "Charts are common in literature across different scientific fields, conveying rich information easily accessible to readers. Current chart-related tasks focus on either chart perception, which refers to extracting information from the visual charts, or performing reasoning given the extracted data, e.g. in a tabular form. In this paper, we aim to establish a unified and label-efficient learning paradigm for joint perception and reasoning tasks, which can be generally applicable to different downstream tasks, beyond the question-answering task as specifically studied in peer works. Specifically, StructChart first reformulates the chart information from the popular tabular form (specifically linearized CSV) to the proposed Structured Triplet Representations (STR), which is more friendly for reducing the task gap between chart perception and reasoning due to the employed structured information extraction for charts. We then propose a Structuring Chart-oriented Representation Metric (SCRM) to quantitatively evaluate the performance for the chart perception task. To enrich the dataset for training, we further explore the possibility of leveraging the Large Language Model (LLM), enhancing the chart diversity in terms of both chart visual style and its statistical information. Extensive experiments are conducted on various chart-related tasks, demonstrating the effectiveness and promising potential for a unified chart perception-reasoning paradigm to push the frontier of chart understanding.", "keywords": "Chart Perception;Chart Understanding;Simulation-to-Real", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/907ab34604f6a8b336c1b817ad5c2e0719042727.zip", "author": "Renqiu Xia;Bo Zhang;Haoyang Peng;Ning Liao;Peng Ye;Botian Shi;Junchi Yan;Yu Qiao", "authorids": "~Renqiu_Xia2;~Bo_Zhang17;~Haoyang_Peng1;~Ning_Liao1;~Peng_Ye4;~Botian_Shi1;~Junchi_Yan2;~Yu_Qiao1", "gender": ";M;M;M;M;M;;", "homepage": ";https://bobrown.github.io/boZhang.github.io/;https://myaccount.google.com/?hl=en;https://scholar.google.com/citations?user=6aARLhMAAAAJ&hl=zh-CN;;;;", "dblp": ";36/2259-69;;44/1117;53/930-6;245/8742;;", "google_scholar": ";https://scholar.google.com/citations?hl=en;;6aARLhMAAAAJ;UEZZP5QAAAAJ;K0PpvLkAAAAJ;;", "orcid": ";0000-0001-8052-782X;;0000-0002-3764-2555;0000-0002-8486-7562;0000-0003-3677-7252;;", "linkedin": ";;;;;friskit/;;", "or_profile": "~Renqiu_Xia2;~Bo_Zhang17;~Haoyang_Peng1;~Ning_Liao1;~Peng_Ye4;~Botian_Shi1;~Junchi_Yan2;~Yu_Qiao1", "aff": ";Shanghai Artificial Intelligence Laboratory;Fudan University;Shanghai Jiaotong University;Fudan University;Shanghai AI Lab;;", "aff_domain": ";pjlab.org.cn;fudan.edu.cn;sjtu.edu.cn;fudan.edu.cn;pjlab.org.cn;;", "position": ";Researcher;MS student;PhD student;PhD student;Researcher;;", "bibtex": "@misc{\nxia2024structchart,\ntitle={StructChart: Perception, Structuring, Reasoning for Visual Chart Understanding},\nauthor={Renqiu Xia and Bo Zhang and Haoyang Peng and Ning Liao and Peng Ye and Botian Shi and Junchi Yan and Yu Qiao},\nyear={2024},\nurl={https://openreview.net/forum?id=4YgfwJBJeQ}\n}", "github": "", "project": "", "reviewers": "mxZb;Rkaq;ojHH", "site": "https://openreview.net/forum?id=4YgfwJBJeQ", "pdf_size": 2362471, "rating": "5;6;6", "confidence": "3;5;4", "soundness": "2;3;3", "contribution": "2;4;3", "presentation": "3;3;3", "wc_summary":
"121;37;83", "wc_strengths": "56;37;125", "wc_weaknesses": "390;54;50", "wc_questions": "5;4;12", "wc_review": "572;132;270", "wc_reply_reviewers": "0;22;0", "wc_reply_authors": "2068;1188;561", "reply_reviewers": "0;1;0", "reply_authors": "6;5;3", "rating_avg": [ 5.666666666666667, 0.4714045207910317 ], "confidence_avg": [ 4.0, 0.816496580927726 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 3.0, 0.816496580927726 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 80.33333333333333, 34.34465832637669 ], "wc_strengths_avg": [ 72.66666666666667, 37.80946383586463 ], "wc_weaknesses_avg": [ 164.66666666666666, 159.3430959352247 ], "wc_questions_avg": [ 7.0, 3.559026084010437 ], "wc_review_avg": [ 324.6666666666667, 183.74136412057274 ], "wc_reply_reviewers_avg": [ 7.333333333333333, 10.370899457402697 ], "wc_reply_authors_avg": [ 1272.3333333333333, 618.1134379887095 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 4.666666666666667, 1.247219128924647 ], "replies_avg": [ 22, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": 0.8660254037844385, "gs_citation": 30, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=1328798167899051335&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 2, "aff_unique_index": "0;1;2;1;3", "aff_unique_norm": "Shanghai Artificial Intelligence Laboratory;Fudan University;Shanghai Jiao Tong University;Shanghai AI Lab", "aff_unique_dep": ";;;", "aff_unique_url": "http://www.shailab.org/;https://www.fudan.edu.cn;https://www.sjtu.edu.cn;https://www.shanghaiailab.com", "aff_unique_abbr": "Shanghai AI Lab;Fudan;SJTU;SAIL", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "China" }, { "id": "4ZcPYmFsJm", "title": "Geom-Erasing: Geometry-Driven Removal of Implicit Concept in Diffusion Models", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Fine-tuning diffusion models through personalized datasets is an acknowledged method for improving generation quality across downstream tasks, which, however, often inadvertently generates unintended concepts such as watermarks and QR codes, attributed to the limitations in image sources and collecting methods within specific downstream tasks. Existing solutions suffer from eliminating these unintentionally learned implicit concepts, primarily due to the dependency on the model\u2019s ability to recognize concepts that it actually cannot discern. In this work, we introduce GEOM-ERASING, a novel approach that successfully removes the implicit concepts with either an additional accessible classifier or detector model to encode geometric information of these concepts into the text domain. Moreover, we construct three distinct datasets, each imbued with specific implicit concepts (i.e., watermarks, QR codes, and text) for training and evaluation. Experimental results demonstrate that GEOM-ERASING not only identifies but also proficiently eradicates specific implicit concepts, revealing a significant improvement over the existing methods. 
The integration of geometric information marks a substantial progression in the precise removal of implicit concepts in diffusion models.", "keywords": "concept erasure;diffusion model;generative model", "primary_area": "generative models", "supplementary_material": "/attachment/d10fd101d2bb287e5905abd411e84fd95090b0f1.pdf", "author": "Zhili LIU;Kai Chen;Yifan Zhang;Jianhua Han;Lanqing HONG;Hang Xu;Zhenguo Li;Dit-Yan Yeung;James Kwok", "authorids": "~Zhili_LIU1;~Kai_Chen11;~Yifan_Zhang1;~Jianhua_Han1;~Lanqing_HONG1;~Hang_Xu1;~Zhenguo_Li1;~Dit-Yan_Yeung2;~James_Kwok1", "gender": "M;M;M;M;F;M;M;M;", "homepage": "https://capricious-liu.github.io/;https://kaichen1998.github.io/;https://sites.google.com/view/yifan-zhang/%E9%A6%96%E9%A1%B5;;https://racheltechie.github.io/;;http://www.ee.columbia.edu/~zgli/;https://cse.hkust.edu.hk/faculty/dyyeung/;", "dblp": "03/10297;c/KaiChen24;57/4707-4;29/6207;226/4258;;23/6479;41/5668;", "google_scholar": "FdR09jsAAAAJ;3qBfyLIAAAAJ;https://scholar.google.com.hk/citations?user=zuYIUJEAAAAJ;OEPMQEMAAAAJ;https://scholar.google.com.sg/citations?user=2p7x6OUAAAAJ;https://scholar.google.com.hk/citations?user=J_8TX6sAAAAJ;XboZC1AAAAAJ;nEsOOx8AAAAJ;", "orcid": ";;;;;0000-0003-3645-8972;;0000-0003-3716-8125;", "linkedin": "%E6%99%BA%E7%AB%8B-%E5%88%98-49153b167/;;;;;;;;", "or_profile": "~Zhili_LIU1;~Kai_Chen11;~Yifan_Zhang1;~Jianhua_Han1;~Lanqing_HONG1;~Hang_Xu1;~Zhenguo_Li1;~Dit-Yan_Yeung2;~James_Kwok1", "aff": "Hong Kong University of Science and Technology;Hong Kong University of Science and Technology;National University of Singapore;Huawei Technologies Ltd.;Huawei Technologies Ltd.;Huawei Noah\u2018s Ark Lab;Huawei Noah's Ark Lab;Hong Kong University of Science and Technology;", "aff_domain": "hkust.edu;ust.hk;nus.edu;huawei.com;huawei.com;huawei.com;huawei.com;ust.hk;", "position": "PhD student;PhD student;PhD student;Researcher;Researcher;Researcher;Principal Researcher;Chair Professor;", "bibtex": "@misc{\nliu2024geomerasing,\ntitle={Geom-Erasing: Geometry-Driven Removal of Implicit Concept in Diffusion Models},\nauthor={Zhili LIU and Kai Chen and Yifan Zhang and Jianhua Han and Lanqing HONG and Hang Xu and Zhenguo Li and Dit-Yan Yeung and James Kwok},\nyear={2024},\nurl={https://openreview.net/forum?id=4ZcPYmFsJm}\n}", "github": "", "project": "", "reviewers": "ci9W;3V6v;GREc;dnxP", "site": "https://openreview.net/forum?id=4ZcPYmFsJm", "pdf_size": 1568186, "rating": "3;5;5;5", "confidence": "2;3;3;4", "soundness": "3;2;3;2", "contribution": "1;2;2;2", "presentation": "3;3;4;2", "wc_summary": "44;99;60;100", "wc_strengths": "32;56;143;100", "wc_weaknesses": "60;297;112;362", "wc_questions": "32;6;46;4", "wc_review": "168;458;361;566", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.5, 0.8660254037844386 ], "confidence_avg": [ 3.0, 0.7071067811865476 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 75.75, 24.416951079117148 ], "wc_strengths_avg": [ 82.75, 42.48161366991607 ], "wc_weaknesses_avg": [ 207.75, 125.25648685796676 ], "wc_questions_avg": [ 22.0, 17.72004514666935 ], "wc_review_avg": [ 388.25, 146.38369957068306 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 9, 0 ], "corr_rating_confidence": 0.816496580927726, "gs_citation": 
17, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=474392227487030829&as_sdt=5,47&sciodt=0,47&hl=en", "gs_version_total": 0, "aff_unique_index": "0;0;1;2;2;2;2;0", "aff_unique_norm": "Hong Kong University of Science and Technology;National University of Singapore;Huawei", "aff_unique_dep": ";;Huawei Technologies", "aff_unique_url": "https://www.ust.hk;https://www.nus.edu.sg;https://www.huawei.com", "aff_unique_abbr": "HKUST;NUS;Huawei", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Hong Kong SAR;", "aff_country_unique_index": "0;0;1;0;0;0;0;0", "aff_country_unique": "China;Singapore" }, { "title": "Adaptive Instrument Design for Indirect Experiments", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19457", "id": "4Zz5UELkIt", "author_site": "Yash Chandak, Shiv Shankar, Vasilis Syrgkanis, Emma Brunskill", "tldr": "", "abstract": "Indirect experiments provide a valuable framework for estimating treatment effects in situations where conducting randomized control trials (RCTs) is impractical or unethical. Unlike RCTs, indirect experiments estimate treatment effects by leveraging (conditional) instrumental variables, enabling estimation through encouragement and recommendation rather than strict treatment assignment. However, the sample efficiency of such estimators depends not only on the inherent variability in outcomes but also on the varying compliance levels of users with the instrumental variables and the choice of estimator being used, especially when dealing with numerous instrumental variables. While adaptive experiment design has a rich literature for \\textit{direct} experiments, in this paper we take the initial steps towards enhancing sample efficiency for \\textit{indirect} experiments by adaptively designing a data collection policy over instrumental variables. Our main contribution is a practical computational procedure that utilizes influence functions to search for an optimal data collection policy, minimizing the mean-squared error of the desired (non-linear) estimator. 
Through experiments conducted in various domains inspired by real-world applications, we showcase how our method can significantly improve the sample efficiency of indirect experiments.", "keywords": "instrument variable;experiment design;indirect experiments;adaptive design", "primary_area": "causal reasoning", "supplementary_material": "/attachment/1797d39d1ff28743b25f3ea281884f02614a8159.zip", "author": "Yash Chandak;Shiv Shankar;Vasilis Syrgkanis;Emma Brunskill", "authorids": "~Yash_Chandak1;~Shiv_Shankar2;~Vasilis_Syrgkanis1;~Emma_Brunskill2", "gender": ";;;", "homepage": "https://yashchandak.github.io/;;https://www.vsyrgkanis.com;", "dblp": "168/8450;203/9123;;", "google_scholar": "AsgUcSEAAAAJ;;G1WMpcUAAAAJ;", "orcid": ";;;", "linkedin": ";;;", "or_profile": "~Yash_Chandak1;~Shiv_Shankar2;~Vasilis_Syrgkanis1;~Emma_Brunskill2", "aff": "Computer Science Department, Stanford University;IIT Bombay;Stanford University;", "aff_domain": "cs.stanford.edu;iitb.ac.in;stanford.edu;", "position": "Postdoc;Researcher;Assistant Professor;", "bibtex": "@inproceedings{\nchandak2024adaptive,\ntitle={Adaptive Instrument Design for Indirect Experiments},\nauthor={Yash Chandak and Shiv Shankar and Vasilis Syrgkanis and Emma Brunskill},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=4Zz5UELkIt}\n}", "github": "", "project": "", "reviewers": "QTvC;7XxM;ST2k;SUta", "pdf_size": 749001, "rating": "6;6;6;8", "confidence": "3;4;3;3", "soundness": "3;3;3;3", "contribution": "3;3;3;4", "presentation": "3;3;2;4", "wc_summary": "71;64;159;284", "wc_strengths": "41;68;56;100", "wc_weaknesses": "93;281;99;114", "wc_questions": "524;2;52;107", "wc_review": "729;415;366;605", "wc_reply_reviewers": "328;28;0;72", "wc_reply_authors": "3025;643;656;417", "reply_reviewers": "2;1;0;1", "reply_authors": "6;2;2;2", "rating_avg": [ 6.5, 0.8660254037844386 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 3.25, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 144.5, 88.81582066276256 ], "wc_strengths_avg": [ 66.25, 21.706853756359994 ], "wc_weaknesses_avg": [ 146.75, 77.88573361020617 ], "wc_questions_avg": [ 171.25, 207.01856800779973 ], "wc_review_avg": [ 528.75, 146.0656958358122 ], "wc_reply_reviewers_avg": [ 107.0, 130.14991356124673 ], "wc_reply_authors_avg": [ 1185.25, 1066.4226120539643 ], "reply_reviewers_avg": [ 1.0, 0.7071067811865476 ], "reply_authors_avg": [ 3.0, 1.7320508075688772 ], "replies_avg": [ 23, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.3333333333333333, "gs_citation": 6, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=16284860440980537462&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=4Zz5UELkIt", "pdf": "https://openreview.net/pdf?id=4Zz5UELkIt", "email": "cs.stanford.edu;iitb.ac.in;stanford.edu;", "author_num": 4, "aff_unique_index": "0;1;0", "aff_unique_norm": "Stanford University;Indian Institute of Technology Bombay", "aff_unique_dep": "Computer Science Department;", "aff_unique_url": "https://www.stanford.edu;https://www.iitb.ac.in", "aff_unique_abbr": "Stanford;IITB", "aff_campus_unique_index": "0;1;0", "aff_campus_unique": "Stanford;Mumbai", "aff_country_unique_index": "0;1;0", "aff_country_unique": "United States;India" }, { "id": "4aJg9e4nvF", "title": "What do vision transformers learn? 
A visual exploration", "track": "main", "status": "Reject", "tldr": "", "abstract": "Vision transformers (ViTs) are quickly becoming the de-facto architecture for computer vision, yet we understand very little about why they work and what they learn. While existing studies visually analyze the mechanisms of convolutional neural networks, an analogous exploration of ViTs remains challenging. In this paper, we first address the obstacles to performing visualizations on ViTs. Assisted by these solutions, we observe that neurons in ViTs trained with language model supervision (e.g., CLIP) are activated by semantic concepts rather than visual features. We also explore the underlying differences between ViTs and CNNs, and we find that transformers detect image background features, just like their convolutional counterparts, but their predictions depend far less on high-frequency information. On the other hand, both architecture types behave similarly in the way features progress from abstract patterns in early layers to concrete objects in late layers. In addition, we show that ViTs maintain spatial information in all layers except the final layer. In contrast to previous works, we show that the last layer most likely discards the spatial information and behaves as a learned global pooling operation. Finally, we conduct large-scale visualizations on a wide range of ViT variants, including DeiT, CoaT, ConViT, PiT, Swin, and Twin, to validate the effectiveness of our method.", "keywords": "Interpretability;Visualization;Vision Transformers;Computer Vision;Deep Learning", "primary_area": "visualization or interpretation of learned representations", "supplementary_material": "", "author": "Hamid Kazemi;Amin Ghiasi;Eitan Borgnia;Steven Reich;Manli Shu;Micah Goldblum;Andrew Gordon Wilson;Tom Goldstein", "authorids": "~Hamid_Kazemi1;~Amin_Ghiasi1;~Eitan_Borgnia1;~Steven_Reich1;~Manli_Shu1;~Micah_Goldblum1;~Andrew_Gordon_Wilson1;~Tom_Goldstein1", "gender": "M;M;M;M;F;;Not Specified;M", "homepage": ";http://cs.umd.edu/~amin;https://eitanborgnia.com;https://www.cs.umd.edu/people/sreich47;https://azshue.github.io/;;https://cims.nyu.edu/~andrewgw;https://www.cs.umd.edu/~tomg/", "dblp": ";239/8313;;;263/3503;241/7231;65/10453;25/8184", "google_scholar": "7hNdaGQAAAAJ;tNQWOxUAAAAJ;;https://scholar.google.com/citations?view_op=list_works;https://scholar.google.com/citations?hl=en;pGDKzuUAAAAJ;https://scholar.google.com.tw/citations?user=twWX2LIAAAAJ;KmSuVtgAAAAJ", "orcid": ";;;;;;;", "linkedin": "hamid-kazemi-608a8085/;;;;manli-shu-a804a8164/;;;", "or_profile": "~Hamid_Kazemi1;~Amin_Ghiasi1;~Eitan_Borgnia1;~Steven_Reich1;~Manli_Shu1;~Micah_Goldblum1;~Andrew_Gordon_Wilson1;~Tom_Goldstein1", "aff": "University of Maryland, College Park;Apple;University of Chicago;;Department of Computer Science, University of Maryland, College Park;New York University;New York University;University of Maryland, College Park", "aff_domain": "umd.edu;apple.com;uchicago.edu;;cs.umd.edu;nyu.edu;nyu.edu;umd.edu", "position": "PhD student;Researcher;PhD student;;PhD student;Postdoc;Associate Professor;Full Professor", "bibtex": "@misc{\nkazemi2024what,\ntitle={What do vision transformers learn? 
A visual exploration},\nauthor={Hamid Kazemi and Amin Ghiasi and Eitan Borgnia and Steven Reich and Manli Shu and Micah Goldblum and Andrew Gordon Wilson and Tom Goldstein},\nyear={2024},\nurl={https://openreview.net/forum?id=4aJg9e4nvF}\n}", "github": "", "project": "", "reviewers": "ESvq;TawR;f2Nw;Y5ru", "site": "https://openreview.net/forum?id=4aJg9e4nvF", "pdf_size": 32891953, "rating": "3;5;5;6", "confidence": "4;4;4;3", "soundness": "2;3;3;3", "contribution": "1;2;2;3", "presentation": "2;2;3;3", "wc_summary": "71;92;60;120", "wc_strengths": "28;46;159;68", "wc_weaknesses": "198;208;79;74", "wc_questions": "18;27;206;23", "wc_review": "315;373;504;285", "wc_reply_reviewers": "0;103;0;100", "wc_reply_authors": "626;698;542;294", "reply_reviewers": "0;1;0;1", "reply_authors": "1;1;1;1", "rating_avg": [ 4.75, 1.0897247358851685 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 85.75, 22.873292285982796 ], "wc_strengths_avg": [ 75.25, 50.38538974742579 ], "wc_weaknesses_avg": [ 139.75, 63.3733974156349 ], "wc_questions_avg": [ 68.5, 79.44966960283725 ], "wc_review_avg": [ 369.25, 83.98325726000391 ], "wc_reply_reviewers_avg": [ 50.75, 50.76108253376793 ], "wc_reply_authors_avg": [ 540.0, 152.38110119040354 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": -0.6622661785325219, "gs_citation": 69, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6842742910784796915&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 3, "aff_unique_index": "0;1;2;3;4;4;0", "aff_unique_norm": "University of Maryland;Apple;University of Chicago;University of Maryland, College Park;New York University", "aff_unique_dep": ";Apple Inc.;;Department of Computer Science;", "aff_unique_url": "https://www/umd.edu;https://www.apple.com;https://www.uchicago.edu;https://www/umd.edu;https://www.nyu.edu", "aff_unique_abbr": "UMD;Apple;UChicago;UMD;NYU", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "College Park;", "aff_country_unique_index": "0;0;0;0;0;0;0", "aff_country_unique": "United States" }, { "title": "Tackling the Data Heterogeneity in Asynchronous Federated Learning with Cached Update Calibration", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19456", "id": "4aywmeb97I", "author_site": "Yujia Wang, Yuanpu Cao, Jingcheng Wu, Ruoyu Chen, Jinghui Chen", "tldr": "", "abstract": "Asynchronous federated learning, which enables local clients to send their model update asynchronously to the server without waiting for others, has recently emerged for its improved efficiency and scalability over traditional synchronized federated learning. In this paper, we study how the asynchronous delay affects the convergence of asynchronous federated learning under non-i.i.d. distributed data across clients. Through the theoretical convergence analysis of one representative asynchronous federated learning algorithm under standard nonconvex stochastic settings, we show that the asynchronous delay can largely slow down the convergence, especially with high data heterogeneity. To further improve the convergence of asynchronous federated learning under heterogeneous data distributions, we propose a novel asynchronous federated learning method with a cached update calibration. 
Specifically, we let the server cache the latest update for each client and reuse these variables for calibrating the global update at each round. We theoretically prove the convergence acceleration for our proposed method under nonconvex stochastic settings. Extensive experiments on several vision and language tasks demonstrate our superior performances compared to other asynchronous federated learning baselines.", "keywords": "Federated learning;Nonconvex optimization", "primary_area": "optimization", "supplementary_material": "", "author": "Yujia Wang;Yuanpu Cao;Jingcheng Wu;Ruoyu Chen;Jinghui Chen", "authorids": "~Yujia_Wang3;~Yuanpu_Cao1;~Jingcheng_Wu1;~Ruoyu_Chen4;~Jinghui_Chen1", "gender": ";M;M;M;M", "homepage": "https://yujiaw98.github.io/;;https://www.lti.cs.cmu.edu/people/222227896/jingcheng-wu;https://github.com/cryttx;https://jinghuichen.github.io/", "dblp": ";243/0230;;;67/5633", "google_scholar": "0DwROiMAAAAJ;F5S2bO8AAAAJ;;;mKia7Y4AAAAJ", "orcid": ";;;;", "linkedin": ";yuanpu-cao-a392751b2/;;;", "or_profile": "~Yujia_Wang3;~Yuanpu_Cao1;~Jingcheng_Wu1;~Ruoyu_Chen4;~Jinghui_Chen1", "aff": "Pennsylvania State University;Pennsylvania State University;;;Pennsylvania State University", "aff_domain": "psu.edu;psu.edu;;;psu.edu", "position": "PhD student;PhD student;;;Assistant Professor", "bibtex": "@inproceedings{\nwang2024tackling,\ntitle={Tackling the Data Heterogeneity in Asynchronous Federated Learning with Cached Update Calibration},\nauthor={Yujia Wang and Yuanpu Cao and Jingcheng Wu and Ruoyu Chen and Jinghui Chen},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=4aywmeb97I}\n}", "github": "", "project": "", "reviewers": "xHG4;yUBQ;3At2", "pdf_size": 777743, "rating": "6;8;8", "confidence": "3;4;5", "soundness": "3;3;3", "contribution": "3;3;3", "presentation": "2;4;3", "wc_summary": "174;66;111", "wc_strengths": "93;46;82", "wc_weaknesses": "99;128;87", "wc_questions": "145;243;28", "wc_review": "511;483;308", "wc_reply_reviewers": "34;65;12", "wc_reply_authors": "858;1455;519", "reply_reviewers": "1;1;1", "reply_authors": "3;4;2", "rating_avg": [ 7.333333333333333, 0.9428090415820634 ], "confidence_avg": [ 4.0, 0.816496580927726 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 3.0, 0.816496580927726 ], "wc_summary_avg": [ 117.0, 44.294469180700204 ], "wc_strengths_avg": [ 73.66666666666667, 20.07209228976613 ], "wc_weaknesses_avg": [ 104.66666666666667, 17.21110752456745 ], "wc_questions_avg": [ 138.66666666666666, 87.88755442167123 ], "wc_review_avg": [ 434.0, 89.82575725629407 ], "wc_reply_reviewers_avg": [ 37.0, 21.740898478827106 ], "wc_reply_authors_avg": [ 944.0, 386.9289340434494 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 3.0, 0.816496580927726 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.8660254037844385, "gs_citation": 18, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14121697309955840422&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=4aywmeb97I", "pdf": "https://openreview.net/pdf?id=4aywmeb97I", "email": "psu.edu;psu.edu;;;psu.edu", "author_num": 5, "aff_unique_index": "0;0;0", "aff_unique_norm": "Pennsylvania State University", "aff_unique_dep": "", "aff_unique_url": "https://www.psu.edu", "aff_unique_abbr": "PSU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", 
"aff_country_unique": "United States" }, { "title": "EMO: EARTH MOVER DISTANCE OPTIMIZATION FOR AUTO-REGRESSIVE LANGUAGE MODELING", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19455", "id": "4bLXfRd0CX", "author_site": "Siyu Ren, Zhiyong Wu, Kenny Zhu", "tldr": "", "abstract": "Neural language models are probabilistic models of human text. They are predominantly trained using maximum likelihood estimation (MLE), which is equivalent to minimizing the forward cross-entropy between the empirical data distribution and the model distribution. However, various degeneration phenomena are still widely observed when decoding from the distributions learned by such models. We establish that the forward cross-entropy is suboptimal as a distance metric for aligning human and model distribution due to its (1) recall-prioritization (2) negative diversity ignorance and (3) train-test mismatch. In this paper, we propose Earth Mover Distance Optimization (EMO) for auto-regressive language modeling. EMO capitalizes on the inherent properties of earth mover distance to address the aforementioned challenges. Due to the high complexity of direct computation, we further introduce a feasible upper bound for EMO to ease end-to-end training. Upon extensive evaluation of language models trained using EMO and MLE. We find that EMO demonstrates a consistently better language modeling performance than MLE across domains. Moreover, EMO demonstrates noteworthy enhancements in downstream performance with minimal fine-tuning on merely 25,000 sentences. This highlights the tremendous potential of EMO as a lightweight calibration method for enhancing large-scale pre-trained language models.", "keywords": "language modeling;earth mover distance;language generation;language understanding", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Siyu Ren;Zhiyong Wu;Kenny Q. Zhu", "authorids": "~Siyu_Ren1;~Zhiyong_Wu3;~Kenny_Q._Zhu1", "gender": "M;;M", "homepage": "https://drsy.github.io/;;http://www.cs.sjtu.edu.cn/~kzhu/", "dblp": ";;z/KennyQiliZhu", "google_scholar": "jkJDyrkAAAAJ;;https://scholar.google.com.tw/citations?user=ZIRJ6lIAAAAJ", "orcid": ";;", "linkedin": ";;", "or_profile": "~Siyu_Ren1;~Zhiyong_Wu3;~Kenny_Q._Zhu1", "aff": "Shanghai Jiaotong University;;University of Texas at Arlington", "aff_domain": "sjtu.edu.cn;;uta.edu", "position": "PhD student;;Full Professor", "bibtex": "@inproceedings{\nren2024emo,\ntitle={{EMO}: {EARTH} {MOVER} {DISTANCE} {OPTIMIZATION} {FOR} {AUTO}-{REGRESSIVE} {LANGUAGE} {MODELING}},\nauthor={Siyu Ren and Zhiyong Wu and Kenny Q. 
Zhu},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=4bLXfRd0CX}\n}", "github": "", "project": "", "reviewers": "XE26;JZqx;TjsD;2RWM", "pdf_size": 640517, "rating": "3;6;6;8", "confidence": "4;4;4;4", "soundness": "1;4;3;4", "contribution": "2;2;3;3", "presentation": "3;4;3;4", "wc_summary": "68;44;56;102", "wc_strengths": "11;80;36;22", "wc_weaknesses": "235;109;147;96", "wc_questions": "1;86;33;25", "wc_review": "315;319;272;245", "wc_reply_reviewers": "765;161;201;0", "wc_reply_authors": "1674;1045;1156;442", "reply_reviewers": "3;3;2;0", "reply_authors": "3;4;3;1", "rating_avg": [ 5.75, 1.7853571071357126 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 3.0, 1.224744871391589 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.5, 0.5 ], "wc_summary_avg": [ 67.5, 21.650635094610966 ], "wc_strengths_avg": [ 37.25, 26.223796445213647 ], "wc_weaknesses_avg": [ 146.75, 54.28800512083678 ], "wc_questions_avg": [ 36.25, 31.04331651096577 ], "wc_review_avg": [ 287.75, 30.80077109424373 ], "wc_reply_reviewers_avg": [ 281.75, 288.97004602553534 ], "wc_reply_authors_avg": [ 1079.25, 437.8580677571215 ], "reply_reviewers_avg": [ 2.0, 1.224744871391589 ], "reply_authors_avg": [ 2.75, 1.0897247358851685 ], "replies_avg": [ 28, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 6, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12705620678870906094&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=4bLXfRd0CX", "pdf": "https://openreview.net/pdf?id=4bLXfRd0CX", "email": "sjtu.edu.cn;;uta.edu", "author_num": 3, "aff_unique_index": "0;1", "aff_unique_norm": "Shanghai Jiao Tong University;University of Texas at Arlington", "aff_unique_dep": ";", "aff_unique_url": "https://www.sjtu.edu.cn;https://www.uta.edu", "aff_unique_abbr": "SJTU;UTA", "aff_campus_unique_index": "1", "aff_campus_unique": ";Arlington", "aff_country_unique_index": "0;1", "aff_country_unique": "China;United States" }, { "title": "Going Beyond Neural Network Feature Similarity: The Network Feature Complexity and Its Interpretation Using Category Theory", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19454", "id": "4bSQ3lsfEV", "author_site": "Yiting Chen, Zhanpeng Zhou, Junchi Yan", "tldr": "", "abstract": "The behavior of neural networks still remains opaque, and a recently widely noted phenomenon is that networks often achieve similar performance when initialized with different random parameters. This phenomenon has attracted significant attention in measuring the similarity between features learned by distinct networks. However, feature similarity could be vague in describing the same feature since equivalent features hardly exist. In this paper, we expand the concept of equivalent feature and provide the definition of what we call *functionally equivalent features*. These features produce equivalent output under certain transformations. \nUsing this definition, we aim to derive a more intrinsic metric for the so-called *feature complexity* regarding the redundancy of features learned by a neural network at each layer. We offer a formal interpretation of our approach through the lens of category theory, a well-developed area in mathematics. To quantify the feature complexity, we further propose an efficient algorithm named Iterative Feature Merging. 
Our experimental results validate our ideas and theories from various perspectives. We empirically demonstrate that the functionally equivalence widely exists among different features learned by the same neural network and we could reduce the number of parameters of the network without affecting the performance. We have also drawn several interesting empirical findings, including: \n1) the larger the network, the more redundant features it learns; 2) in particular, we show how to prune the networks based on our finding using direct equivalent feature merging, without fine-tuning which is often needed in peer network pruning methods; 3) same structured networks with higher feature complexity achieve better performance; 4) through the layers of a neural network, the feature complexity first increase then decrease; 5) for the image classification task, a group of functionally equivalent features may correspond to a specific semantic meaning. Source code will be made publicly available.", "keywords": "Category Theory; Neural Networks Feature Complexity", "primary_area": "visualization or interpretation of learned representations", "supplementary_material": "", "author": "Yiting Chen;Zhanpeng Zhou;Junchi Yan", "authorids": "~Yiting_Chen1;~Zhanpeng_Zhou1;~Junchi_Yan2", "gender": "M;M;M", "homepage": "https://ytchen981.github.io/;https://zzp1012.github.io/;http://thinklab.sjtu.edu.cn/", "dblp": "135/6971;;60/7949.html", "google_scholar": "https://scholar.google.com/citations?hl=zh-CN;idxXY3UAAAAJ;ga230VoAAAAJ", "orcid": ";;0000-0001-9639-7679", "linkedin": ";;", "or_profile": "~Yiting_Chen1;~Zhanpeng_Zhou1;~Junchi_Yan1", "aff": "Shanghai Jiaotong University;Shanghai Jiaotong University;Shanghai Jiaotong University", "aff_domain": "sjtu.edu.cn;sjtu.edu.cn;sjtu.edu.cn", "position": "PhD student;PhD student;Full Professor", "bibtex": "@inproceedings{\nchen2024going,\ntitle={Going Beyond Neural Network Feature Similarity: The Network Feature Complexity and Its Interpretation Using Category Theory},\nauthor={Yiting Chen and Zhanpeng Zhou and Junchi Yan},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=4bSQ3lsfEV}\n}", "github": "", "project": "", "reviewers": "R8Xc;QeEM;oxNv;Po5f", "pdf_size": 1034460, "rating": "3;6;6;8", "confidence": "4;4;4;4", "soundness": "2;3;3;3", "contribution": "1;2;3;3", "presentation": "2;2;3;3", "wc_summary": "92;63;228;87", "wc_strengths": "51;50;54;92", "wc_weaknesses": "219;124;263;163", "wc_questions": "112;127;17;23", "wc_review": "474;364;562;365", "wc_reply_reviewers": "193;24;0;0", "wc_reply_authors": "1528;842;591;505", "reply_reviewers": "1;1;0;0", "reply_authors": "3;2;2;1", "rating_avg": [ 5.75, 1.7853571071357126 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.82915619758885 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 117.5, 64.73214039408862 ], "wc_strengths_avg": [ 61.75, 17.52676524633111 ], "wc_weaknesses_avg": [ 192.25, 52.99705180479382 ], "wc_questions_avg": [ 69.75, 50.07681599303214 ], "wc_review_avg": [ 441.25, 82.8171932632349 ], "wc_reply_reviewers_avg": [ 54.25, 80.70432144563264 ], "wc_reply_authors_avg": [ 866.5, 401.48630113616576 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 2.0, 0.7071067811865476 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 7, "gs_cited_by_link": 
"https://scholar.google.com/scholar?cites=16979939216988961962&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=4bSQ3lsfEV", "pdf": "https://openreview.net/pdf?id=4bSQ3lsfEV", "email": "sjtu.edu.cn;sjtu.edu.cn;sjtu.edu.cn", "author_num": 3, "aff_unique_index": "0;0;0", "aff_unique_norm": "Shanghai Jiao Tong University", "aff_unique_dep": "", "aff_unique_url": "https://www.sjtu.edu.cn", "aff_unique_abbr": "SJTU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "China" }, { "id": "4bUeP3qrNu", "title": "A Systematic Comparison of Syllogistic Reasoning in Humans and Language Models", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "A central component of rational behavior is logical inference: the process of determining which conclusions follow from a set of premises. Psychologists have documented several ways in which humans' inferences deviate from the rules of logic. Do language models, which are trained on text generated by humans, replicate these biases, or are they able to overcome them? Focusing on the case of syllogisms -inferences from two simple premises, which have been studied extensively in psychology - we show that larger models are more logical than smaller ones, and also more logical than humans. At the same time, even the largest models make systematic errors, some of which mirror human reasoning biases such as ordering effects and logical fallacies. Overall, we find that language models mimic the human biases included in their training data, but are able to overcome them in some cases.", "keywords": "Language models;Logic;Reasoning;Syllogisms;Cognitive Science", "primary_area": "applications to neuroscience & cognitive science", "supplementary_material": "", "author": "Tiwalayo Eisape;Michael Henry Tessler;Fei Sha;Ishita Dasgupta;Sjoerd van Steenkiste;Tal Linzen", "authorids": "~Tiwalayo_Eisape1;~Michael_Henry_Tessler1;~Fei_Sha3;~Ishita_Dasgupta1;~Sjoerd_van_Steenkiste1;~Tal_Linzen1", "gender": ";M;;M;M;M", "homepage": "https://eisape.github.io/;https://www.mit.edu/~tessler/;;http://www.sjoerdvansteenkiste.com/;http://tallinzen.net;http://feisha.org", "dblp": ";;169/6218;183/9326;169/3438;13/3601", "google_scholar": ";DQjm2rAAAAAJ;;i-AStBYAAAAJ;5mJDXjoAAAAJ;HDHOS0QAAAAJ", "orcid": ";;;;;", "linkedin": "eisape/;;idasgupta6/;;;", "or_profile": "~Tiwalayo_Eisape1;~Michael_Henry_Tessler1;~Ishita_Dasgupta1;~Sjoerd_van_Steenkiste1;~Tal_Linzen1;~Fei_Sha2", "aff": "Massachusetts Institute of Technology;Google DeepMind;Google DeepMind;Google;Google;Google", "aff_domain": "mit.edu;deepmind.com;deepmind.com;google.com;google.com;google.com", "position": "PhD student;Researcher;Researcher;Researcher;Researcher;research scientist", "bibtex": "@misc{\neisape2024a,\ntitle={A Systematic Comparison of Syllogistic Reasoning in Humans and Language Models},\nauthor={Tiwalayo Eisape and Michael Henry Tessler and Fei Sha and Ishita Dasgupta and Sjoerd van Steenkiste and Tal Linzen},\nyear={2024},\nurl={https://openreview.net/forum?id=4bUeP3qrNu}\n}", "github": "", "project": "", "reviewers": "Q1gw;acDo;Wr2g;hrcw", "site": "https://openreview.net/forum?id=4bUeP3qrNu", "pdf_size": 3784401, "rating": "3;3;5;6", "confidence": "4;4;3;3", "soundness": "1;2;4;3", "contribution": "3;2;2;3", "presentation": "4;3;3;3", "wc_summary": "42;70;53;119", "wc_strengths": "23;58;64;66", "wc_weaknesses": "179;178;89;180", "wc_questions": "5;65;2;93", "wc_review": "249;371;208;458", 
"wc_reply_reviewers": "187;0;0;0", "wc_reply_authors": "500;942;326;804", "reply_reviewers": "1;0;0;0", "reply_authors": "1;2;1;1", "rating_avg": [ 4.25, 1.299038105676658 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.5, 1.118033988749895 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 71.0, 29.45335295004628 ], "wc_strengths_avg": [ 52.75, 17.426631917843448 ], "wc_weaknesses_avg": [ 156.5, 38.977557645393844 ], "wc_questions_avg": [ 41.25, 39.04084399702445 ], "wc_review_avg": [ 321.5, 99.02146232004453 ], "wc_reply_reviewers_avg": [ 46.75, 80.97337525384502 ], "wc_reply_authors_avg": [ 643.0, 243.03291958086666 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 10, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.9622504486493761, "gs_citation": 19, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=1488268212595618188&as_sdt=5,48&sciodt=0,48&hl=en", "gs_version_total": 5, "aff_unique_index": "0;1;1;1;1;1", "aff_unique_norm": "Massachusetts Institute of Technology;Google", "aff_unique_dep": ";Google DeepMind", "aff_unique_url": "https://web.mit.edu;https://deepmind.com", "aff_unique_abbr": "MIT;DeepMind", "aff_campus_unique_index": "1;1;1", "aff_campus_unique": ";Mountain View", "aff_country_unique_index": "0;1;1;0;0;0", "aff_country_unique": "United States;United Kingdom" }, { "id": "4bat0pSQBq", "title": "FLOOD SIMULATION WITH PHYSICS-INFORMED MESSAGE PASSING", "track": "main", "status": "Reject", "tldr": "", "abstract": "Flood modeling is an important tool for supporting preventive and emergency\nmeasures to mitigate flood risks. Recently, there has been an increasing interest\nin exploring machine learning-based models as an alternative to traditional hydrodynamic models for flood simulation to address challenges such as scalability and accuracy. However, current ML approaches are ineffective at modeling early stages of flooding events, limiting their ability to simulate the entire evolution of the flood. Another key challenge is how to incorporate physics domain-knowledge into these data-driven models. In this paper, we address these challenges by introducing a physics-inspired graph neural network for flood simulation. Given a (geographical) region and precipitation data, our model predicts water depths in an autoregressive fashion. We propose a message-passing framework inspired by the conservation of momentum and mass expressed in the shallow-water equations, which describe the physical process of a flooding event. 
Empirical results on a dataset covering 9 regions and 7 historical precipitation events demonstrate that our model outperforms the best baseline, and is able to capture the propagation of water flow better, especially at the very early stage of the flooding event.", "keywords": "Physics-informed GNN;flood simulation;PDEs", "primary_area": "applications to physical sciences (physics, chemistry, biology, etc.)", "supplementary_material": "", "author": "Arnold Kazadi;James Doss-Gollin;Arlei Lopes da Silva", "authorids": "~Arnold_Kazadi1;jdossgollin@rice.edu;~Arlei_Lopes_da_Silva1", "gender": ";;M", "homepage": "https://kanz76.github.io/;;https://cs.rice.edu/~al110/index.html", "dblp": ";;19/2546", "google_scholar": "8K_HYF8AAAAJ;;atGtis4AAAAJ", "orcid": "0000-0002-9690-5212;;0000-0003-1792-0076", "linkedin": ";;", "or_profile": "~Arnold_Kazadi1;jdossgollin@rice.edu;~Arlei_Lopes_da_Silva1", "aff": "Rice University;;Rice University", "aff_domain": "rice.edu;;rice.edu", "position": "PhD student;;Assistant Professor", "bibtex": "@misc{\nkazadi2024flood,\ntitle={{FLOOD} {SIMULATION} {WITH} {PHYSICS}-{INFORMED} {MESSAGE} {PASSING}},\nauthor={Arnold Kazadi and James Doss-Gollin and Arlei Lopes da Silva},\nyear={2024},\nurl={https://openreview.net/forum?id=4bat0pSQBq}\n}", "github": "", "project": "", "reviewers": "rnbK;j8ny;g1kJ;iyD6", "site": "https://openreview.net/forum?id=4bat0pSQBq", "pdf_size": 6725532, "rating": "3;5;5;5", "confidence": "3;4;4;4", "soundness": "3;2;2;3", "contribution": "2;3;2;2", "presentation": "3;3;4;3", "wc_summary": "137;99;193;110", "wc_strengths": "69;68;72;125", "wc_weaknesses": "237;129;385;591", "wc_questions": "90;145;209;236", "wc_review": "533;441;859;1062", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "428;688;794;776", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 4.5, 0.8660254037844386 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 134.75, 36.36189626518397 ], "wc_strengths_avg": [ 83.5, 24.005207768315607 ], "wc_weaknesses_avg": [ 335.5, 173.25919888998678 ], "wc_questions_avg": [ 170.0, 56.79348554191757 ], "wc_review_avg": [ 723.75, 249.51891210888203 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 671.5, 146.19422013198744 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 10, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 1.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:82NQ0Rn2MSwJ:scholar.google.com/&scioq=FLOOD+SIMULATION+WITH+PHYSICS-INFORMED+MESSAGE+PASSING&hl=en&as_sdt=0,44", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "Rice University", "aff_unique_dep": "", "aff_unique_url": "https://www.rice.edu", "aff_unique_abbr": "Rice", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "id": "4cUuvzIxOW", "title": "Unveiling the Potential of Probabilistic Embeddings in Self-Supervised Learning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "In recent years, self-supervised learning has played a pivotal role in advancing machine learning by allowing models to acquire meaningful representations from unlabeled data. 
An intriguing research avenue involves developing self-supervised models within an information-theoretic framework, but many studies often deviate from the stochasticity assumptions made when deriving their objectives. To gain deeper insights into this issue, we propose to explicitly model the representation with stochastic embeddings and assess their effects on performance, information compression and potential for out-of-distribution detection. From an information-theoretic perspective, we seek to unravel the relationships between stochastic embeddings and the regularization mechanisms of Barlow Twins and VICReg and investigate the impact of probabilistic modeling on the information bottleneck, shedding light on a trade-off between compression and preservation of relevant information in both representation and loss space. Emphasizing the importance of distinguishing between these two spaces, we demonstrate how constraining one can affect the other, potentially leading to performance degradation. Moreover, our findings suggest that introducing an additional bottleneck in the loss space can significantly enhance the ability to detect out-of-distribution examples, only leveraging either representation features or the variance of their underlying distribution.", "keywords": "self-supervised learning;information bottleneck;probabilistic embeddings;computer vision", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Denis Janiak;Jakub Binkowski;Piotr Bielak;Tomasz Jan Kajdanowicz", "authorids": "~Denis_Janiak1;~Jakub_Binkowski1;~Piotr_Bielak1;~Tomasz_Jan_Kajdanowicz1", "gender": "M;M;;M", "homepage": ";;https://piotrbielak.com/;http://www.kajdanowicz.com", "dblp": "306/8791;306/9925;;74/608", "google_scholar": "ICTlqh0AAAAJ;yFzn0owAAAAJ;https://scholar.google.ca/citations?user=Z0lkjn0AAAAJ;GOoaHHEAAAAJ", "orcid": ";0000-0001-7386-5150;;0000-0002-8417-1012", "linkedin": "denis-janiak-4a7b7a159/;;;kajdanowicz", "or_profile": "~Denis_Janiak1;~Jakub_Binkowski1;~Piotr_Bielak1;~Tomasz_Jan_Kajdanowicz1", "aff": "Wroclaw University of Science and Technology;Technical University of Wroclaw;Wroclaw University of Science and Technology;Wroclaw University of Science and Technology", "aff_domain": "pwr.edu.pl;pwr.edu.pl;pwr.edu.pl;pwr.edu.pl", "position": "PhD student;PhD student;PhD student;Associate Professor", "bibtex": "@misc{\njaniak2024unveiling,\ntitle={Unveiling the Potential of Probabilistic Embeddings in Self-Supervised Learning},\nauthor={Denis Janiak and Jakub Binkowski and Piotr Bielak and Tomasz Jan Kajdanowicz},\nyear={2024},\nurl={https://openreview.net/forum?id=4cUuvzIxOW}\n}", "github": "", "project": "", "reviewers": "", "site": "https://openreview.net/forum?id=4cUuvzIxOW", "pdf_size": 0, "rating": "", "confidence": "", "soundness": "", "contribution": "", "presentation": "", "wc_summary": "", "wc_strengths": "", "wc_weaknesses": "", "wc_questions": "", "wc_review": "", "wc_reply_reviewers": "", "wc_reply_authors": "", "reply_reviewers": "", "reply_authors": "", "rating_avg": [ 0, 0 ], "confidence_avg": [ 0, 0 ], "soundness_avg": [ 0, 0 ], "contribution_avg": [ 0, 0 ], "presentation_avg": [ 0, 0 ], "wc_summary_avg": [ 0, 0 ], "wc_strengths_avg": [ 0, 0 ], "wc_weaknesses_avg": [ 0, 0 ], "wc_questions_avg": [ 0, 0 ], "wc_review_avg": [ 0, 0 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 0, 
0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:-OjeBM2rFT0J:scholar.google.com/&scioq=Unveiling+the+Potential+of+Probabilistic+Embeddings+in+Self-Supervised+Learning&hl=en&as_sdt=0,5", "gs_version_total": 3, "aff_unique_index": "0;1;0;0", "aff_unique_norm": "Wroclaw University of Science and Technology;Wroclaw University of Technology", "aff_unique_dep": ";", "aff_unique_url": "https://www.pwr.edu.pl;https://www.pwr.edu.pl", "aff_unique_abbr": "WUST;WUT", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "Poland" }, { "id": "4d32Ufnoxb", "title": "Enhancing Graph Tasks with a Dual-Block Graph Transformer: A Synergistic Approach to Local and Global Attention", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "In this work, we address the limitations of traditional Transformers in graph tasks. While some approaches predominantly leverage local attention mechanisms akin to Graph Neural Networks (GNNs), often neglecting the global attention capabilities inherent in the Transformer model. Conversely, other methods overly focus on the global attention aspect of the Transformer, ignoring the importance of local attention mechanisms in the context of graph structure. To this end, we propose a novel Message Passing Transformer with strategic modifications to the original Transformer, significantly enhancing its performance on graph tasks by improving the handling of local attention. Building on this, we further propose a novel Dual-Block Graph Transformer that synergistically integrates local and global attention mechanisms. This architecture comprises two distinct blocks inside each head: the Message Passing Block, designed to emulate local attention, and a second block that encapsulates the global attention mechanism. This dual-block design inside each head enables our model to capture both fine-grained local and high-level global interactions in graph tasks, leading to a more comprehensive and robust graph representation. We empirically validate our model on node classification tasks, particularly on heterophilic graphs, and graph classification tasks. The results demonstrate that our Dual-Block Graph Transformer significantly outperforms both GNN and Graph Transformer models. 
Remarkably, this superior performance is achieved without the necessity for complex positional encoding strategies, underscoring the efficacy of our approach.", "keywords": "Graph Transformer;Transformer;Graph Learning;Semi-supervised", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Shihan Guan;Lei Song;Xin Chen;Yueying Li;Qinghua Si;Laurent Albera;R\u00e9gine LE BOUQUIN JEANN\u00c8S;Youyong Kong;Huazhong Shu", "authorids": "~Shihan_Guan1;~Lei_Song1;~Xin_Chen33;~Yueying_Li2;~Qinghua_Si1;~Laurent_Albera1;~R\u00e9gine_LE_BOUQUIN_JEANN\u00c8S1;~Youyong_Kong1;~Huazhong_Shu1", "gender": "M;M;M;F;M;;F;M;M", "homepage": "https://orcid.org/0000-0003-3563-5308;;;;https://github.com/smqh2165;https://perso.univ-rennes1.fr/laurent.albera/;https://esir.univ-rennes.fr/node/58;https://cse.seu.edu.cn/2023/1024/c23024a469537/page.htm;https://cse.seu.edu.cn/", "dblp": ";;;https://dblp.org/rec/journals/kbs/LiLZZ21;;;;154/7641;", "google_scholar": ";https://scholar.google.com/citations?hl=zh-CN;;;;;;;Fsc-Sa4AAAAJ", "orcid": "0000-0003-3563-5308;0000-0003-2044-3311;0000-0001-5772-9917;0000-0002-5327-8511;;;0000-0002-4050-2895;;", "linkedin": ";;;;;;;;", "or_profile": "~Shihan_Guan1;~Lei_Song1;~Xin_Chen33;~Yueying_Li2;~Qinghua_Si1;~Laurent_Albera1;~R\u00e9gine_LE_BOUQUIN_JEANN\u00c8S1;~Youyong_Kong1;~Huazhong_Shu1", "aff": "Southeast University;Southeast University;Southeast University;Southeast University;Southeast University;University of Rennes;Universit\u00e9 de Rennes, France;Southeast University;Southeast University", "aff_domain": "seu.edu.cn;seu.edu.cn;seu.edu.cn;seu.edu.cn;seu.edu.cn;univ-rennes.fr;univ-rennes.fr;seu.edu.cn;seu.edu.cn", "position": "PhD student;PhD student;PhD student;PhD student;MS student;Full Professor;Full Professor;Associate Professor;Full Professor", "bibtex": "@misc{\nguan2024enhancing,\ntitle={Enhancing Graph Tasks with a Dual-Block Graph Transformer: A Synergistic Approach to Local and Global Attention},\nauthor={Shihan Guan and Lei Song and Xin Chen and Yueying Li and Qinghua Si and Laurent Albera and R{\\'e}gine LE BOUQUIN JEANN{\\`E}S and Youyong Kong and Huazhong Shu},\nyear={2024},\nurl={https://openreview.net/forum?id=4d32Ufnoxb}\n}", "github": "", "project": "", "reviewers": "PHGs;NDKD;5j2q;wt2P;GViT", "site": "https://openreview.net/forum?id=4d32Ufnoxb", "pdf_size": 1296110, "rating": "3;3;3;5;5", "confidence": "5;5;4;4;4", "soundness": "3;2;2;2;3", "contribution": "2;1;2;2;2", "presentation": "3;2;3;3;3", "wc_summary": "97;105;48;61;70", "wc_strengths": "74;34;27;25;23", "wc_weaknesses": "315;94;87;86;95", "wc_questions": "3;208;7;45;57", "wc_review": "489;441;169;217;245", "wc_reply_reviewers": "0;0;0;0;0", "wc_reply_authors": "0;0;0;0;0", "reply_reviewers": "0;0;0;0;0", "reply_authors": "0;0;0;0;0", "rating_avg": [ 3.8, 0.9797958971132712 ], "confidence_avg": [ 4.4, 0.48989794855663565 ], "soundness_avg": [ 2.4, 0.4898979485566356 ], "contribution_avg": [ 1.8, 0.4000000000000001 ], "presentation_avg": [ 2.8, 0.39999999999999997 ], "wc_summary_avg": [ 76.2, 21.572204337990126 ], "wc_strengths_avg": [ 36.6, 19.06410239166796 ], "wc_weaknesses_avg": [ 135.4, 89.87235392488616 ], "wc_questions_avg": [ 64.0, 74.98799903984637 ], "wc_review_avg": [ 312.2, 128.00999960940553 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 9, 0 ], 
"corr_rating_confidence": -0.6666666666666665, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:bgMoNg1HgoAJ:scholar.google.com/&scioq=Enhancing+Graph+Tasks+with+a+Dual-Block+Graph+Transformer:+A+Synergistic+Approach+to+Local+and+Global+Attention&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;0;0;0;0;1;2;0;0", "aff_unique_norm": "Southeast University;University of Rennes;Universit\u00e9 de Rennes", "aff_unique_dep": ";;", "aff_unique_url": "https://www.seu.edu.cn/;https://www.univ-rennes1.fr;https://www.univ-rennes1.fr", "aff_unique_abbr": "SEU;UR1;UR1", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;1;1;0;0", "aff_country_unique": "China;France" }, { "id": "4dw16l4iqC", "title": "Adapting ConvNets for New Cameras without Retraining", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "In the vast majority of research, it is assumed images will be perspective or can be rectified to a perspective projection. However, in many applications it is beneficial to use non conventional cameras, such as fisheye cameras, that have a larger field of view (FOV). The issue arises that these large FOV images can't be rectified to a perspective projection without significant cropping of the original image. To address this issue we propose Rectify Convolutions (RectConv); a new approach for adapting pre-trained convolutional networks to operate with new non-perspective images, without any retraining. Replacing the convolutional layers of the network with RectConv layers allows the network to see both rectified patches and the entire FOV. We demonstrate RectConv adapting multiple pre-trained networks to perform segmentation and detection on fisheye imagery from two publicly available datasets. Our method shows improved results over both direct application of the network and naive pre-rectification of imagery. Our approach requires no additional data or training, and we develop a software tool that transforms existing pre-trained networks to operate on new camera geometries. We believe this work is a significant step toward adapting the vast resources available for perspective images to operate across a broad range of camera geometries. Code available upon acceptance.", "keywords": "Convolutional Networks;Pretrained;Wide FOV;Fisheye;Segmentation;Rectification", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Ryan Griffiths;Donald G. Dansereau", "authorids": "~Ryan_Griffiths1;~Donald_G._Dansereau1", "gender": "M;M", "homepage": "https://ryanbgriffiths.github.io;http://roboticimaging.org", "dblp": ";27/5079G", "google_scholar": "OfqJfm8AAAAJ;MVfxch0AAAAJ", "orcid": ";0000-0003-2540-1639", "linkedin": ";donald-dansereau/", "or_profile": "~Ryan_Griffiths1;~Donald_Gilbert_Dansereau1", "aff": "University of Sydney;University of Sydney", "aff_domain": "usyd.edu.au;sydney.edu.au", "position": "PhD student;Senior Lecturer", "bibtex": "@misc{\ngriffiths2024adapting,\ntitle={Adapting ConvNets for New Cameras without Retraining},\nauthor={Ryan Griffiths and Donald G. 
Dansereau},\nyear={2024},\nurl={https://openreview.net/forum?id=4dw16l4iqC}\n}", "github": "", "project": "", "reviewers": "v97K;Vp9L;v5En;Qoap", "site": "https://openreview.net/forum?id=4dw16l4iqC", "pdf_size": 25776189, "rating": "1;3;5;5", "confidence": "4;5;5;4", "soundness": "2;3;3;2", "contribution": "2;1;2;3", "presentation": "2;3;3;3", "wc_summary": "104;112;63;162", "wc_strengths": "16;28;66;70", "wc_weaknesses": "174;267;334;182", "wc_questions": "23;71;23;77", "wc_review": "317;478;486;491", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 3.5, 1.6583123951777 ], "confidence_avg": [ 4.5, 0.5 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 110.25, 35.187888541371734 ], "wc_strengths_avg": [ 45.0, 23.430749027719962 ], "wc_weaknesses_avg": [ 239.25, 65.73193668225515 ], "wc_questions_avg": [ 48.5, 25.588083163847973 ], "wc_review_avg": [ 443.0, 72.89375830618147 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.30151134457776363, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:f4fcP470nUwJ:scholar.google.com/&scioq=Adapting+ConvNets+for+New+Cameras+without+Retraining&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "University of Sydney", "aff_unique_dep": "", "aff_unique_url": "https://www.sydney.edu.au", "aff_unique_abbr": "USYD", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "Australia" }, { "id": "4e0ItHjNo9", "title": "Rethinking Counterfactual Fairness: On Which Individuals to Enforce, and How?", "track": "main", "status": "Reject", "tldr": "", "abstract": "Fairness in human and algorithmic decision-making is crucial in areas such as criminal justice, education, and social welfare. Recently, counterfactual fairness has drawn increasing research interest, suggesting that decision-making for individuals should remain the same when intervening with different values on the protected attributes. Nevertheless, the question of \"which attributes and individuals should be protected\" is rarely discussed in the existing counterfactual fairness literature. For example, when considering leg disability as a protected attribute, the algorithms should not treat individuals with leg disabilities differently in college admissions, but one may naturally take into this factor for the purpose of selecting runner athletes. In other words, when and how to enforce fairness is expected to depend on the causal relation between the protected attribute and the outcome of interest. Formally, this paper proposes principal counterfactual fairness using the concept of principal stratification from the causal inference literature, focusing on whether an algorithm is counterfactually fair for individuals whose protected attribute has no individual causal effect on the outcome of interest. To examine whether an algorithm satisfies principal counterfactual fairness, we derive the statistical bounds, and propose a post-processing approach to achieving principal counterfactual fairness with minimal individual decision changes. 
Experiments are conducted using synthetic and real-world datasets to verify the effectiveness of our methods.", "keywords": "counterfactual fairness;fairness;causal effect;principal stratification", "primary_area": "causal reasoning", "supplementary_material": "", "author": "Haoxuan Li;Chunyuan Zheng;Zhichao Jiang;Zhuangyan Fang;Yue Liu;Zhi Geng;Kun Zhang", "authorids": "~Haoxuan_Li6;~Chunyuan_Zheng1;~Zhichao_Jiang2;~Zhuangyan_Fang1;~Yue_Liu9;~Zhi_Geng1;~Kun_Zhang1", "gender": "M;M;M;M;;M;M", "homepage": "https://haoxuanli-pku.github.io/;;https://zhichaoj-git.github.io;https://www.semanticscholar.org/author/Zhuangyan-Fang/1382582145;;https://stxy.btbu.edu.cn/szdw/bssds/34339356074b408c8650309f05f24558.htm;http://www.andrew.cmu.edu/user/kunz1/", "dblp": "145/4965-1.html;;;https://dblp.uni-trier.de/pid/251/3212;;;96/3115-1", "google_scholar": "gtDqiucAAAAJ;https://scholar.google.com/citations?hl=en;;https://scholar.google.com/citations?hl=zh-CN;;;RGoypN4AAAAJ", "orcid": "0000-0003-3620-3769;0000-0002-0306-7310;;;;;", "linkedin": ";;;;;;", "or_profile": "~Haoxuan_Li6;~Chunyuan_Zheng1;~Zhichao_Jiang2;~Zhuangyan_Fang1;~Yue_Liu9;~Zhi_Geng1;~Kun_Zhang1", "aff": "Peking University;Peking University;SUN YAT-SEN UNIVERSITY;Xiaomi ;;School of mathematical Science, Peking University, Peking University;Carnegie Mellon University", "aff_domain": "pku.edu.cn;stu.pku.edu.cn;sysu.edu.cn;xiaomi.com;;math.pku.edu.cn;cmu.edu", "position": "PhD student;PhD student;Full Professor;Researcher;;Full Professor;Associate Professor", "bibtex": "@misc{\nli2024rethinking,\ntitle={Rethinking Counterfactual Fairness: On Which Individuals to Enforce, and How?},\nauthor={Haoxuan Li and Chunyuan Zheng and Zhichao Jiang and Zhuangyan Fang and Yue Liu and Zhi Geng and Kun Zhang},\nyear={2024},\nurl={https://openreview.net/forum?id=4e0ItHjNo9}\n}", "github": "", "project": "", "reviewers": "wXfm;CWdU;R7Tu;tVGj", "site": "https://openreview.net/forum?id=4e0ItHjNo9", "pdf_size": 334128, "rating": "3;3;5;6", "confidence": "5;4;3;4", "soundness": "2;2;2;2", "contribution": "1;2;2;3", "presentation": "2;3;2;2", "wc_summary": "163;75;159;251", "wc_strengths": "111;16;31;136", "wc_weaknesses": "309;236;187;1130", "wc_questions": "143;25;92;166", "wc_review": "726;352;469;1683", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.25, 1.299038105676658 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 162.0, 62.24949798994366 ], "wc_strengths_avg": [ 73.5, 51.051444641655344 ], "wc_weaknesses_avg": [ 465.5, 386.0974617891187 ], "wc_questions_avg": [ 106.5, 54.14101956926929 ], "wc_review_avg": [ 807.5, 523.2602125138122 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 6, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.5443310539518174, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:MN5AFgzzfGoJ:scholar.google.com/&scioq=Rethinking+Counterfactual+Fairness:+On+Which+Individuals+to+Enforce,+and+How%3F&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;0;1;2;0;3", "aff_unique_norm": "Peking University;Sun Yat-sen University;Xiaomi Corporation;Carnegie Mellon University", "aff_unique_dep": ";;;", "aff_unique_url": 
"http://www.pku.edu.cn;http://www.sysu.edu.cn;https://www.xiaomi.com;https://www.cmu.edu", "aff_unique_abbr": "Peking U;SYSU;Xiaomi;CMU", "aff_campus_unique_index": "1", "aff_campus_unique": ";Peking", "aff_country_unique_index": "0;0;0;0;0;1", "aff_country_unique": "China;United States" }, { "title": "Language Model Detectors Are Easily Optimized Against", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19453", "id": "4eJDMjYZZG", "author_site": "Charlotte Nicks, Eric Mitchell, Rafael Rafailov, Archit Sharma, Christopher Manning, Chelsea Finn, Stefano Ermon", "tldr": "", "abstract": "The fluency and general applicability of large language models (LLMs) has motivated significant interest in detecting whether a piece of text was written by a language model. While both academic and commercial detectors have been deployed in some settings, particularly education, other research has highlighted the fragility of these systems. In this paper, we demonstrate a data-efficient attack that fine-tunes language models to confuse existing detectors, leveraging recent developments in reinforcement learning of language models. We use the `human-ness' score (often just a log probability) of various open-source and commercial detectors as a reward function for reinforcement learning, subject to a KL-divergence constraint that the resulting model does not differ significantly from the original. For a 7B parameter Llama-2 model, fine-tuning for under a day reduces the AUROC of the OpenAI RoBERTa-Large detector from 0.84 to 0.63, while perplexity on OpenWebText increases from 8.7 to only 9.0; with a larger perplexity budget, we can drive AUROC to 0.30 (worse than random). Similar to traditional adversarial attacks, we find that this increase in 'detector evasion' generalizes to other detectors not used during training. In light of our empirical results, we advise against continued reliance on LLM-generated text detectors. 
Models, datasets, and selected experiment code will be released at https://github.com/charlottttee/llm-detector-evasion.", "keywords": "detector;language model;learning from preferences", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "Charlotte Nicks;Eric Mitchell;Rafael Rafailov;Archit Sharma;Christopher D Manning;Chelsea Finn;Stefano Ermon", "authorids": "cnicks13@stanford.edu;~Eric_Mitchell1;~Rafael_Rafailov1;~Archit_Sharma1;~Christopher_D_Manning1;~Chelsea_Finn1;~Stefano_Ermon1", "gender": ";M;M;M;M;F;M", "homepage": ";https://ericmitchell.ai;https://rmrafailov.github.io/;;https://nlp.stanford.edu/~manning/;https://ai.stanford.edu/~cbfinn/;http://cs.stanford.edu/~ermon/", "dblp": ";238/0419;272/5358;220/3163.html;m/ChristopherDManning;131/1783;47/8135", "google_scholar": ";q77J4fgAAAAJ;TwABcRgAAAAJ;_0IIzxgAAAAJ;1zmDOdwAAAAJ;vfPE6hgAAAAJ;", "orcid": ";0000-0002-7487-1744;;;0000-0001-6155-649X;;", "linkedin": ";;;;christopher-manning-011575/;;", "or_profile": "cnicks13@stanford.edu;~Eric_Mitchell1;~Rafael_Rafailov1;~Archit_Sharma1;~Christopher_D_Manning1;~Chelsea_Finn1;~Stefano_Ermon1", "aff": ";Stanford University;Stanford University;Stanford University;Computer Science Department, Stanford University;Google;Stanford University", "aff_domain": ";stanford.edu;stanford.edu;stanford.edu;cs.stanford.edu;google.com;stanford.edu", "position": ";PhD student;PhD student;Graduate Student;Full Professor;Research Scientist;Associate Professor", "bibtex": "@inproceedings{\nnicks2024language,\ntitle={Language Model Detectors Are Easily Optimized Against},\nauthor={Charlotte Nicks and Eric Mitchell and Rafael Rafailov and Archit Sharma and Christopher D Manning and Chelsea Finn and Stefano Ermon},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=4eJDMjYZZG}\n}", "github": "", "project": "", "reviewers": "iNUy;oZ9u;bGzn", "pdf_size": 893329, "rating": "6;6;6", "confidence": "4;3;4", "soundness": "3;3;2", "contribution": "3;3;2", "presentation": "2;3;2", "wc_summary": "82;127;86", "wc_strengths": "48;87;107", "wc_weaknesses": "62;72;107", "wc_questions": "29;64;1", "wc_review": "221;350;301", "wc_reply_reviewers": "6;0;0", "wc_reply_authors": "757;993;621", "reply_reviewers": "1;0;0", "reply_authors": "1;2;1", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 98.33333333333333, 20.336065390226192 ], "wc_strengths_avg": [ 80.66666666666667, 24.499433100017278 ], "wc_weaknesses_avg": [ 80.33333333333333, 19.293061504650375 ], "wc_questions_avg": [ 31.333333333333332, 25.77250904010361 ], "wc_review_avg": [ 290.6666666666667, 53.168495266359464 ], "wc_reply_reviewers_avg": [ 2.0, 2.8284271247461903 ], "wc_reply_authors_avg": [ 790.3333333333334, 153.68654968980064 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 1.3333333333333333, 0.4714045207910317 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 15, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10995996193096347572&as_sdt=400005&sciodt=0,14&hl=en", "gs_version_total": 2, "openreview": "https://openreview.net/forum?id=4eJDMjYZZG", "pdf": 
"https://openreview.net/pdf?id=4eJDMjYZZG", "email": ";stanford.edu;stanford.edu;stanford.edu;cs.stanford.edu;google.com;stanford.edu", "author_num": 7, "aff_unique_index": "0;0;0;0;1;0", "aff_unique_norm": "Stanford University;Google", "aff_unique_dep": ";Google", "aff_unique_url": "https://www.stanford.edu;https://www.google.com", "aff_unique_abbr": "Stanford;Google", "aff_campus_unique_index": "0;0;0;0;1;0", "aff_campus_unique": "Stanford;Mountain View", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "4fH5ELoWFu", "title": "Towards Certified Probabilistic Robustness with High Accuracy", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Adversarial examples pose a security threat to many critical systems built on neural networks (such as face recognition systems and self-driving cars). While many methods have been proposed to build robust models, how to build certifiably robust yet accurate neural network models remains an open problem. For example, adversarial training improves empirical robustness, but they do not provide certification of the model's robustness. Conversely, certified training provides certified robustness but at the cost of a significant accuracy drop. In this work, we propose a novel approach that aims to achieve both high accuracy and certified probabilistic robustness. Our method has two parts which together achieve our goal, \\emph{i.e.}, a probabilistic robust training method with an additional goal of minimizing variance in divergence in a given vicinity and a runtime inference method for certified probabilistic robustness of the predictions. Compared to alternative methods such as randomized smoothing and certified training, our approach avoids introducing strong noise during training, is effective against a variety of perturbations, and most importantly, achieves certified probabilistic robustness without sacrificing accuracy. 
Our experiments on multiple models trained on different datasets demonstrate that our approach significantly outperforms existing approaches in terms of both certification rate and accuracy.", "keywords": "robustness;adversarial training;probabilistic Robustness", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "Ruihan Zhang;Peixin Zhang;Jun Sun", "authorids": "~Ruihan_Zhang4;~Peixin_Zhang1;~Jun_Sun12", "gender": "F;M;M", "homepage": ";http://pxzhang.cn;https://sunjun.site", "dblp": ";;", "google_scholar": ";nS25GTQAAAAJ;https://scholar.google.com.sg/citations?user=DVsEyn0AAAAJ", "orcid": ";;", "linkedin": "zhangruihan/;;", "or_profile": "~Ruihan_Zhang4;~Peixin_Zhang1;~Jun_Sun12", "aff": "Singapore Management University;Singapore Management University;Singapore Management University", "aff_domain": "smu.edu.sg;smu.edu.sg;smu.edu.sg", "position": "PhD student;Postdoc;Full Professor", "bibtex": "@misc{\nzhang2024towards,\ntitle={Towards Certified Probabilistic Robustness with High Accuracy},\nauthor={Ruihan Zhang and Peixin Zhang and Jun Sun},\nyear={2024},\nurl={https://openreview.net/forum?id=4fH5ELoWFu}\n}", "github": "", "project": "", "reviewers": "d8Hi;iJ6m;Dkh4;kTWZ", "site": "https://openreview.net/forum?id=4fH5ELoWFu", "pdf_size": 869728, "rating": "3;3;5;5", "confidence": "3;3;4;5", "soundness": "1;2;2;1", "contribution": "1;2;2;3", "presentation": "2;1;2;2", "wc_summary": "44;74;18;65", "wc_strengths": "41;68;47;74", "wc_weaknesses": "192;194;974;203", "wc_questions": "484;273;105;216", "wc_review": "761;609;1144;558", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 3.75, 0.82915619758885 ], "soundness_avg": [ 1.5, 0.5 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 1.75, 0.4330127018922193 ], "wc_summary_avg": [ 50.25, 21.568205766822608 ], "wc_strengths_avg": [ 57.5, 13.82931668593933 ], "wc_weaknesses_avg": [ 390.75, 336.7650330720219 ], "wc_questions_avg": [ 269.5, 137.79060200173305 ], "wc_review_avg": [ 768.0, 229.56807269304676 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.9045340337332909, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:zxhVKVfQM8YJ:scholar.google.com/&scioq=Towards+Certified+Probabilistic+Robustness+with+High+Accuracy&hl=en&as_sdt=0,44", "gs_version_total": 4, "aff_unique_index": "0;0;0", "aff_unique_norm": "Singapore Management University", "aff_unique_dep": "", "aff_unique_url": "https://www.smu.edu.sg", "aff_unique_abbr": "SMU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "Singapore" }, { "id": "4fVuBf5HE9", "title": "Towards Analyzing Self-attention via Linear Neural Network", "track": "main", "status": "Reject", "tldr": "", "abstract": "Self-attention is a key component of the transformer architecture which has driven much of recent advances in AI. Theoretical analysis of self-attention has received significant attention and remains a work in progress. 
In this paper, we analyze gradient flow training of a simplified transformer model consisting of a single linear self-attention layer (thus it lacks softmax, MLP, and layer-normalization) with a single head on a histogram-like problem: the input is a sequence of characters from an alphabet and the output is the vector of counts of each letter in the input sequence. Our analysis goes via a reduction to 2-layer linear neural networks in which the input layer matrix is a diagonal matrix. We provide a complete analysis of gradient flow on these networks. Our reduction to linear neural networks involves one assumption which we empirically verify. Our analysis extends to various extensions of the histogram problem.", "keywords": "transformers;linear neural networks;gradient flow analysis", "primary_area": "learning theory", "supplementary_material": "", "author": "Pritam Chandra;Tanmay Kumar Sinha;Kabir Ahuja;Ankit Garg;Navin Goyal", "authorids": "~Pritam_Chandra1;~Tanmay_Kumar_Sinha1;~Kabir_Ahuja1;~Ankit_Garg1;~Navin_Goyal1", "gender": "M;M;M;;", "homepage": ";;https://kabirahuja2431.github.io/;https://ankit-garg-6.github.io/;", "dblp": ";;https://dblp.uni-trier.de/pid/265/5632;;20/6275", "google_scholar": ";;xQ4sUrYAAAAJ;25Ha82sAAAAJ;", "orcid": ";;;;", "linkedin": "pritamchandra;tanmay-sinha-b747171b3/;kabirahuja2431/;;", "or_profile": "~Pritam_Chandra1;~Tanmay_Kumar_Sinha1;~Kabir_Ahuja1;~Ankit_Garg1;~Navin_Goyal1", "aff": "Microsoft Research;Microsoft Research;Microsoft;Microsoft;Microsoft", "aff_domain": "research.microsoft.com;research.microsoft.com;microsoft.com;microsoft.com;microsoft.com", "position": "Research Fellow;Research Fellow;Research Fellow;Researcher;Researcher", "bibtex": "@misc{\nchandra2024towards,\ntitle={Towards Analyzing Self-attention via Linear Neural Network},\nauthor={Pritam Chandra and Tanmay Kumar Sinha and Kabir Ahuja and Ankit Garg and Navin Goyal},\nyear={2024},\nurl={https://openreview.net/forum?id=4fVuBf5HE9}\n}", "github": "", "project": "", "reviewers": "nN7u;7ZKc;4ez9", "site": "https://openreview.net/forum?id=4fVuBf5HE9", "pdf_size": 541289, "rating": "3;5;5", "confidence": "3;4;4", "soundness": "2;3;2", "contribution": "2;2;1", "presentation": "2;3;2", "wc_summary": "113;59;59", "wc_strengths": "54;29;29", "wc_weaknesses": "225;70;198", "wc_questions": "7;64;4", "wc_review": "399;222;290", "wc_reply_reviewers": "27;0;0", "wc_reply_authors": "21;28;0", "reply_reviewers": "1;0;0", "reply_authors": "1;1;0", "rating_avg": [ 4.333333333333333, 0.9428090415820634 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 1.6666666666666667, 0.4714045207910317 ], "presentation_avg": [ 2.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 77.0, 25.45584412271571 ], "wc_strengths_avg": [ 37.333333333333336, 11.785113019775793 ], "wc_weaknesses_avg": [ 164.33333333333334, 67.60834925428138 ], "wc_questions_avg": [ 25.0, 27.60434748368452 ], "wc_review_avg": [ 303.6666666666667, 72.9032844862897 ], "wc_reply_reviewers_avg": [ 9.0, 12.727922061357855 ], "wc_reply_authors_avg": [ 16.333333333333332, 11.897712198383164 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 0.6666666666666666, 0.4714045207910317 ], "replies_avg": [ 9, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.9999999999999998, "gs_citation": 0, "gs_cited_by_link": 
"https://scholar.google.com/scholar?q=related:_0JlvKdQYy4J:scholar.google.com/&scioq=Towards+Analyzing+Self-attention+via+Linear+Neural+Network&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;0;0;0", "aff_unique_norm": "Microsoft", "aff_unique_dep": "Microsoft Research", "aff_unique_url": "https://www.microsoft.com/en-us/research", "aff_unique_abbr": "MSR", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "4fbFKO4a2W", "title": "Guided Sketch-Based Program Induction by Search Gradients", "track": "main", "status": "Reject", "tldr": "", "abstract": "Many tasks can be easily solved using machine learning techniques. However, some tasks cannot readily be solved using statistical models, requiring a symbolic approach instead. Program induction is one of the ways that such tasks can be solved by means of capturing an interpretable and generalizable algorithm through training. However, contemporary approaches to program induction are not sophisticated enough to readily be applied to various types of tasks as they tend to be formulated as a single, all-encompassing model, usually parameterized by neural networks. In an attempt to make program induction a viable solution for many scenarios, we propose a framework for learning parameterized programs via search gradients using evolution strategies. This formulation departs from traditional program induction as it allows for the programmer to impart task-specific code to the program 'sketch', while also enjoying the benefits of accelerated learning through end-to-end gradient-based optimization.", "keywords": "program induction;program synthesis;optimization;discrete optimization;evolution strategies", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Ahmad Ayaz Amin", "authorids": "~Ahmad_Ayaz_Amin1", "gender": "", "homepage": "https://ayaz-amin.github.io/", "dblp": "", "google_scholar": "", "orcid": "", "linkedin": "ahmad-ayaz-amin-68b320177/", "or_profile": "~Ahmad_Ayaz_Amin1", "aff": "Toronto Metropolitan University", "aff_domain": "torontomu.ca", "position": "Undergrad student", "bibtex": "@misc{\namin2024guided,\ntitle={Guided Sketch-Based Program Induction by Search Gradients},\nauthor={Ahmad Ayaz Amin},\nyear={2024},\nurl={https://openreview.net/forum?id=4fbFKO4a2W}\n}", "github": "", "project": "", "reviewers": "EcME;MY2o;y6cE;a6L3", "site": "https://openreview.net/forum?id=4fbFKO4a2W", "pdf_size": 290408, "rating": "1;3;3;3", "confidence": "5;3;4;4", "soundness": "2;2;1;3", "contribution": "1;2;2;2", "presentation": "2;2;1;2", "wc_summary": "65;34;95;27", "wc_strengths": "37;12;28;42", "wc_weaknesses": "133;113;523;112", "wc_questions": "1;2;14;38", "wc_review": "236;161;660;219", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 2.5, 0.8660254037844386 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.0, 0.7071067811865476 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 1.75, 0.4330127018922193 ], "wc_summary_avg": [ 55.25, 27.040478915877213 ], "wc_strengths_avg": [ 29.75, 11.409973707244026 ], "wc_weaknesses_avg": [ 220.25, 174.99339273241148 ], "wc_questions_avg": [ 13.75, 14.905955185763842 ], "wc_review_avg": [ 319.0, 198.8303296783466 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], 
"reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 6, 0 ], "authors#_avg": [ 1, 0 ], "corr_rating_confidence": -0.816496580927726, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:sgOg5N870DAJ:scholar.google.com/&scioq=Guided+Sketch-Based+Program+Induction+by+Search+Gradients&hl=en&as_sdt=0,6", "gs_version_total": 2, "aff_unique_index": "0", "aff_unique_norm": "Toronto Metropolitan University", "aff_unique_dep": "", "aff_unique_url": "https://www.tmu.ca/", "aff_unique_abbr": "TMU", "aff_country_unique_index": "0", "aff_country_unique": "Canada" }, { "title": "The Hedgehog & the Porcupine: Expressive Linear Attentions with Softmax Mimicry", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19452", "id": "4g02l2N2Nx", "author_site": "Michael Zhang, Kush Bhatia, Hermann Kumbong, Christopher Re", "tldr": "", "abstract": "Linear attentions have shown promise for improving Transformer efficiency, reducing attention's quadratic complexity to linear in sequence length. This holds exciting promise for (1) training linear Transformers from scratch, (2) `inetuned-conversion of task-specific Transformers into linear versions that recover task performance, and (3) pretrained-conversion of Transformers, such as language models, into linear versions readily finetunable on downstream tasks. However, linear attentions often underperform compared to standard softmax attention. To close this performance gap, we study the behaviors of softmax and linear attentions in various train-from-scratch and finetuned-conversion settings. We find prior linear attentions lack key properties of softmax attention tied to good performance: low-entropy (or spiky) weights and dot-product monotonicity. We further observe surprisingly simple feature maps that retain these properties match softmax performance, but are inefficient to compute in linear attention. We thus propose Hedgehog, a learnable linear attention that retains the spiky and monotonic properties of softmax attention while maintaining linear complexity. Hedgehog uses simple, trainable MLPs to produce attention weights mimicking softmax attention. Experiments show Hedgehog recovers over 99\\% of standard Transformer performance in train-from-scratch and finetuned-conversion settings, outperforming prior linear attentions by up to 6 perplexity points on WikiText-103 when training causal GPT models from scratch, and up to 8.7 GLUE score points when converting finetuned bidirectional BERT models. Hedgehog also enables pretrained-conversion. Converting a pretrained GPT-2 into a linear attention variant achieves state-of-the-art 16.7 perplexity on WikiText-103 for 125M subquadratic decoder models. We finally turn a pretrained Llama-2 7B into a viable linear attention Llama. 
With low-rank adaptation, Hedgehog-Llama-2 7B achieves 28.1 higher ROUGE-1 points over the base standard attention model, where prior linear attentions lead to 16.5 point drops.", "keywords": "linear attention;transformers", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Michael Zhang;Kush Bhatia;Hermann Kumbong;Christopher Re", "authorids": "~Michael_Zhang4;~Kush_Bhatia3;~Hermann_Kumbong1;~Christopher_Re1", "gender": "M;;M;", "homepage": "https://michaelzhang.xyz/;;https://kumbong.github.io/;", "dblp": ";;359/5994;", "google_scholar": "DG_asaIAAAAJ;;NnL2qHgAAAAJ;", "orcid": ";;;", "linkedin": ";;hermannkumbong/;", "or_profile": "~Michael_Zhang4;~Kush_Bhatia3;~Hermann_Kumbong1;~Christopher_Re1", "aff": "Stanford University;;Stanford University;", "aff_domain": "stanford.edu;;stanford.edu;", "position": "PhD student;;MS student;", "bibtex": "@inproceedings{\nzhang2024the,\ntitle={The Hedgehog \\& the Porcupine: Expressive Linear Attentions with Softmax Mimicry},\nauthor={Michael Zhang and Kush Bhatia and Hermann Kumbong and Christopher Re},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=4g02l2N2Nx}\n}", "github": "", "project": "", "reviewers": "ZtxG;PsQx;y6Q1", "pdf_size": 4785029, "rating": "5;6;8", "confidence": "4;4;4", "soundness": "3;3;3", "contribution": "3;3;3", "presentation": "2;2;4", "wc_summary": "59;79;184", "wc_strengths": "43;10;154", "wc_weaknesses": "44;51;111", "wc_questions": "66;14;43", "wc_review": "212;154;492", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "1077;496;549", "reply_reviewers": "0;0;0", "reply_authors": "2;1;1", "rating_avg": [ 6.333333333333333, 1.247219128924647 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 2.6666666666666665, 0.9428090415820634 ], "wc_summary_avg": [ 107.33333333333333, 54.822947344661756 ], "wc_strengths_avg": [ 69.0, 61.59545437773797 ], "wc_weaknesses_avg": [ 68.66666666666667, 30.070288030250428 ], "wc_questions_avg": [ 41.0, 21.275964529643932 ], "wc_review_avg": [ 286.0, 147.5759691368031 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 707.3333333333334, 262.2877978269079 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.3333333333333333, 0.4714045207910317 ], "replies_avg": [ 10, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 48, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=15609051419806727889&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=4g02l2N2Nx", "pdf": "https://openreview.net/pdf?id=4g02l2N2Nx", "email": "stanford.edu;;stanford.edu;", "author_num": 4, "aff_unique_index": "0;0", "aff_unique_norm": "Stanford University", "aff_unique_dep": "", "aff_unique_url": "https://www.stanford.edu", "aff_unique_abbr": "Stanford", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Stanford", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "id": "4g67WoYwMV", "title": "PromptFix: Few-shot Backdoor Removal via Adversarial Prompt Tuning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Pre-trained language models (PLMs) have attracted tons of attention over the past few years with their unparalleled performances. 
Meanwhile, the soaring cost to train PLMs and their amazing generalizability have contributed to few-shot fine-tuning and prompting as the most popular training paradigms for natural language processing (NLP) models. However, existing studies have shown that these NLP models can be backdoored such that model behavior is manipulated when the trigger tokens are presented. In this paper, we propose PromptFix, a novel backdoor mitigation strategy for NLP models via adversarial prompt-tuning in few-shot settings. Unlike existing NLP backdoor removal methods, which rely on accurate trigger inversion and subsequent model fine-tuning, PromptFix keeps the model parameters intact and only utilizes two extra sets of soft tokens which approximate the trigger and counteract it respectively. The use of soft tokens and adversarial optimization eliminates the need to enumerate possible backdoor configurations and enables an adaptive balance between trigger finding and preservation of performance. Experiments with various backdoor attacks validate the effectiveness of the proposed method. The performances when domain shift is present further shows PromptFix's applicability to pretrained models on unknown data which is common in prompt tuning scenarios.", "keywords": "backdoor mitigation;backdoor removal;adversarial training;prompt tuning", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Tianrong Zhang;Zhaohan Xi;Ting Wang;Prasenjit Mitra;Jinghui Chen", "authorids": "~Tianrong_Zhang1;~Zhaohan_Xi1;~Ting_Wang1;~Prasenjit_Mitra1;~Jinghui_Chen1", "gender": "M;M;M;M;M", "homepage": "https://zhangtianrong.github.io/profile/#en;https://zhaohan-xi.github.io;https://alps-lab.github.io/;http://www.personal.psu.edu/pum10/;https://jinghuichen.github.io/", "dblp": ";224/9296;12/2633-6.html;19/3308;67/5633", "google_scholar": ";wQgnjMIAAAAJ;cwcBTegAAAAJ;8PbgiPkAAAAJ;mKia7Y4AAAAJ", "orcid": ";;;;", "linkedin": ";;;prasenjit-mitra-962471/;", "or_profile": "~Tianrong_Zhang1;~Zhaohan_Xi1;~Ting_Wang1;~Prasenjit_Mitra1;~Jinghui_Chen1", "aff": "Pennsylvania State University;State University of New York at Binghamton;State University of New York at Stony Brook;Pennsylvania State University;Pennsylvania State University", "aff_domain": "psu.edu;binghamton.edu;cs.stonybrook.edu;psu.edu;psu.edu", "position": "PhD student;Assistant Professor;Associate Professor;Full Professor;Assistant Professor", "bibtex": "@misc{\nzhang2024promptfix,\ntitle={PromptFix: Few-shot Backdoor Removal via Adversarial Prompt Tuning},\nauthor={Tianrong Zhang and Zhaohan Xi and Ting Wang and Prasenjit Mitra and Jinghui Chen},\nyear={2024},\nurl={https://openreview.net/forum?id=4g67WoYwMV}\n}", "github": "", "project": "", "reviewers": "H931;7Ta8;Qy5u", "site": "https://openreview.net/forum?id=4g67WoYwMV", "pdf_size": 467125, "rating": "3;5;5", "confidence": "3;4;4", "soundness": "2;2;2", "contribution": "2;3;3", "presentation": "2;2;2", "wc_summary": "89;59;124", "wc_strengths": "142;30;94", "wc_weaknesses": "235;87;118", "wc_questions": "187;97;42", "wc_review": "653;273;378", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 4.333333333333333, 0.9428090415820634 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.0, 0.0 ], "wc_summary_avg": [ 90.66666666666667, 26.562295750848715 ], 
"wc_strengths_avg": [ 88.66666666666667, 45.87906809089401 ], "wc_weaknesses_avg": [ 146.66666666666666, 63.73033465748909 ], "wc_questions_avg": [ 108.66666666666667, 59.768070256803696 ], "wc_review_avg": [ 434.6666666666667, 160.2255354873942 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 3, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.9999999999999998, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6652982913500088575&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 6, "aff_unique_index": "0;1;2;0;0", "aff_unique_norm": "Pennsylvania State University;State University of New York at Binghamton;State University of New York at Stony Brook", "aff_unique_dep": ";;", "aff_unique_url": "https://www.psu.edu;https://www.binghamton.edu;https://www.stonybrook.edu", "aff_unique_abbr": "PSU;SUNY Binghamton;SUNY Stony Brook", "aff_campus_unique_index": "1;2", "aff_campus_unique": ";Binghamton;Stony Brook", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "United States" }, { "title": "Diffusion-TS: Interpretable Diffusion for General Time Series Generation", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19451", "id": "4h1apFjO99", "author_site": "Xinyu Yuan, Yan Qiao", "tldr": "", "abstract": "Denoising diffusion probabilistic models (DDPMs) are becoming the leading paradigm for generative models. It has recently shown breakthroughs in audio synthesis, time series imputation and forecasting. In this paper, we propose Diffusion-TS, a novel diffusion-based framework that generates multivariate time series samples of high quality by using an encoder-decoder transformer with disentangled temporal representations, in which the decomposition technique guides Diffusion-TS to capture the semantic meaning of time series while transformers mine detailed sequential information from the noisy model input. Different from existing diffusion-based approaches, we train the model to directly reconstruct the sample instead of the noise in each diffusion step, combining a Fourier-based loss term. Diffusion-TS is expected to generate time series satisfying both interpretablity and realness. In addition, it is shown that the proposed Diffusion-TS can be easily extended to conditional generation tasks, such as forecasting and imputation, without any model changes. This also motivates us to further explore the performance of Diffusion-TS under irregular settings. 
Finally, through qualitative and quantitative experiments, results show that Diffusion-TS achieves the state-of-the-art results on various realistic analyses of time series.", "keywords": "Diffusion models;Synthetic Time series;Imputation;Forecasting", "primary_area": "generative models", "supplementary_material": "/attachment/fbd19945fb6b17fb5f703c7b893e7ce83afa9b69.zip", "author": "Xinyu Yuan;Yan Qiao", "authorids": "~Xinyu_Yuan3;~Yan_Qiao1", "gender": "M;F", "homepage": "https://y-debug-sys.github.io/;http://faculty.hfut.edu.cn/qiaoyan/zh_CN/index.htm", "dblp": ";65/7820", "google_scholar": "https://scholar.google.co.in/citations?hl=en;3NPBIgcAAAAJ", "orcid": ";", "linkedin": ";", "or_profile": "~Xinyu_Yuan3;~Yan_Qiao1", "aff": "Hefei University of Technology;Hefei University of Technology", "aff_domain": "hfut.edu.cn;hfut.edu.cn", "position": "MS student;Associate Professor", "bibtex": "@inproceedings{\nyuan2024diffusionts,\ntitle={Diffusion-{TS}: Interpretable Diffusion for General Time Series Generation},\nauthor={Xinyu Yuan and Yan Qiao},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=4h1apFjO99}\n}", "github": "", "project": "", "reviewers": "Prro;iyrP;bNeL", "pdf_size": 7259356, "rating": "5;6;8", "confidence": "4;3;4", "soundness": "2;2;3", "contribution": "2;2;3", "presentation": "2;3;3", "wc_summary": "79;72;130", "wc_strengths": "27;137;29", "wc_weaknesses": "216;135;59", "wc_questions": "124;204;206", "wc_review": "446;548;424", "wc_reply_reviewers": "263;30;0", "wc_reply_authors": "1355;965;515", "reply_reviewers": "3;1;0", "reply_authors": "4;3;1", "rating_avg": [ 6.333333333333333, 1.247219128924647 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 93.66666666666667, 25.84999462712173 ], "wc_strengths_avg": [ 64.33333333333333, 51.38957957493804 ], "wc_weaknesses_avg": [ 136.66666666666666, 64.10581530216706 ], "wc_questions_avg": [ 178.0, 38.19249489974001 ], "wc_review_avg": [ 472.6666666666667, 54.020572213021055 ], "wc_reply_reviewers_avg": [ 97.66666666666667, 117.54809890234532 ], "wc_reply_authors_avg": [ 945.0, 343.2200460346103 ], "reply_reviewers_avg": [ 1.3333333333333333, 1.247219128924647 ], "reply_authors_avg": [ 2.6666666666666665, 1.247219128924647 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.18898223650461363, "gs_citation": 71, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=1266541908830140535&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=4h1apFjO99", "pdf": "https://openreview.net/pdf?id=4h1apFjO99", "email": "hfut.edu.cn;hfut.edu.cn", "author_num": 2, "aff_unique_index": "0;0", "aff_unique_norm": "Hefei University of Technology", "aff_unique_dep": "", "aff_unique_url": "http://www.hfut.edu.cn/", "aff_unique_abbr": "HUT", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "China" }, { "id": "4hqe5fgmfj", "title": "Regret Rates for $\\epsilon$-Greedy Strategies for Nonparametric Bandits with Delayed Rewards", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Incorporating delayed feedback is often crucial in applying multi-armed bandit algorithms in real-world sequential 
decision making problems. In this paper, we present finite time regret upper bounds for $\\epsilon$-greedy type randomized allocation strategies in a nonparametric contextual bandits framework with delayed rewards. The strategies presented differ in how the exploration rate changes as a function of delays. We consider unbounded random delays and use the Nadaraya-Watson estimator for estimating the mean reward functions. We also propose practical data-driven strategies that adaptively choose between the two proposed strategies.", "keywords": "Contextual Bandits;Delayed Rewards;Nonparametric Estimation;Nadaraya-Watson Estimator;Regret", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/c863652ce5a44f6ee404938e74b7197c34dafeb7.pdf", "author": "Sakshi Arya;Yuhong Yang", "authorids": "~Sakshi_Arya1;~Yuhong_Yang1", "gender": "F;M", "homepage": "https://sakshiarya.github.io/about/;http://users.stat.umn.edu/~yangx374/", "dblp": ";52/5811", "google_scholar": "https://scholar.google.com/citations?hl=en;https://scholar.google.com/citations?hl=en", "orcid": "0000-0002-7828-6569;0000-0003-3618-3083", "linkedin": "sakshi-arya-2704a3173/;", "or_profile": "~Sakshi_Arya1;~Yuhong_Yang1", "aff": "Case Western Reserve University;", "aff_domain": "case.edu;", "position": "Assistant Professor;", "bibtex": "@misc{\narya2024regret,\ntitle={Regret Rates for \\${\\textbackslash}epsilon\\$-Greedy Strategies for Nonparametric Bandits with Delayed Rewards},\nauthor={Sakshi Arya and Yuhong Yang},\nyear={2024},\nurl={https://openreview.net/forum?id=4hqe5fgmfj}\n}", "github": "", "project": "", "reviewers": "S8Nn;Zt6w;85Kj;pTZn", "site": "https://openreview.net/forum?id=4hqe5fgmfj", "pdf_size": 822021, "rating": "3;5;5;5", "confidence": "4;3;3;4", "soundness": "3;3;3;4", "contribution": "2;2;2;3", "presentation": "1;2;3;3", "wc_summary": "67;163;64;101", "wc_strengths": "26;57;96;59", "wc_weaknesses": "252;65;88;183", "wc_questions": "258;71;17;8", "wc_review": "603;356;265;351", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.5, 0.8660254037844386 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.25, 0.82915619758885 ], "wc_summary_avg": [ 98.75, 39.83952183447989 ], "wc_strengths_avg": [ 59.5, 24.804233509624925 ], "wc_weaknesses_avg": [ 147.0, 75.04332082204252 ], "wc_questions_avg": [ 88.5, 100.78318312099495 ], "wc_review_avg": [ 393.75, 126.10982317012422 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:a-cW-8vMgOcJ:scholar.google.com/&scioq=Regret+Rates+for+%24%5Cepsilon%24-Greedy+Strategies+for+Nonparametric+Bandits+with+Delayed+Rewards&hl=en&as_sdt=0,44", "gs_version_total": 0, "aff_unique_index": "0", "aff_unique_norm": "Case Western Reserve University", "aff_unique_dep": "", "aff_unique_url": "https://www.case.edu", "aff_unique_abbr": "CWRU", "aff_country_unique_index": "0", "aff_country_unique": "United States" }, { "id": "4hrK7d60My", "title": "Memorization for Good: Encryption with Autoregressive Language Models", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Over-parameterized neural language models 
(LMs) can memorize and recite long sequences of training data. While such memorization is normally associated with undesired properties such as overfitting and information leaking, our work casts memorization as an unexplored capability of LMs. We propose the first symmetric encryption algorithm with autoregressive language models (SELM). We show that autoregressive LMs can encode arbitrary data into a compact real-valued vector (i.e., encryption) and then losslessly decode the vector to the original message (i.e., decryption) via random subspace optimization and greedy decoding. While SELM is not amenable to conventional cryptanalysis, we investigate its security through a novel empirical variant of the classic IND-CPA (indistinguishability under chosen-plaintext attack) game.", "keywords": "language models;symmetric encryption;cryptography;application", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/52276f3f7303f39867a50633ec51e106986d7550.zip", "author": "Samuel Stevens;Yu Su", "authorids": "~Samuel_Stevens1;~Yu_Su2", "gender": "M;M", "homepage": "https://samuelstevens.me;http://ysu1989.github.io", "dblp": "279/6356;38/1070-1", "google_scholar": "uR-A0LAAAAAJ;rIh5OqoAAAAJ", "orcid": "0009-0000-9493-7766;", "linkedin": ";", "or_profile": "~Samuel_Stevens1;~Yu_Su2", "aff": "Ohio State University, Columbus;Microsoft", "aff_domain": "osu.edu;microsoft.com", "position": "PhD student;Senior Researcher", "bibtex": "@misc{\nstevens2024memorization,\ntitle={Memorization for Good: Encryption with Autoregressive Language Models},\nauthor={Samuel Stevens and Yu Su},\nyear={2024},\nurl={https://openreview.net/forum?id=4hrK7d60My}\n}", "github": "", "project": "", "reviewers": "dUZZ;vHhk;wc1D;XtDw", "site": "https://openreview.net/forum?id=4hrK7d60My", "pdf_size": 1078887, "rating": "3;3;3;6", "confidence": "5;4;3;3", "soundness": "2;2;2;4", "contribution": "2;3;2;3", "presentation": "2;1;2;4", "wc_summary": "153;28;90;53", "wc_strengths": "7;23;5;85", "wc_weaknesses": "183;140;19;142", "wc_questions": "134;60;25;60", "wc_review": "477;251;139;340", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "271;162;103;240", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 3.75, 1.299038105676658 ], "confidence_avg": [ 3.75, 0.82915619758885 ], "soundness_avg": [ 2.5, 0.8660254037844386 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.25, 1.0897247358851685 ], "wc_summary_avg": [ 81.0, 47.05847426340977 ], "wc_strengths_avg": [ 30.0, 32.51153641401772 ], "wc_weaknesses_avg": [ 121.0, 61.33922073192649 ], "wc_questions_avg": [ 69.75, 39.75157229594824 ], "wc_review_avg": [ 301.75, 123.73232196964543 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 194.0, 65.85969936159745 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 8, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.5222329678670935, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11166588927408510344&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 3, "aff_unique_index": "0;1", "aff_unique_norm": "Ohio State University;Microsoft", "aff_unique_dep": ";Microsoft Corporation", "aff_unique_url": "https://www.osu.edu;https://www.microsoft.com", "aff_unique_abbr": "OSU;Microsoft", "aff_campus_unique_index": "0", "aff_campus_unique": "Columbus;", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "id": 
"4i4fgCOBDE", "title": "Networked Inequality: Preferential Attachment Bias in Graph Neural Network Link Prediction", "track": "main", "status": "Reject", "tldr": "", "abstract": "Graph neural network (GNN) link prediction is increasingly deployed in citation, collaboration, and online social networks to recommend academic literature, collaborators, and friends. While prior research has investigated the dyadic fairness of GNN link prediction, the within-group fairness and ``rich get richer'' dynamics of link prediction remain underexplored. However, these aspects have significant consequences for degree and power imbalances in networks. In this paper, we shed light on how degree bias in networks affects Graph Convolutional Network (GCN) link prediction. In particular, we theoretically uncover that GCNs with a symmetric normalized graph filter have a within-group preferential attachment bias. We validate our theoretical analysis on real-world citation, collaboration, and online social networks. We further bridge GCN's preferential attachment bias with unfairness in link prediction and propose a new within-group fairness metric. This metric quantifies disparities in link prediction scores between social groups, towards combating the amplification of degree and power disparities. Finally, we propose a simple training-time strategy to alleviate within-group unfairness, and we show that it is effective on citation, online social, and credit networks.", "keywords": "graph learning;fairness;link prediction", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/55e28c0d8107ea58843db8331acc1284d2c1e5a8.zip", "author": "Arjun Subramonian;Levent Sagun;Yizhou Sun", "authorids": "~Arjun_Subramonian1;~Levent_Sagun1;~Yizhou_Sun1", "gender": "Agender;Non-Binary;F", "homepage": "http://arjunsubramonian.github.io/;http://cims.nyu.edu/~sagun/;http://web.cs.ucla.edu/~yzsun/", "dblp": "282/0168.html;155/9866;37/3868", "google_scholar": "MrdlDhoAAAAJ;-iPZaBcAAAAJ;https://scholar.google.com.tw/citations?user=TQgOjK0AAAAJ", "orcid": "0000-0002-0415-3800;0000-0001-5403-4124;", "linkedin": "arjuns22/;;", "or_profile": "~Arjun_Subramonian1;~Levent_Sagun1;~Yizhou_Sun1", "aff": "University of California, Los Angeles;Meta;University of California, Los Angeles", "aff_domain": "ucla.edu;meta.com;ucla.edu", "position": "PhD student;Research scientist;Associate Professor", "bibtex": "@misc{\nsubramonian2024networked,\ntitle={Networked Inequality: Preferential Attachment Bias in Graph Neural Network Link Prediction},\nauthor={Arjun Subramonian and Levent Sagun and Yizhou Sun},\nyear={2024},\nurl={https://openreview.net/forum?id=4i4fgCOBDE}\n}", "github": "", "project": "", "reviewers": "LXYw;bJuY;qGCf;LDLM", "site": "https://openreview.net/forum?id=4i4fgCOBDE", "pdf_size": 3213881, "rating": "5;5;6;8", "confidence": "4;4;3;3", "soundness": "3;3;3;3", "contribution": "2;3;3;3", "presentation": "3;4;4;3", "wc_summary": "69;200;58;226", "wc_strengths": "73;98;60;95", "wc_weaknesses": "148;112;131;215", "wc_questions": "87;301;2;2", "wc_review": "377;711;251;538", "wc_reply_reviewers": "136;43;18;6", "wc_reply_authors": "898;450;452;361", "reply_reviewers": "1;1;1;1", "reply_authors": "2;1;1;1", "rating_avg": [ 6.0, 1.224744871391589 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.5, 0.5 ], "wc_summary_avg": [ 138.25, 75.41344376170605 ], "wc_strengths_avg": [ 81.5, 
15.724185193516387 ], "wc_weaknesses_avg": [ 151.5, 38.81043674065006 ], "wc_questions_avg": [ 98.0, 122.23133804389118 ], "wc_review_avg": [ 469.25, 172.70838862081945 ], "wc_reply_reviewers_avg": [ 50.75, 50.99693618248061 ], "wc_reply_authors_avg": [ 540.25, 209.79081843588867 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 21, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.8164965809277259, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=15580880506040045795&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 7, "aff_unique_index": "0;1;0", "aff_unique_norm": "University of California, Los Angeles;Meta", "aff_unique_dep": ";Meta Platforms, Inc.", "aff_unique_url": "https://www.ucla.edu;https://meta.com", "aff_unique_abbr": "UCLA;Meta", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Los Angeles;", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "4i8QiVIlAi", "title": "Semantic-Guided Consistency and Discrimination for Siamese Representation Learning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Recently, self-supervised representation learning with Siamese structure (Siamese representation learning) has shown promising results. Current methods commonly adopt instance discrimination to learn invariant global representations at the image-level from randomly cropped views, which risks introducing object-irrelevant nuisances of background information in the image-level representations, i.e., random cropping induces nuisances of background. Further works aiming to solve the problem simply match the visual patterns across views independently, failing to look into the foreground and background regions. Intuitively, the nuisances of background could be alleviated by separating foreground and background in random crops. Therefore, we present a new self-supervised learning framework, semantic-guided consistency and discrimination (SCD) that learns to separate the foreground and background semantics in random crops while learning image-level representations. Specifically, we extract foreground and background semantics by aggregating the global feature map encoding the image content, using the learned feature-level saliency maps (indicating the foreground pixels on feature maps) as weights. Then we construct triplets from the foreground and background semantics of the two augmented views and distinguish foreground from background with triplet loss. Our SCD strategy can easily be applied to existing Siamese representation learning frameworks, including contrastive learning (e.g., MoCo-v2) and non-contrastive learning (e.g., BYOL) paradigm. 
By applying our SCD to both paradigms, we show that our method can achieve consistent improvements on classification and dense prediction tasks.", "keywords": "Contrastive learning;Siamese representation learning", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Zheng Gao;Ioannis Patras", "authorids": "~Zheng_Gao2;~Ioannis_Patras2", "gender": "M;M", "homepage": "https://zaczgao.github.io/;http://www.eecs.qmul.ac.uk/~ioannisp/", "dblp": "03/4645-3;18/1556", "google_scholar": "SXJFLpAAAAAJ;https://scholar.google.com.tw/citations?user=OBYLxRkAAAAJ", "orcid": "0000-0001-5541-8840;0000-0003-3913-4738", "linkedin": ";ioannis-patras-1053767/", "or_profile": "~Zheng_Gao2;~Ioannis_Patras2", "aff": "Queen Mary, University of London;Queen Mary, University of London", "aff_domain": "qmul.ac.uk;qmul.ac.uk", "position": "PhD student;Full Professor", "bibtex": "@misc{\ngao2024semanticguided,\ntitle={Semantic-Guided Consistency and Discrimination for Siamese Representation Learning},\nauthor={Zheng Gao and Ioannis Patras},\nyear={2024},\nurl={https://openreview.net/forum?id=4i8QiVIlAi}\n}", "github": "", "project": "", "reviewers": "YhuM;131y;CkNt;Exdt;Ue4Q", "site": "https://openreview.net/forum?id=4i8QiVIlAi", "pdf_size": 840901, "rating": "3;3;3;5;6", "confidence": "5;5;4;4;4", "soundness": "2;2;1;3;3", "contribution": "2;1;1;2;3", "presentation": "3;2;2;3;4", "wc_summary": "38;65;55;80;47", "wc_strengths": "17;45;23;19;10", "wc_weaknesses": "84;426;329;94;145", "wc_questions": "2;1;23;129;10", "wc_review": "141;537;430;322;212", "wc_reply_reviewers": "0;0;0;0;0", "wc_reply_authors": "0;0;0;0;0", "reply_reviewers": "0;0;0;0;0", "reply_authors": "0;0;0;0;0", "rating_avg": [ 4.0, 1.2649110640673518 ], "confidence_avg": [ 4.4, 0.48989794855663565 ], "soundness_avg": [ 2.2, 0.7483314773547882 ], "contribution_avg": [ 1.8, 0.7483314773547883 ], "presentation_avg": [ 2.8, 0.7483314773547882 ], "wc_summary_avg": [ 57.0, 14.546477236774544 ], "wc_strengths_avg": [ 22.8, 11.872657663724665 ], "wc_weaknesses_avg": [ 215.6, 137.27140998765913 ], "wc_questions_avg": [ 33.0, 48.641546028061235 ], "wc_review_avg": [ 328.4, 143.20977620260427 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.6454972243679027, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:RklV1PE58mUJ:scholar.google.com/&scioq=Semantic-Guided+Consistency+and+Discrimination+for+Siamese+Representation+Learning&hl=en&as_sdt=0,10", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "Queen Mary, University of London", "aff_unique_dep": "", "aff_unique_url": "https://www.qmul.ac.uk", "aff_unique_abbr": "QMUL", "aff_campus_unique_index": "0;0", "aff_campus_unique": "London", "aff_country_unique_index": "0;0", "aff_country_unique": "United Kingdom" }, { "title": "Scalable Neural Network Kernels", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19450", "id": "4iPw1klFWa", "author_site": "Arijit Sehanobish, Krzysztof Choromanski, YUNFAN ZHAO, Kumar Dubey, Valerii Likhosherstov", "tldr": "", "abstract": "We introduce the concept of scalable neural network kernels (SNNKs), the replacements of regular feedforward layers (FFLs), capable of approximating the latter, but with favorable computational properties. 
SNNKs effectively disentangle the inputs from the parameters of the neural network in the FFL, only to connect them in the final computation via the dot-product kernel. \nThey are also strictly more expressive, as allowing to model complicated relationships beyond the functions of the dot-products of parameter-input vectors. We also introduce the neural network bundling process that applies SNNKs to compactify deep neural network architectures, resulting in additional compression gains. In its extreme version, it leads to the fully bundled network whose optimal parameters can be expressed via explicit formulae for several loss functions (e.g. mean squared error), opening a possibility to bypass backpropagation. As a by-product of our analysis, we introduce the mechanism of the universal random features (or URFs), applied to instantiate several SNNK variants, and interesting on its own in the context of scalable kernel methods. We provide rigorous theoretical analysis of all these concepts as well as an extensive empirical evaluation, ranging from point-wise kernel estimation to Transformers' fine-tuning with novel adapter layers inspired by SNNKs. Our mechanism provides up to 5x reduction in the number of trainable parameters, while maintaining competitive accuracy.", "keywords": "scalable kernel methods;random features;deep neural networks", "primary_area": "metric learning, kernel learning, and sparse coding", "supplementary_material": "", "author": "Arijit Sehanobish;Krzysztof Marcin Choromanski;YUNFAN ZHAO;Kumar Avinava Dubey;Valerii Likhosherstov", "authorids": "~Arijit_Sehanobish1;~Krzysztof_Marcin_Choromanski1;~YUNFAN_ZHAO1;~Kumar_Avinava_Dubey1;~Valerii_Likhosherstov2", "gender": "M;;M;;M", "homepage": "https://github.com/arijitthegame/;;https://yzhao3685.github.io/;https://valerytyumen.github.io/;https://sites.google.com/site/kumaravinavadubey/", "dblp": "249/5322;78/11411;304/4614;232/4391.html;10/7789", "google_scholar": "MEby6-QAAAAJ;;wy_rqnwAAAAJ;iiVVfxUAAAAJ;tBbUAfsAAAAJ", "orcid": "0000-0003-2769-2003;;;;", "linkedin": "arijit-sehanobish-b76627112/;;;;", "or_profile": "~Arijit_Sehanobish1;~Krzysztof_Marcin_Choromanski1;~YUNFAN_ZHAO1;~Valerii_Likhosherstov2;~Kumar_A_Dubey1", "aff": "Kensho Technologies;Google Brain Robotics & Columbia University;Harvard University;Waymo;Google Research", "aff_domain": "kensho.com;columbia.edu;g.harvard.edu;waymo.com;google.com", "position": "Applied Scientist;research scientist & adjunct assistant professor;Postdoc;Researcher;Research Scientist", "bibtex": "@inproceedings{\nsehanobish2024scalable,\ntitle={Scalable Neural Network Kernels},\nauthor={Arijit Sehanobish and Krzysztof Marcin Choromanski and YUNFAN ZHAO and Kumar Avinava Dubey and Valerii Likhosherstov},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=4iPw1klFWa}\n}", "github": "", "project": "", "reviewers": "hP8B;YEib;uu7e;zChr", "pdf_size": 2818029, "rating": "5;5;8;8", "confidence": "4;3;3;3", "soundness": "3;2;4;4", "contribution": "3;2;4;4", "presentation": "3;3;3;3", "wc_summary": "33;219;99;221", "wc_strengths": "12;175;112;255", "wc_weaknesses": "28;197;126;104", "wc_questions": "131;10;21;179", "wc_review": "204;601;358;759", "wc_reply_reviewers": "49;27;0;0", "wc_reply_authors": "851;1599;816;1375", "reply_reviewers": "1;1;0;0", "reply_authors": "2;5;2;3", "rating_avg": [ 6.5, 1.5 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 3.25, 0.82915619758885 ], 
"contribution_avg": [ 3.25, 0.82915619758885 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 143.0, 80.46117075956576 ], "wc_strengths_avg": [ 138.5, 88.89460051094217 ], "wc_weaknesses_avg": [ 113.75, 60.26763227471277 ], "wc_questions_avg": [ 85.25, 71.890107108002 ], "wc_review_avg": [ 480.5, 214.2084265382667 ], "wc_reply_reviewers_avg": [ 19.0, 20.530465167647808 ], "wc_reply_authors_avg": [ 1160.25, 336.438237273946 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 3.0, 1.224744871391589 ], "replies_avg": [ 21, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.5773502691896258, "gs_citation": 6, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14725734791680925783&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=4iPw1klFWa", "pdf": "https://openreview.net/pdf?id=4iPw1klFWa", "email": "kensho.com;columbia.edu;g.harvard.edu;waymo.com;google.com", "author_num": 5, "aff_unique_index": "0;1;2;3;1", "aff_unique_norm": "Kensho Technologies;Google;Harvard University;Waymo", "aff_unique_dep": ";Google Brain Robotics;;", "aff_unique_url": "https://www.kensho.com;https://ai.google;https://www.harvard.edu;https://www.waymo.com", "aff_unique_abbr": ";Google;Harvard;Waymo", "aff_campus_unique_index": "1;1", "aff_campus_unique": ";Mountain View", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "4iQuByhNie", "title": "ContextNER: Contextual Phrase Generation at Scale", "track": "main", "status": "Reject", "tldr": "", "abstract": "Named Entity Recognition (NER) has seen significant progress in recent years, with numerous state-of-the-art (SOTA) models achieving high performance. \nHowever, very few studies have focused on the generation of entities' context.\nIn this paper, we introduce ContextNER, a task that aims to generate the relevant context for entities in a sentence, where the context is a phrase describing the entity but not necessarily present in the sentence. \nTo facilitate research in this task, we also present the EDGAR10-Q dataset, which consists of annual and quarterly reports from the top 1500 publicly traded companies. \nThe dataset is the largest of its kind, containing 1M sentences, 2.8M entities, and an average of 35 tokens per sentence, making it a challenging dataset. \nWe propose a baseline approach that combines a phrase generation algorithm with inferencing using a 220M language model, achieving a ROUGE-L score of 27% on the test split.\nAdditionally, we perform a one-shot inference with ChatGPT, which obtains a 30% ROUGE-L, highlighting the difficulty of the dataset. \nWe also evaluate models such as T5 and BART, which achieve a maximum ROUGE-L of 49% after supervised finetuning on EDGAR10-Q. \nWe also find that T5-large, when pre-finetuned on EDGAR10-Q, achieve SOTA results on downstream finance tasks such as Headline, FPB, and FiQA SA, outperforming vanilla version by 10.81 points.\nTo our surprise, this 66x smaller pre-finetuned model also surpasses the finance-specific LLM BloombergGPT-50B by 15 points. 
\nWe hope that our dataset and generated artifacts will encourage further research in this direction, leading to the development of more sophisticated language models for financial text analysis", "keywords": "Novel task;Relevant context of entities;NER", "primary_area": "datasets and benchmarks", "supplementary_material": "/attachment/d5e1e45eb895a73a8684f5d8ac14bc25d41f4eb5.zip", "author": "Himanshu Gupta;Shreyas Verma;Santosh Mashetty;Swaroop Mishra", "authorids": "~Himanshu_Gupta5;~Shreyas_Verma1;~Santosh_Mashetty1;~Swaroop_Mishra1", "gender": "M;M;M;M", "homepage": "https://him1411.github.io;;;https://swarooprm.github.io/", "dblp": ";;;249/2784", "google_scholar": "ydjuhxsAAAAJ;j6dIihMAAAAJ;eQN-aNAAAAAJ;-7LK2SwAAAAJ", "orcid": ";;;", "linkedin": "himanshugupta14/;shreyas-verma/;santoshmashetty/;", "or_profile": "~Himanshu_Gupta5;~Shreyas_Verma1;~Santosh_Mashetty1;~Swaroop_Mishra1", "aff": "Amazon;Simplr AI;Arizona State University;Google", "aff_domain": "amazon.com;simplr.ai;asu.edu;google.com", "position": "Researcher;Researcher;PhD student;Researcher", "bibtex": "@misc{\ngupta2024contextner,\ntitle={Context{NER}: Contextual Phrase Generation at Scale},\nauthor={Himanshu Gupta and Shreyas Verma and Santosh Mashetty and Swaroop Mishra},\nyear={2024},\nurl={https://openreview.net/forum?id=4iQuByhNie}\n}", "github": "", "project": "", "reviewers": "btb9;uqH6;kwQd", "site": "https://openreview.net/forum?id=4iQuByhNie", "pdf_size": 648322, "rating": "3;3;6", "confidence": "2;3;4", "soundness": "2;2;3", "contribution": "2;2;2", "presentation": "2;3;3", "wc_summary": "117;67;88", "wc_strengths": "13;17;177", "wc_weaknesses": "279;172;214", "wc_questions": "36;31;2", "wc_review": "445;287;481", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "530;754;451", "reply_reviewers": "0;0;0", "reply_authors": "1;1;1", "rating_avg": [ 4.0, 1.4142135623730951 ], "confidence_avg": [ 3.0, 0.816496580927726 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 90.66666666666667, 20.499322482029065 ], "wc_strengths_avg": [ 69.0, 76.38498979948002 ], "wc_weaknesses_avg": [ 221.66666666666666, 44.01767321832852 ], "wc_questions_avg": [ 23.0, 14.98888477061141 ], "wc_review_avg": [ 404.3333333333333, 84.25886039791634 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 578.3333333333334, 128.3337662330361 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 9, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.8660254037844387, "gs_citation": 11, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10881753058535838737&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "aff_unique_index": "0;1;2;3", "aff_unique_norm": "Amazon;Simplr AI;Arizona State University;Google", "aff_unique_dep": "Amazon.com, Inc.;;;Google", "aff_unique_url": "https://www.amazon.com;https://www.simplr.ai;https://www.asu.edu;https://www.google.com", "aff_unique_abbr": "Amazon;Simplr AI;ASU;Google", "aff_campus_unique_index": "1", "aff_campus_unique": ";Mountain View", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "id": "4j4reehkjZ", "title": "JEN-1: Text-Guided Universal Music Generation with Omnidirectional Diffusion Models", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Music generation has attracted growing interest with the advancement of deep generative models. 
\nHowever, generating music conditioned on textual descriptions, known as text-to-music, remains challenging due to the complexity of musical structures and high sampling rate requirements.\nDespite the task's significance, prevailing generative models exhibit limitations in music quality, computational efficiency, and generalization ability. \nThis paper introduces JEN-1, a universal high-fidelity model for text-to-music generation. \nJEN-1 is a diffusion model incorporating both autoregressive and non-autoregressive training in an end-to-end manner, enabling up to 48kHz high-fidelity stereo music generation. \nThrough multi-task in-context learning, JEN-1 performs various generation tasks including text-guided music generation, music inpainting, and continuation. \nEvaluations demonstrate JEN-1's superior performance over state-of-the-art methods in text-music alignment and music quality while maintaining computational efficiency.\nOur anonymous demo pages are available at https://anonymous.4open.science/w/Jen1-Demo-Page-21D4", "keywords": "multimodal learning;text-to-music;music generation;non-autoregressive", "primary_area": "generative models", "supplementary_material": "", "author": "Peike Li;Boyu Chen;Yao Yao;Yikai Wang;Allen Wang;Alex Wang", "authorids": "~Peike_Li1;~Boyu_Chen3;~Yao_Yao5;~Yikai_Wang2;~Allen_Wang1;~Alex_Wang3", "gender": ";;M;M;M;M", "homepage": ";;https://yaoyao1995.github.io/;https://yikaiw.github.io/;;", "dblp": "251/5626;;07/4410-6;85/9555-1;;", "google_scholar": "dOzTcvwAAAAJ;o5wjqPEAAAAJ;hNO0NdEAAAAJ;MnW5aegAAAAJ;;", "orcid": ";;0000-0001-9887-4301;;;", "linkedin": "peikeli/;boyu-chen-356004236/;yao-yao-6119661b5/;;allen-wang-js/;dr-alex-wang-5a734b44", "or_profile": "~Peike_Li1;~Boyu_Chen3;~Yao_Yao5;~Yikai_Wang2;~Allen_Wang1;~Alex_Wang3", "aff": "Futureverse AI;futureverse;Tsinghua University;Tsinghua University;;Futureverse", "aff_domain": "futureverse.com;futureverse.com;tsinghua.edu.cn;tsinghua.edu.cn;;futureverse.com", "position": "Principal Researcher;Researcher;PhD student;Postdoc;;Principal Researcher", "bibtex": "@misc{\nli2024jen,\ntitle={{JEN}-1: Text-Guided Universal Music Generation with Omnidirectional Diffusion Models},\nauthor={Peike Li and Boyu Chen and Yao Yao and Yikai Wang and Allen Wang and Alex Wang},\nyear={2024},\nurl={https://openreview.net/forum?id=4j4reehkjZ}\n}", "github": "", "project": "", "reviewers": "Yv1M;TQzw;i8hT;seXG", "site": "https://openreview.net/forum?id=4j4reehkjZ", "pdf_size": 399984, "rating": "3;3;3;6", "confidence": "4;5;4;3", "soundness": "2;2;2;2", "contribution": "2;1;2;3", "presentation": "2;1;2;3", "wc_summary": "69;43;186;94", "wc_strengths": "64;54;71;37", "wc_weaknesses": "251;148;635;92", "wc_questions": "67;38;477;13", "wc_review": "451;283;1369;236", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 3.75, 1.299038105676658 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 2.0, 0.7071067811865476 ], "wc_summary_avg": [ 98.0, 53.91196527673611 ], "wc_strengths_avg": [ 56.5, 12.776932339180638 ], "wc_weaknesses_avg": [ 281.5, 211.91094827780844 ], "wc_questions_avg": [ 148.75, 190.47621242559399 ], "wc_review_avg": [ 584.75, 459.7871110633703 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 
6, 0 ], "corr_rating_confidence": -0.816496580927726, "gs_citation": 43, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=16426015309601482257&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 8, "aff_unique_index": "0;1;2;2;1", "aff_unique_norm": "Futureverse AI;Futureverse;Tsinghua University", "aff_unique_dep": ";;", "aff_unique_url": ";;https://www.tsinghua.edu.cn", "aff_unique_abbr": "Futureverse AI;;THU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;2;2", "aff_country_unique": "United States;;China" }, { "id": "4jBL79L5QS", "title": "Beyond Shortest-Paths: A Benchmark for Reinforcement Learning on Traffic Engineering", "track": "main", "status": "Reject", "tldr": "", "abstract": "Selecting efficient routes for data packets is an essential task in computer networking. Given the dynamic of today\u2019s network traffic, the optimal route varies greatly with the current network state. Despite the wealth of existing techniques, Traffic Engineering in networks with changing conditions is still a largely unsolved problem. Recent work aims at replacing Traffic Engineering heuristics with Reinforcement Learning, but does not provide a reference framework for training and evaluating under realistic network conditions in a reproducible manner. We fill this gap by casting distributed Traffic Engineering as a Swarm Markov Decision Process, and introducing a training and evaluation framework powered by a faithful network simulation engine that implements it. We show the effectiveness and versatility of our framework on a variety of scenarios, including ones where the agents outperform popular shortest-path routing algorithms.", "keywords": "Traffic Engineering;Routing Optimization;Multi-Agent Reinforcement Learning;Benchmark;Framework;Computer Networks", "primary_area": "datasets and benchmarks", "supplementary_material": "", "author": "Andreas Boltres;Niklas Freymuth;Patrick Jahnke;Gerhard Neumann", "authorids": "~Andreas_Boltres1;~Niklas_Freymuth1;~Patrick_Jahnke1;~Gerhard_Neumann2", "gender": ";M;M;M", "homepage": "https://boltr.es;;https://www.linkedin.com/in/patrick-jahnke-dr-ing-332007103/;https://alr.anthropomatik.kit.edu/", "dblp": ";255/7209;;60/4878", "google_scholar": "gltZtVsAAAAJ;FK1DbrcAAAAJ;LswjmU8AAAAJ;https://scholar.google.com.tw/citations?user=GL360kMAAAAJ", "orcid": ";;;", "linkedin": "andreas-boltres-81a989215;;;", "or_profile": "~Andreas_Boltres1;~Niklas_Freymuth1;~Patrick_Jahnke1;~Gerhard_Neumann1", "aff": "Karlsruher Institut f\u00fcr Technologie;Amazon;;Karlsruhe Institute of Technology", "aff_domain": "kit.edu;amazon.com;;kit.edu", "position": "PhD student;Intern;;Full Professor", "bibtex": "@misc{\nboltres2024beyond,\ntitle={Beyond Shortest-Paths: A Benchmark for Reinforcement Learning on Traffic Engineering},\nauthor={Andreas Boltres and Niklas Freymuth and Patrick Jahnke and Gerhard Neumann},\nyear={2024},\nurl={https://openreview.net/forum?id=4jBL79L5QS}\n}", "github": "", "project": "", "reviewers": "XHPP;3jBT;HzR2;Jksb;dSxa", "site": "https://openreview.net/forum?id=4jBL79L5QS", "pdf_size": 5085972, "rating": "3;3;3;3;6", "confidence": "4;4;5;4;3", "soundness": "2;3;2;2;3", "contribution": "1;2;2;2;3", "presentation": "2;2;3;2;3", "wc_summary": "79;53;131;110;74", "wc_strengths": "79;15;133;43;89", "wc_weaknesses": "308;65;543;84;54", "wc_questions": "343;50;174;55;1", "wc_review": "809;183;981;292;218", "wc_reply_reviewers": "0;0;0;0;0", "wc_reply_authors": "895;642;1084;678;127", "reply_reviewers": 
"0;0;0;0;0", "reply_authors": "2;1;2;1;1", "rating_avg": [ 3.6, 1.2 ], "confidence_avg": [ 4.0, 0.6324555320336759 ], "soundness_avg": [ 2.4, 0.4898979485566356 ], "contribution_avg": [ 2.0, 0.6324555320336759 ], "presentation_avg": [ 2.4, 0.4898979485566356 ], "wc_summary_avg": [ 89.4, 27.659356463952665 ], "wc_strengths_avg": [ 71.8, 40.37028610252843 ], "wc_weaknesses_avg": [ 210.8, 190.64459079659198 ], "wc_questions_avg": [ 124.6, 123.14641691904804 ], "wc_review_avg": [ 496.6, 331.6809310165418 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 685.2, 321.4227123275516 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.4, 0.4898979485566356 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.7905694150420948, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:_jPggHSMK20J:scholar.google.com/&scioq=Beyond+Shortest-Paths:+A+Benchmark+for+Reinforcement+Learning+on+Traffic+Engineering&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1;2", "aff_unique_norm": "Karlsruher Institut f\u00fcr Technologie;Amazon;Karlsruhe Institute of Technology", "aff_unique_dep": ";Amazon.com, Inc.;", "aff_unique_url": "https://www.kit.edu;https://www.amazon.com;https://www.kit.edu", "aff_unique_abbr": "KIT;Amazon;KIT", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;0", "aff_country_unique": "Germany;United States" }, { "id": "4kJfWZChJI", "title": "Generalization or Specificity? Spectral Meta Estimation and Ensemble (SMEE) with Domain-specific Experts", "track": "main", "status": "Reject", "tldr": "", "abstract": "Existing domain generalization (DG) methodologies strive to construct a unified model trained on diverse source domains, with the goal of achieving robust performance on any unseen test domain. However, in practice, not all source domains contribute equally to effective knowledge transfer for a specific test domain. Consequently, the reliability of single-model generalization often falls short of classic empirical risk minimization (ERM). This paper departs from the conventional approaches and advocates for a paradigm that prioritizes specificity over broad generalization. We propose the Spectral Meta Estimation and Ensemble (SMEE) approach, which capitalizes on domain-specific expert models and leverages unsupervised ensemble learning to construct a weighted ensemble for test samples. Our comprehensive investigation reveals three key insights: (1) The proposed meta performance estimation strategy for model selection within the sources plays a pivotal role in accommodating stochasticity; (2) The proposed spectral unsupervised ensemble method for transferability estimation excels in constructing robust learners for multi-class classification tasks, while being entirely hyperparameter-free; and (3) Multi-expert test-time transferability estimation and ensemble proves to be a promising alternative to the prevailing single-model DG paradigm. Experiments conducted on the DomainBed benchmark substantiate the superiority of our approach, consistently surpassing state-of-the-art DG techniques. 
Importantly, our approach offers a noteworthy performance enhancement while maintaining remarkable computational efficiency, executing in mere milliseconds per test sample during inference.", "keywords": "Domain Generalization;Ensemble Learning;Spectral Analysis;Test-time Adaptation;Transfer Learning", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "/attachment/2b4a23f22275f78a699f340afea98e7f9431b220.zip", "author": "Siyang Li;Ziwei Wang;Dongrui Wu", "authorids": "~Siyang_Li5;~Ziwei_Wang5;~Dongrui_Wu1", "gender": "M;F;M", "homepage": ";https://scholar.google.com/citations?user=fjlXqvQAAAAJ&hl=en;https://sites.google.com/site/drwuhust/home", "dblp": ";;", "google_scholar": "5GFZxIkAAAAJ;fjlXqvQAAAAJ;UYGzCPEAAAAJ", "orcid": ";0000-0003-1324-2298;0000-0002-7153-9703", "linkedin": ";;", "or_profile": "~Siyang_Li5;~Ziwei_Wang5;~Dongrui_Wu1", "aff": "Huazhong University of Science and Technology;Huazhong University of Science and Technology;Huazhong University of Science and Technology", "aff_domain": "hust.edu.cn;hust.edu.cn;hust.edu.cn", "position": "PhD student;PhD student;Full Professor", "bibtex": "@misc{\nli2024generalization,\ntitle={Generalization or Specificity? Spectral Meta Estimation and Ensemble ({SMEE}) with Domain-specific Experts},\nauthor={Siyang Li and Ziwei Wang and Dongrui Wu},\nyear={2024},\nurl={https://openreview.net/forum?id=4kJfWZChJI}\n}", "github": "", "project": "", "reviewers": "52us;X4Bt;ExFD;6gJi", "site": "https://openreview.net/forum?id=4kJfWZChJI", "pdf_size": 2213079, "rating": "1;5;6;8", "confidence": "5;3;4;4", "soundness": "2;3;3;4", "contribution": "1;2;3;4", "presentation": "3;3;3;4", "wc_summary": "104;53;81;76", "wc_strengths": "33;41;187;79", "wc_weaknesses": "281;62;194;52", "wc_questions": "164;2;126;4", "wc_review": "582;158;588;211", "wc_reply_reviewers": "1386;0;0;0", "wc_reply_authors": "3201;1186;1251;885", "reply_reviewers": "3;0;0;0", "reply_authors": "5;2;2;2", "rating_avg": [ 5.0, 2.5495097567963922 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 2.5, 1.118033988749895 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 78.5, 18.117670931993437 ], "wc_strengths_avg": [ 85.0, 61.40032573203501 ], "wc_weaknesses_avg": [ 147.25, 95.41324593577141 ], "wc_questions_avg": [ 74.0, 72.26340706055866 ], "wc_review_avg": [ 384.75, 201.13599255230278 ], "wc_reply_reviewers_avg": [ 346.5, 600.1556048226159 ], "wc_reply_authors_avg": [ 1630.75, 917.0388146092836 ], "reply_reviewers_avg": [ 0.75, 1.299038105676658 ], "reply_authors_avg": [ 2.75, 1.299038105676658 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.5547001962252291, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:rjgNhRqq1t4J:scholar.google.com/&scioq=Generalization+or+Specificity%3F+Spectral+Meta+Estimation+and+Ensemble+(SMEE)+with+Domain-specific+Experts&hl=en&as_sdt=0,10", "gs_version_total": 0, "aff_unique_index": "0;0;0", "aff_unique_norm": "Huazhong University of Science and Technology", "aff_unique_dep": "", "aff_unique_url": "http://www.hust.edu.cn", "aff_unique_abbr": "HUST", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "China" }, { "title": "Pessimistic Nonlinear Least-Squares Value Iteration for Offline Reinforcement Learning", "status": "Poster", "track": "main", "site": 
"https://iclr.cc/virtual/2024/poster/19449", "id": "4kLVvIh8cp", "author_site": "Qiwei Di, Heyang Zhao, Jiafan He, Quanquan Gu", "tldr": "", "abstract": "Offline reinforcement learning (RL), where the agent aims to learn the optimal policy based on the data collected by a behavior policy, has attracted increasing attention in recent years. While offline RL with linear function approximation has been extensively studied with optimal results achieved under certain assumptions, many works shift their interest to offline RL with non-linear function approximation.\nHowever, limited works on offline RL with non-linear function approximation have instance-dependent regret guarantees.\n In this paper, we propose an oracle-efficient algorithm, dubbed Pessimistic Nonlinear Least-Square Value Iteration (PNLSVI), for offline RL with non-linear function approximation. Our algorithmic design comprises three innovative components: (1) a variance-based weighted regression scheme that can be applied to a wide range of function classes, (2) a subroutine for variance estimation, and (3) a planning phase that utilizes a pessimistic value iteration approach. Our algorithm enjoys a regret bound that has a tight dependency on the function class complexity and achieves minimax optimal instance-dependent regret when specialized to linear function approximation. Our work extends the previous instance-dependent results within simpler function classes, such as linear and differentiable function to a more general framework. To the best of our knowledge, this is the first statistically optimal algorithm for nonlinear offline RL.", "keywords": "Offline reinforcement learning;instance-dependent;least-squares value iteration", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Qiwei Di;Heyang Zhao;Jiafan He;Quanquan Gu", "authorids": "~Qiwei_Di1;~Heyang_Zhao1;~Jiafan_He1;~Quanquan_Gu1", "gender": "M;M;M;M", "homepage": "https://qiwei-di1234.github.io/;https://web.cs.ucla.edu/~hyzhao/;https://sites.google.com/g.ucla.edu/jiafan-he-homepage;http://web.cs.ucla.edu/~qgu/", "dblp": "354/3878;;214/5785;50/4597", "google_scholar": "SewL0pkAAAAJ;zHQ1ap0AAAAJ;F3AXNBwAAAAJ;GU9HgNAAAAAJ", "orcid": ";;;", "linkedin": "qiwei-di-00776a253/;;;", "or_profile": "~Qiwei_Di1;~Heyang_Zhao1;~Jiafan_He1;~Quanquan_Gu1", "aff": "University of California, Los Angeles;Computer Science Department, University of California, Los Angeles;University of California, Los Angeles;University of California, Los Angeles", "aff_domain": "ucla.edu;cs.ucla.edu;ucla.edu;cs.ucla.edu", "position": "PhD student;PhD student;PhD student;Associate Professor", "bibtex": "@inproceedings{\ndi2024pessimistic,\ntitle={Pessimistic Nonlinear Least-Squares Value Iteration for Offline Reinforcement Learning},\nauthor={Qiwei Di and Heyang Zhao and Jiafan He and Quanquan Gu},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=4kLVvIh8cp}\n}", "github": "", "project": "", "reviewers": "38or;Fsc5;KfKk;FxDp", "pdf_size": 522660, "rating": "5;6;6;8", "confidence": "3;3;4;3", "soundness": "2;3;3;4", "contribution": "2;3;2;3", "presentation": "3;4;2;3", "wc_summary": "41;51;98;174", "wc_strengths": "51;38;102;57", "wc_weaknesses": "125;81;108;144", "wc_questions": "63;55;5;55", "wc_review": "280;225;313;430", "wc_reply_reviewers": "0;9;0;0", "wc_reply_authors": "594;580;446;419", "reply_reviewers": "0;1;0;0", "reply_authors": "3;2;1;1", "rating_avg": [ 6.25, 1.0897247358851685 
], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 91.0, 52.53094326204318 ], "wc_strengths_avg": [ 62.0, 24.093567606313517 ], "wc_weaknesses_avg": [ 114.5, 23.157072353818823 ], "wc_questions_avg": [ 44.5, 23.038012067016545 ], "wc_review_avg": [ 312.0, 75.0299940023988 ], "wc_reply_reviewers_avg": [ 2.25, 3.897114317029974 ], "wc_reply_authors_avg": [ 509.75, 77.99479149276571 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.75, 0.82915619758885 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.13245323570650439, "gs_citation": 9, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=13706149271000326202&as_sdt=5,24&sciodt=0,24&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=4kLVvIh8cp", "pdf": "https://openreview.net/pdf?id=4kLVvIh8cp", "email": "ucla.edu;cs.ucla.edu;ucla.edu;cs.ucla.edu", "author_num": 4, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "University of California, Los Angeles", "aff_unique_dep": "", "aff_unique_url": "https://www.ucla.edu", "aff_unique_abbr": "UCLA", "aff_campus_unique_index": "0;0;0;0", "aff_campus_unique": "Los Angeles", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "id": "4l4Gfc1B6E", "title": "Offline Robustness of Distributional Actor-Critic Ensemble Reinforcement Learning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Offline reinforcement learning (RL) focuses on learning policies using static datasets without further exploration. With the introduction of distributional reinforcement learning into offline RL, current methods excel at quantifying the risk and ensuring the security of learned policies. However, these algorithms can not effectively balance the distribution shift and robustness, and even a minor perturbation in observations can significantly impair policy performance. In this paper, we propose Offline Robustness of Distributional actor-critic Ensemble Reinforcement Learning (ORDER) to improve the robustness of policies. In ORDER, we introduce two approaches to enhance the robustness: i) introduce the smoothing technique to policies and distribution functions for states near the dataset; ii) strengthen the quantile network. In addition to improving the robustness, we also theoretically prove that ORDER converges to a conservative lower bound, which can alleviate the distribution shift. 
In our experiments, we validate the effectiveness of ORDER in the D4RL benchmark through comparative experiments and ablation studies.", "keywords": "Offline reinforcement learning;Distributional reinforcement learning;Robustness", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Zhongcui Ma;Jianxiang Zhu;Dandan Lai;Zhiyuan Xu;Jian Tang;Yangchun Zhang;Yan Peng;Yaxin Peng", "authorids": "~Zhongcui_Ma1;~Jianxiang_Zhu1;~Dandan_Lai1;~Zhiyuan_Xu1;~Jian_Tang5;~Yangchun_Zhang1;~Yan_Peng3;~Yaxin_Peng1", "gender": ";M;;M;M;;F;F", "homepage": "https://www.mdmlab-shu.com/author/zhongcui-ma/;;https://www.mdmlab-shu.com/author/dandan-lai/;https://xuzhiyuan1528.github.io/;https://ecs.syr.edu/faculty/tang;;;https://www.mdmlab-shu.com/author/yaxin-peng/", "dblp": ";;;;181/2667-8;https://dblp.uni-trier.de/pid/324/8512;00/2434-1;20/7643.html", "google_scholar": ";;https://scholar.google.com.hk/citations?user=JoM-YngAAAAJ;jKHMVnYAAAAJ;;https://scholar.google.com.hk/citations?user=CjY56LgAAAAJ;boOwRJUAAAAJ;https://scholar.google.com.hk/citations?user=4cRt3XoAAAAJ", "orcid": "0009-0005-9495-5936;0009-0003-2855-5710;0009-0002-1881-4064;0000-0003-2879-3244;;0000-0002-0540-9070;0000-0003-1312-9527;0000-0002-2983-555X", "linkedin": ";;;zhiyuan-xu-19a66191;;;;", "or_profile": "~Zhongcui_Ma1;~Jianxiang_Zhu1;~Dandan_Lai1;~Zhiyuan_Xu1;~Jian_Tang5;~Yangchun_Zhang1;~Yan_Peng3;~Yaxin_Peng1", "aff": "Shanghai University;Shanghai University;Shanghai University;Midea;x-humanoid;Shanghai University;Shanghai University;Shanghai University", "aff_domain": "shu.edu.cn;shu.edu.cn;shu.edu.cn;midea.com;x-humanoid.com;shu.edu.cn;shu.edu.cn;shu.edu.cn", "position": "MS student;MS student;PhD student;Researcher;Researcher;Lecturer;dean;Full Professor", "bibtex": "@misc{\nma2024offline,\ntitle={Offline Robustness of Distributional Actor-Critic Ensemble Reinforcement Learning},\nauthor={Zhongcui Ma and Jianxiang Zhu and Dandan Lai and Zhiyuan Xu and Jian Tang and Yangchun Zhang and Yan Peng and Yaxin Peng},\nyear={2024},\nurl={https://openreview.net/forum?id=4l4Gfc1B6E}\n}", "github": "", "project": "", "reviewers": "kZn3;fvaB;1eAG;cjFe", "site": "https://openreview.net/forum?id=4l4Gfc1B6E", "pdf_size": 1374788, "rating": "3;3;3;5", "confidence": "3;4;3;3", "soundness": "2;2;3;2", "contribution": "2;2;2;2", "presentation": "2;3;2;2", "wc_summary": "39;66;86;105", "wc_strengths": "43;30;39;65", "wc_weaknesses": "272;201;170;72", "wc_questions": "91;4;60;51", "wc_review": "445;301;355;293", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "169;772;292;211", "reply_reviewers": "0;0;0;0", "reply_authors": "1;2;1;1", "rating_avg": [ 3.5, 0.8660254037844386 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 74.0, 24.464259645450134 ], "wc_strengths_avg": [ 44.25, 12.871965661856 ], "wc_weaknesses_avg": [ 178.75, 71.87271735505762 ], "wc_questions_avg": [ 51.5, 31.18092365533773 ], "wc_review_avg": [ 348.5, 60.60321773635456 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 361.0, 241.3741908324086 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 9, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": -0.3333333333333333, "gs_citation": 0, "gs_cited_by_link": 
"https://scholar.google.com/scholar?q=related:N3DyagCY-bIJ:scholar.google.com/&scioq=Offline+Robustness+of+Distributional+Actor-Critic+Ensemble+Reinforcement+Learning&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;0;1;2;0;0;0", "aff_unique_norm": "Shanghai University;Midea Group;x-humanoid", "aff_unique_dep": ";;", "aff_unique_url": "https://www.shu.edu.cn;https://www.midea.com;", "aff_unique_abbr": "SHU;Midea;", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0;0", "aff_country_unique": "China;" }, { "id": "4lOWCkhr4g", "title": "Unsupervised ASR via Cross-Lingual Pseudo-Labeling", "track": "main", "status": "Reject", "tldr": "", "abstract": "Recent work has shown that it is possible to train an *unsupervised* automatic speech recognition (ASR) system using only unpaired audio and text. Existing unsupervised ASR methods assume that no labeled data can be used for training. \nWe argue that even if one does not have any labeled audio for a given language, there is *always* labeled data available for other languages. We show that it is possible to use character-level acoustic models (AMs) from other languages to bootstrap an *unsupervised* AM in a new language. Here, ``unsupervised'' means no labeled audio is available for the *target* language. Our approach is based on two key ingredients: (i) generating pseudo-labels (PLs) of the *target* language using some *other* language AM and (ii) constraining these PLs with a *target language model*. Our approach is effective on Common Voice: e.g. transfer of English AM to Swahili achieves 18\\% WER. It also outperforms character-based wav2vec-U 2.0 by 15\\% absolute WER on LJSpeech with 800h of labeled German data instead of 60k hours of unlabeled English data.", "keywords": "ASR;pseudo-labeling;self-training;unsupervised learning;multilingual", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Tatiana Likhomanenko;Loren Lugosch;Ronan Collobert", "authorids": "~Tatiana_Likhomanenko1;~Loren_Lugosch1;~Ronan_Collobert1", "gender": "F;M;M", "homepage": "https://github.com/tlikhomanenko/tlikhomanenko;http://lorenlugosch.com;http://ronan.collobert.com", "dblp": "202/2094;;03/4032", "google_scholar": "https://scholar.google.ru/citations?user=x7Z3ysQAAAAJ;https://scholar.google.ca/citations?user=xTvZgeoAAAAJ;32w7x1cAAAAJ", "orcid": "0000-0003-0351-9839;;", "linkedin": ";;", "or_profile": "~Tatiana_Likhomanenko1;~Loren_Lugosch1;~Ronan_Collobert1", "aff": "Apple;Apple;Apple", "aff_domain": "apple.com;apple.com;apple.com", "position": "Research Scientist;Researcher;Research Scientist", "bibtex": "@misc{\nlikhomanenko2024unsupervised,\ntitle={Unsupervised {ASR} via Cross-Lingual Pseudo-Labeling},\nauthor={Tatiana Likhomanenko and Loren Lugosch and Ronan Collobert},\nyear={2024},\nurl={https://openreview.net/forum?id=4lOWCkhr4g}\n}", "github": "", "project": "", "reviewers": "26fF;GYQT;mAuZ;UAMi", "site": "https://openreview.net/forum?id=4lOWCkhr4g", "pdf_size": 606406, "rating": "3;6;6;6", "confidence": "5;4;5;4", "soundness": "3;3;3;3", "contribution": "2;2;3;2", "presentation": "3;3;3;3", "wc_summary": "130;65;80;110", "wc_strengths": "39;58;43;67", "wc_weaknesses": "151;117;84;100", "wc_questions": "305;67;108;63", "wc_review": "625;307;315;340", "wc_reply_reviewers": "0;47;0;0", "wc_reply_authors": "1022;738;535;454", "reply_reviewers": "0;1;0;0", "reply_authors": "2;2;1;2", "rating_avg": [ 
5.25, 1.299038105676658 ], "confidence_avg": [ 4.5, 0.5 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 96.25, 25.341418665891617 ], "wc_strengths_avg": [ 51.75, 11.299889379989523 ], "wc_weaknesses_avg": [ 113.0, 24.849547279578356 ], "wc_questions_avg": [ 135.75, 99.29092355296127 ], "wc_review_avg": [ 396.75, 132.3411783988642 ], "wc_reply_reviewers_avg": [ 11.75, 20.351596988934308 ], "wc_reply_authors_avg": [ 687.25, 219.21379404590397 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.75, 0.4330127018922193 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5082035048589856528&as_sdt=40005&sciodt=0,10&hl=en", "gs_version_total": 3, "aff_unique_index": "0;0;0", "aff_unique_norm": "Apple", "aff_unique_dep": "Apple Inc.", "aff_unique_url": "https://www.apple.com", "aff_unique_abbr": "Apple", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "4lqA5EuieJ", "title": "Prediction Tasks in Graphs: a Framework to Control the Interpretability-Performance Trade-off", "track": "main", "status": "Reject", "tldr": "", "abstract": "Graph Neural Networks (GNNs) have emerged as state-of-the-art methods for solving graph-level tasks in diverse domains, such as social network analysis and bioinformatics. However, their complex nature results in a lack of human-interpretable predictions, which can hinder their practical impact. Here, we aim at improving GNN interpretability by targeting \\emph{sparsity} during GNN training - i.e, by minimizing the size (and/or number) of subgraphs used to make predictions. Existing solutions in the literature suffer from two main limitations: i) they still rely on information about the entire graph; and/or ii) they do not allow practitioners to directly control the trade-off between predictive performance and sparsity. To address the above limitations, in this paper, we formulate GNN training as a bi-level optimization task, where the trade-off between interpretability and performance can be controlled by a hyperparameter. Our framework relies on reinforcement learning to iteratively maximize predictive performance and sparsity by removing edges or nodes from the input graph. 
Our empirical results on nine different graph classification datasets show that our method competes in performance with baselines that use information from the whole graph, while relying on significantly sparser subgraphs, leading to more interpretable GNN-based predictions.", "keywords": "Graph Neural Networks; Reinforcement Learning; Graph-level tasks; Interpretability", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/afda2ebb66f1110447b93c944294dc98681a4b55.zip", "author": "Pablo Sanchez Martin;Kinaan Aamir Khan;Isabel Valera", "authorids": "~Pablo_Sanchez_Martin1;~Kinaan_Aamir_Khan1;~Isabel_Valera1", "gender": "M;M;F", "homepage": "https://www.is.mpg.de/person/psanchez;;https://ivaleram.github.io/", "dblp": ";;126/1768.html", "google_scholar": ";https://scholar.google.com/citations?hl=en;https://scholar.google.es/citations?user=cpdQqpsAAAAJ", "orcid": ";;", "linkedin": ";kinaanaamir/;", "or_profile": "~Pablo_Sanchez_Martin1;~Kinaan_Aamir_Khan1;~Isabel_Valera1", "aff": "Max-Planck Institute;Universit\u00e4t des Saarlandes;Universit\u00e4t des Saarlandes", "aff_domain": "mpg.tuebingen.de;uni-saarland.de;uni-saarland.de", "position": "PhD student;MS student;Full Professor", "bibtex": "@misc{\nmartin2024prediction,\ntitle={Prediction Tasks in Graphs: a Framework to Control the Interpretability-Performance Trade-off},\nauthor={Pablo Sanchez Martin and Kinaan Aamir Khan and Isabel Valera},\nyear={2024},\nurl={https://openreview.net/forum?id=4lqA5EuieJ}\n}", "github": "", "project": "", "reviewers": "CKsQ;Zge8;X2ML;CD1o", "site": "https://openreview.net/forum?id=4lqA5EuieJ", "pdf_size": 1371205, "rating": "3;5;5;6", "confidence": "3;4;4;2", "soundness": "3;3;3;3", "contribution": "2;2;2;3", "presentation": "3;3;2;3", "wc_summary": "33;100;58;62", "wc_strengths": "39;51;77;52", "wc_weaknesses": "377;138;197;164", "wc_questions": "3;5;37;42", "wc_review": "452;294;369;320", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.75, 1.0897247358851685 ], "confidence_avg": [ 3.25, 0.82915619758885 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 63.25, 23.951774464536026 ], "wc_strengths_avg": [ 54.75, 13.827056809024834 ], "wc_weaknesses_avg": [ 219.0, 93.58685805175853 ], "wc_questions_avg": [ 21.75, 17.851820635442202 ], "wc_review_avg": [ 358.75, 60.197072187939504 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 6, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.20751433915982243, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:oooGi4-WIp4J:scholar.google.com/&scioq=Prediction+Tasks+in+Graphs:+a+Framework+to+Control+the+Interpretability-Performance+Trade-off&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1;1", "aff_unique_norm": "Max-Planck-Gesellschaft zur F\u00f6rderung der Wissenschaften e.V.;Universit\u00e4t des Saarlandes", "aff_unique_dep": ";", "aff_unique_url": "https://www.mpg.de;https://www.uni-saarland.de", "aff_unique_abbr": "MPG;UDS", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "Germany" }, { "id": "4lqo5Jwfnq", "title": "Class-Incremental Learning with 
Parameter-Efficient Cross-Task Prompts", "track": "main", "status": "Reject", "tldr": "", "abstract": "Class-Incremental Learning (CIL) aims to learn deep models on sequential tasks continually, where each new task includes a batch of new classes and deep models do not have access to task-ID information at the inference time. Recent vast pre-trained models (PTMs) have achieved outstanding performance by prompt technique in practical CIL without the old samples (rehearsal-free) and with a memory constraint (memory-constrained): Prompt-extending and Prompt-fixed methods. However, prompt-extending methods need a large memory buffer to maintain an ever-expanding prompt pool and meet an extra challenging prompt selection problem. Prompt-fixed methods only learn a fixed number of prompts on one of the incremental tasks and can not handle all the incremental tasks effectively. To achieve a good balance between the memory cost and the performance on all the tasks, we propose a Parameter-Efficient Cross-Task Prompt (PECTP) framework with a prompt retention module (PRM). To make the final learned prompts effective on the whole incremental tasks, PRM constrains the evolution of cross-task prompts' parameters from Outer Prompt Granularity and Inner Prompt Granularity. Extensive experiments show the effectiveness of our method.", "keywords": "Class-Incremental Learning; Pre-Trained Model; Prompt Learning", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "/attachment/bba64007710d77a6ceac489214c46e9ae4f36546.zip", "author": "qian feng;Hanbin Zhao;Chao Zhang;Hui Qian", "authorids": "~qian_feng1;~Hanbin_Zhao1;~Chao_Zhang19;~Hui_Qian1", "gender": ";M;M;M", "homepage": "https://github.com/RAIAN08;;;", "dblp": ";222/7871;94/3019-29;66/5293", "google_scholar": ";F2kiw10AAAAJ;;", "orcid": ";;;", "linkedin": ";;;", "or_profile": "~qian_feng1;~Hanbin_Zhao1;~Chao_Zhang19;~Hui_Qian1", "aff": "Zhejiang University;Zhejiang University;Zhejiang University;Zhejiang University", "aff_domain": "zju.edu.cn;zju.edu.cn;zju.edu.cn;zju.edu.cn", "position": "PhD student;Assistant Professor;Assistant Professor;Full Professor", "bibtex": "@misc{\nfeng2024classincremental,\ntitle={Class-Incremental Learning with Parameter-Efficient Cross-Task Prompts},\nauthor={qian feng and Hanbin Zhao and Chao Zhang and Hui Qian},\nyear={2024},\nurl={https://openreview.net/forum?id=4lqo5Jwfnq}\n}", "github": "", "project": "", "reviewers": "2DHh;9kbr;vcUE", "site": "https://openreview.net/forum?id=4lqo5Jwfnq", "pdf_size": 769382, "rating": "3;5;6", "confidence": "5;3;5", "soundness": "2;2;3", "contribution": "2;3;3", "presentation": "2;3;2", "wc_summary": "41;65;42", "wc_strengths": "16;35;114", "wc_weaknesses": "159;276;207", "wc_questions": "3;30;7", "wc_review": "219;406;370", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "1913;2158;1372", "reply_reviewers": "0;0;0", "reply_authors": "4;5;3", "rating_avg": [ 4.666666666666667, 1.247219128924647 ], "confidence_avg": [ 4.333333333333333, 0.9428090415820634 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 49.333333333333336, 11.08552609887726 ], "wc_strengths_avg": [ 55.0, 42.43426288586461 ], "wc_weaknesses_avg": [ 214.0, 48.02082881417188 ], "wc_questions_avg": [ 13.333333333333334, 11.897712198383164 ], "wc_review_avg": [ 331.6666666666667, 81.01165896887244 ], 
"wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 1814.3333333333333, 328.3801997008278 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 4.0, 0.816496580927726 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.18898223650461363, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:ACthZbY0vNkJ:scholar.google.com/&scioq=Class-Incremental+Learning+with+Parameter-Efficient+Cross-Task+Prompts&hl=en&as_sdt=0,44", "gs_version_total": 0, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "Zhejiang University", "aff_unique_dep": "", "aff_unique_url": "https://www.zju.edu.cn", "aff_unique_abbr": "ZJU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "China" }, { "id": "4nyTlyTtfX", "title": "Heterogeneous Decision Making towards Mixed Autonomy: When Uncertainty-aware Planning Meets Bounded Rationality", "track": "main", "status": "Reject", "tldr": "", "abstract": "The past few years have witnessed a rapid growth of the deployment of automated vehicles (AVs). Clearly,\nAVs and human-driven vehicles (HVs) will co-exist for many years to come, and AVs will have to operate around HVs, pedestrians, cyclists, and more, calling for fundamental breakthroughs in AI designed for mixed traffic to achieve mixed autonomy. Thus motivated, we study heterogeneous decision making by AVs and HVs in a mixed traffic environment, aiming to capture the interactions between human and machine decision-making and develop an AI foundation that enables vehicles to operate safely and efficiently. There are a number of challenges to achieve mixed autonomy, including 1) humans drivers make driving decisions with bounded rationality, and it remains open to develop accurate models for HVs' decision making; and 2) uncertainty-aware planning plays a critical role for AVs to take safety maneuvers in response to the human behavior. In this paper, we introduce a formulation of AV-HV interaction, where the HV makes decisions with bounded rationality and the AV employs uncertainty-aware planning based on the prediction on HV's future actions. We conduct a comprehensive analysis on AV and HV's learning regret to answer the questions: 1) \\\"How does the overall learning performance depend on HV's bounded rationality and Av's planning?\"; 2) \"How do different decision making strategies impact the overall learning performance?\" Our findings reveal some intriguing phenomena, such as Goodhart's Law in AV's learning performance and compounding effects in HV's decision making process. 
By examining the dynamics of the regrets, we gain insights into the interplay between human and machine decision making in mixed autonomy.", "keywords": "Mixed Autonomy;Reinforcement Learning;Bounded Rationality;Regret Analysis", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Hang Wang;Qiaoyi Fang;Junshan Zhang", "authorids": "~Hang_Wang2;~Qiaoyi_Fang1;~Junshan_Zhang1", "gender": "M;;M", "homepage": "https://ustcmike.github.io/;https://github.com/fangqyi;https://faculty.engineering.ucdavis.edu/jzhang/", "dblp": ";;59/1232.html", "google_scholar": "Xdb3u_q3RKwC;;UtAdFs8AAAAJ", "orcid": ";;", "linkedin": ";;", "or_profile": "~Hang_Wang2;~Qiaoyi_Fang1;~Junshan_Zhang1", "aff": "University of California, Davis;University of California, Davis;University of California, Davis", "aff_domain": "ucdavis.edu;ucdavis.edu;ucdavis.edu", "position": "PhD student;PhD student;Full Professor", "bibtex": "@misc{\nwang2024heterogeneous,\ntitle={Heterogeneous Decision Making towards Mixed Autonomy: When Uncertainty-aware Planning Meets Bounded Rationality},\nauthor={Hang Wang and Qiaoyi Fang and Junshan Zhang},\nyear={2024},\nurl={https://openreview.net/forum?id=4nyTlyTtfX}\n}", "github": "", "project": "", "reviewers": "Sgxf;dAQk;BMkw;DRuU", "site": "https://openreview.net/forum?id=4nyTlyTtfX", "pdf_size": 611295, "rating": "3;3;5;6", "confidence": "2;3;2;2", "soundness": "1;1;3;3", "contribution": "2;1;3;2", "presentation": "2;2;2;4", "wc_summary": "87;108;82;95", "wc_strengths": "46;195;35;111", "wc_weaknesses": "117;624;102;114", "wc_questions": "183;86;10;16", "wc_review": "433;1013;229;336", "wc_reply_reviewers": "0;1071;50;0", "wc_reply_authors": "1357;3118;369;998", "reply_reviewers": "0;4;1;0", "reply_authors": "3;8;2;4", "rating_avg": [ 4.25, 1.299038105676658 ], "confidence_avg": [ 2.25, 0.4330127018922193 ], "soundness_avg": [ 2.0, 1.0 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 2.5, 0.8660254037844386 ], "wc_summary_avg": [ 93.0, 9.82344135219425 ], "wc_strengths_avg": [ 96.75, 63.72744699107285 ], "wc_weaknesses_avg": [ 239.25, 222.20640742336843 ], "wc_questions_avg": [ 73.75, 69.79389299931621 ], "wc_review_avg": [ 502.75, 303.30049043811323 ], "wc_reply_reviewers_avg": [ 280.25, 456.99582875558065 ], "wc_reply_authors_avg": [ 1460.5, 1020.2079444897496 ], "reply_reviewers_avg": [ 1.25, 1.6393596310755 ], "reply_authors_avg": [ 4.25, 2.277608394786075 ], "replies_avg": [ 31, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.5555555555555555, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:-f77RWILAWcJ:scholar.google.com/&scioq=Heterogeneous+Decision+Making+towards+Mixed+Autonomy:+When+Uncertainty-aware+Planning+Meets+Bounded+Rationality&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;0;0", "aff_unique_norm": "University of California, Davis", "aff_unique_dep": "", "aff_unique_url": "https://www.ucdavis.edu", "aff_unique_abbr": "UC Davis", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Davis", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "title": "DREAM: Dual Structured Exploration with Mixup for Open-set Graph Domain Adaption", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19448", "id": "4olqbTBt1Y", "author_site": "Nan Yin, Mengzhu Wang, Zhenghan Chen, Li Shen, Huan Xiong, Bin Gu, Xiao Luo", "tldr": "", "abstract": "Recently, numerous graph neural network methods have been developed to 
tackle domain shifts in graph data. However, these methods presuppose that unlabeled target graphs belong to categories previously seen in the source domain. This assumption could not hold true for in-the-wild target graphs. In this paper, we delve deeper to explore a more realistic problem open-set graph domain adaptation. Our objective is to not only identify target graphs from new categories but also accurately classify remaining target graphs into their respective categories under domain shift and label scarcity. To solve this challenging problem, we introduce a new method named Dual Structured Exploration with Mixup (DREAM). DREAM incorporates a graph-level representation learning branch as well as a subgraph-enhanced branch, which jointly explores graph topological structures from both global and local viewpoints. To maximize the use of unlabeled target graphs, we train these two branches simultaneously using posterior regularization to enhance their inter-module consistency. To accommodate the open-set setting, we amalgamate dissimilar samples to generate virtual unknown samples belonging to novel classes. Moreover, to alleviate domain shift, we establish a k nearest neighbor-based graph-of-graphs and blend multiple neighbors of each sample to produce cross-domain virtual samples for inter-domain consistency learning. Extensive experiments validate the effectiveness of the proposed DREAM in comparison to various state-of-the-art approaches in different settings.", "keywords": "Open-set Recognization;Graph Classification;Domain Adaptation", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Nan Yin;Mengzhu Wang;Zhenghan Chen;Li Shen;Huan Xiong;Bin Gu;Xiao Luo", "authorids": "~Nan_Yin4;~Mengzhu_Wang3;~Zhenghan_Chen3;~Li_Shen1;~Huan_Xiong1;~Bin_Gu1;~Xiao_Luo3", "gender": "M;;;M;M;M;M", "homepage": ";;;https://sites.google.com/site/mathshenli/home;https://scholar.google.com/citations?user=l4hm14MAAAAJ&hl=en;https://mbzuai.ac.ae/study/faculty/bin-gu/;http://luoxiao12.github.io", "dblp": "135/8983;;;91/3680-8;;29/1758-1;50/1585-1", "google_scholar": "https://scholar.google.com.hk/citations?user=NoOK0pIAAAAJ;;;yVhgENIAAAAJ;l4hm14MAAAAJ;Vo8OgCgAAAAJ;https://scholar.google.com.hk/citations?", "orcid": ";;;;;0000-0001-6049-1815;", "linkedin": "yin-nan-b32943173;;;;;;%E9%9C%84-%E7%BD%97-303548214/", "or_profile": "~Nan_Yin4;~Mengzhu_Wang3;~Zhenghan_Chen3;~Li_Shen1;~Huan_Xiong1;~Bin_Gu1;~Xiao_Luo3", "aff": "Mohamed bin Zayed University of Artificial Intelligence;;;JD Explore Academy;Harbin Institute of Technology;Mohamed bin Zayed University of Artificial Intelligence;University of California, Los Angeles", "aff_domain": "mbzuai.ac.ae;;;jd.com;hit.edu.cn;mbzuai.ac.ae;cs.ucla.edu", "position": "Postdoc;;;Researcher;Full Professor;Assistant Professor;Postdoc", "bibtex": "@inproceedings{\nyin2024dream,\ntitle={{DREAM}: Dual Structured Exploration with Mixup for Open-set Graph Domain Adaption},\nauthor={Nan Yin and Mengzhu Wang and Zhenghan Chen and Li Shen and Huan Xiong and Bin Gu and Xiao Luo},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=4olqbTBt1Y}\n}", "github": "", "project": "", "reviewers": "qwA4;Pqqy;ysQV;9UFe;SVBJ", "pdf_size": 5099568, "rating": "3;5;8;8;8", "confidence": "4;3;4;4;4", "soundness": "2;2;4;3;3", "contribution": "2;2;4;3;3", "presentation": "2;2;4;3;3", "wc_summary": "78;58;204;91;34", 
"wc_strengths": "45;20;396;167;27", "wc_weaknesses": "231;114;75;43;35", "wc_questions": "2;5;32;2;2", "wc_review": "356;197;707;303;98", "wc_reply_reviewers": "97;0;81;31;0", "wc_reply_authors": "1758;738;530;430;187", "reply_reviewers": "1;0;2;1;0", "reply_authors": "5;3;3;3;1", "rating_avg": [ 6.4, 2.0591260281974 ], "confidence_avg": [ 3.8, 0.39999999999999997 ], "soundness_avg": [ 2.8, 0.7483314773547882 ], "contribution_avg": [ 2.8, 0.7483314773547882 ], "presentation_avg": [ 2.8, 0.7483314773547882 ], "wc_summary_avg": [ 93.0, 58.74691481260952 ], "wc_strengths_avg": [ 131.0, 142.86637113050782 ], "wc_weaknesses_avg": [ 99.6, 71.3515241603149 ], "wc_questions_avg": [ 8.6, 11.757550765359253 ], "wc_review_avg": [ 332.2, 207.37540837813918 ], "wc_reply_reviewers_avg": [ 41.8, 40.48407094154441 ], "wc_reply_authors_avg": [ 728.6, 544.3688455450036 ], "reply_reviewers_avg": [ 0.8, 0.7483314773547883 ], "reply_authors_avg": [ 3.0, 1.2649110640673518 ], "replies_avg": [ 28, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": 0.33995005182504257, "gs_citation": 25, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=4463789579044625548&as_sdt=80005&sciodt=0,11&hl=en", "gs_version_total": 2, "openreview": "https://openreview.net/forum?id=4olqbTBt1Y", "pdf": "https://openreview.net/pdf?id=4olqbTBt1Y", "email": "mbzuai.ac.ae;;;jd.com;hit.edu.cn;mbzuai.ac.ae;cs.ucla.edu", "author_num": 7, "aff_unique_index": "0;1;2;0;3", "aff_unique_norm": "Mohamed bin Zayed University of Artificial Intelligence;JD;Harbin Institute of Technology;University of California, Los Angeles", "aff_unique_dep": ";JD Explore Academy;;", "aff_unique_url": "https://mbzuai.ac.ae;;http://www.hit.edu.cn/;https://www.ucla.edu", "aff_unique_abbr": "MBZUAI;;HIT;UCLA", "aff_campus_unique_index": "1;2", "aff_campus_unique": ";Harbin;Los Angeles", "aff_country_unique_index": "0;2;0;3", "aff_country_unique": "United Arab Emirates;;China;United States" }, { "id": "4pW8NL1UwH", "title": "LIRE: Listwise Reward Enhancement for Preference Alignment", "track": "main", "status": "Reject", "tldr": "", "abstract": "Recently, tremendous strides have been made in the domain of Natural Language Generation (NLG) due to the vast advances in Large Language Models (LLMs). However, often trained on large-scale unsupervised data, LLMs can generate toxic or unhelpful content for lack of human supervision. Leveraging reinforcement learning with human feedback (RLHF) turns out a good remedy for this problem and has been prevalent among researchers. However, RLHF is notoriously unstable and hyperparameter-sensitive, which hinders an all-compassing and sustainable LLM system. For the above reason, we propose a new approach: LIRE, which stands for Listwise Reward Enhancement for Preference Alignment, to optimize rewards through a listwise paradigm. We directly incorporate the rewards of multiple candidates into the listwise loss and optimize against it in a compact and effective framework, without explicit modeling of the Bradley-Terry model. Furthermore, we propose a self-enhancement algorithm to progressively optimize the reward through iterative training. 
Our work also entails extensive experiments to demonstrate the stability and consistency of the model performance without heavy hyperparameter tuning, while still surpassing the state-of-the-art methods in preference alignment tasks.", "keywords": "LLM;RLHF;Preference alignment", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Mingye Zhu", "authorids": "~Mingye_Zhu1", "gender": "", "homepage": "https://github.com/stevie1023", "dblp": "", "google_scholar": "", "orcid": "", "linkedin": "", "or_profile": "~Mingye_Zhu1", "aff": "University of Science and Technology of China", "aff_domain": "ustc.edu.cn", "position": "PhD student", "bibtex": "@misc{\nzhu2024lire,\ntitle={{LIRE}: Listwise Reward Enhancement for Preference Alignment},\nauthor={Mingye Zhu},\nyear={2024},\nurl={https://openreview.net/forum?id=4pW8NL1UwH}\n}", "github": "", "project": "", "reviewers": "XkkK;6BAr;Cmfo;Z7nt;Vfn5", "site": "https://openreview.net/forum?id=4pW8NL1UwH", "pdf_size": 942745, "rating": "5;5;5;5;6", "confidence": "3;3;4;3;3", "soundness": "2;2;2;2;3", "contribution": "2;2;2;3;2", "presentation": "3;2;2;2;3", "wc_summary": "280;70;88;186;127", "wc_strengths": "18;102;97;84;71", "wc_weaknesses": "161;165;248;479;94", "wc_questions": "24;23;34;182;1", "wc_review": "483;360;467;931;293", "wc_reply_reviewers": "69;0;0;0;0", "wc_reply_authors": "981;619;848;1166;620", "reply_reviewers": "1;0;0;0;0", "reply_authors": "2;1;2;2;1", "rating_avg": [ 5.2, 0.39999999999999997 ], "confidence_avg": [ 3.2, 0.39999999999999997 ], "soundness_avg": [ 2.2, 0.39999999999999997 ], "contribution_avg": [ 2.2, 0.39999999999999997 ], "presentation_avg": [ 2.4, 0.4898979485566356 ], "wc_summary_avg": [ 150.2, 76.11675242678184 ], "wc_strengths_avg": [ 74.4, 30.19006459085505 ], "wc_weaknesses_avg": [ 229.4, 134.01880465069073 ], "wc_questions_avg": [ 52.8, 65.49320575449028 ], "wc_review_avg": [ 506.8, 223.31896471191155 ], "wc_reply_reviewers_avg": [ 13.8, 27.6 ], "wc_reply_authors_avg": [ 846.8, 211.29637952411773 ], "reply_reviewers_avg": [ 0.2, 0.4000000000000001 ], "reply_authors_avg": [ 1.6, 0.4898979485566356 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 1, 0 ], "corr_rating_confidence": -0.25000000000000006, "gs_citation": 6, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14469823784875334267&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "aff_unique_index": "0", "aff_unique_norm": "University of Science and Technology of China", "aff_unique_dep": "", "aff_unique_url": "http://www.ustc.edu.cn", "aff_unique_abbr": "USTC", "aff_country_unique_index": "0", "aff_country_unique": "China" }, { "id": "4pnhzuRtJ2", "title": "Optimized Tradeoffs for Private Majority Ensembling", "track": "main", "status": "Reject", "tldr": "", "abstract": "We study the problem of computing an $(m\\epsilon, \\delta)$-differentially private majority of $K$ $(\\epsilon, \\Delta)$-differentially private algorithms for $m < K$ and $\\delta \\geq \\Delta \\geq 0$. Standard methods, such as subsampling or randomized response, are widely used but do they provide optimal privacy-utility tradeoffs? Surprisingly, we show that an $(m\\epsilon, \\delta)$-private majority algorithm with maximal utility can be computed tractably for any $m < K$. 
Specifically, we introduce Data-dependent Randomized Response Majority (DaRRM), a general privacy framework characterized by a data-dependent noise function $\\gamma$ that allows for efficient utility optimization over the class of all private algorithms subject to privacy constraints. By deriving a structural understanding of DaRRM, our novel learning approach is made tractable by critically reducing infinitely many privacy constraints into a polynomial set. Theoretically, we show DaRRM enjoys a privacy gain of a factor of 2 over common baselines under i.i.d. teachers and $\\delta = 0$. Lastly, we demonstrate the empirical effectiveness of our first-of-its-kind privacy-constrained utility optimization for ensembling labels and gradients from private teachers through applications of private semi-supervised knowledge transfer and private distributed Sign-SGD, highlighting the outstanding performance of our DaRRM framework with an optimized $\\gamma$ against several baselines.", "keywords": "differential privacy;ensemble learning", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/e3b4b35f51ebae896e00c19c8c75bc25a60f2a7d.pdf", "author": "Shuli Jiang;Qiuyi Zhang;Gauri Joshi", "authorids": "~Shuli_Jiang1;~Qiuyi_Zhang1;~Gauri_Joshi1", "gender": "F;M;", "homepage": "https://www.andrew.cmu.edu/user/shulij/;https://qiuyiz.github.io;", "dblp": "224/6441;133/8559;", "google_scholar": "D0IvR7MAAAAJ;mE11hO8AAAAJ;", "orcid": ";;", "linkedin": ";;", "or_profile": "~Shuli_Jiang1;~Qiuyi_Zhang1;~Gauri_Joshi1", "aff": "Carnegie Mellon University;Google;", "aff_domain": "cmu.edu;google.com;", "position": "PhD student;Researcher;", "bibtex": "@misc{\njiang2024optimized,\ntitle={Optimized Tradeoffs for Private Majority Ensembling},\nauthor={Shuli Jiang and Qiuyi Zhang and Gauri Joshi},\nyear={2024},\nurl={https://openreview.net/forum?id=4pnhzuRtJ2}\n}", "github": "", "project": "", "reviewers": "pyVN;3EZ4;SRCJ;DeQA", "site": "https://openreview.net/forum?id=4pnhzuRtJ2", "pdf_size": 1980631, "rating": "3;3;6;8", "confidence": "3;4;3;3", "soundness": "3;2;3;3", "contribution": "3;3;2;3", "presentation": "2;2;3;3", "wc_summary": "89;14;67;53", "wc_strengths": "63;64;49;68", "wc_weaknesses": "230;608;35;46", "wc_questions": "57;1;23;31", "wc_review": "439;687;174;198", "wc_reply_reviewers": "224;91;17;6", "wc_reply_authors": "849;684;342;60", "reply_reviewers": "1;1;1;1", "reply_authors": "2;2;1;1", "rating_avg": [ 5.0, 2.1213203435596424 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 55.75, 27.307279249313726 ], "wc_strengths_avg": [ 61.0, 7.176350047203662 ], "wc_weaknesses_avg": [ 229.75, 231.71358937274266 ], "wc_questions_avg": [ 28.0, 20.024984394500787 ], "wc_review_avg": [ 374.5, 208.06789757192243 ], "wc_reply_reviewers_avg": [ 84.5, 86.92094109016537 ], "wc_reply_authors_avg": [ 483.75, 305.43606123049716 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.5443310539518174, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:JiKpLYVEx0oJ:scholar.google.com/&scioq=Optimized+Tradeoffs+for+Private+Majority+Ensembling&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;1", "aff_unique_norm": "Carnegie Mellon University;Google", 
"aff_unique_dep": ";Google", "aff_unique_url": "https://www.cmu.edu;https://www.google.com", "aff_unique_abbr": "CMU;Google", "aff_campus_unique_index": "1", "aff_campus_unique": ";Mountain View", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "id": "4qFIkOhq24", "title": "Fundamental Limitation of Alignment in Large Language Models", "track": "main", "status": "Reject", "tldr": "", "abstract": "An important aspect in developing language models that interact with humans is\naligning their behavior to be useful and unharmful for their human users. This is\nusually achieved by tuning the model in a way that enhances desired behaviors\nand inhibits undesired ones, a process referred to as alignment. In this paper, we\npropose a theoretical approach called Behavior Expectation Bounds (BEB) which\nallows us to formally investigate several inherent characteristics and limitations of\nalignment in large language models. Importantly, we prove that within the limits\nof this framework, for any behavior that has a finite probability of being exhibited\nby the model, there exist prompts that can trigger the model into outputting this\nbehavior, with probability that increases with the length of the prompt. This implies\nthat any alignment process that attenuates an undesired behavior but does not\nremove it altogether, is not safe against adversarial prompting attacks. Furthermore,\nour framework hints at the mechanism by which leading alignment approaches\nsuch as reinforcement learning from human feedback make the LLM prone to\nbeing prompted into the undesired behaviors. This theoretical result is being\nexperimentally demonstrated in large scale by the so called contemporary \u201cchatGPT\njailbreaks\", where adversarial users trick the LLM into breaking its alignment\nguardrails by triggering it into acting as a malicious persona. 
Our results expose\nfundamental limitations in alignment of LLMs and bring to the forefront the need\nto devise reliable mechanisms for ensuring AI safety.", "keywords": "Large language models;Alignment;Deep learning", "primary_area": "learning theory", "supplementary_material": "/attachment/a847fed0b934f5857cb4fdfe250696a0f7403216.zip", "author": "Yotam Wolf;Noam Wies;Oshri Avnery;Yoav Levine;Amnon Shashua", "authorids": "~Yotam_Wolf1;~Noam_Wies1;~Oshri_Avnery1;~Yoav_Levine1;~Amnon_Shashua1", "gender": "M;M;M;M;M", "homepage": ";;;;http://www.cs.huji.ac.il/~shashua/", "dblp": ";236/6106;;199/1895;47/1492", "google_scholar": "jlPKaIIAAAAJ;https://scholar.google.co.il/citations?user=FxlR8voAAAAJ;;;https://scholar.google.com.tw/citations?user=dwi5wvYAAAAJ", "orcid": ";0000-0002-1337-2298;;;", "linkedin": ";noam-wies-a5ab1663/;oshri-avnery/;;", "or_profile": "~Yotam_Wolf1;~Noam_Wies1;~Oshri_Avnery1;~Yoav_Levine1;~Amnon_Shashua1", "aff": "Hebrew University of Jerusalem;Hebrew University of Jerusalem;Hebrew University of Jerusalem;;Hebrew University, Hebrew University of Jerusalem", "aff_domain": "huji.ac.il;huji.ac.il;huji.ac.il;;cs.huji.ac.il", "position": "PhD student;PhD student;MS student;;Professor", "bibtex": "@misc{\nwolf2024fundamental,\ntitle={Fundamental Limitation of Alignment in Large Language Models},\nauthor={Yotam Wolf and Noam Wies and Oshri Avnery and Yoav Levine and Amnon Shashua},\nyear={2024},\nurl={https://openreview.net/forum?id=4qFIkOhq24}\n}", "github": "", "project": "", "reviewers": "Cy5r;edXZ;5KAT;e9bS", "site": "https://openreview.net/forum?id=4qFIkOhq24", "pdf_size": 1637993, "rating": "6;6;6;8", "confidence": "3;3;3;4", "soundness": "3;3;3;4", "contribution": "3;3;3;3", "presentation": "3;2;3;3", "wc_summary": "126;64;88;158", "wc_strengths": "59;69;89;124", "wc_weaknesses": "69;340;56;187", "wc_questions": "397;143;74;29", "wc_review": "651;616;307;498", "wc_reply_reviewers": "16;383;0;23", "wc_reply_authors": "754;1314;306;563", "reply_reviewers": "1;2;0;1", "reply_authors": "1;2;1;1", "rating_avg": [ 6.5, 0.8660254037844386 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 109.0, 35.90264614203248 ], "wc_strengths_avg": [ 85.25, 24.843258642939738 ], "wc_weaknesses_avg": [ 163.0, 114.22565386111826 ], "wc_questions_avg": [ 160.75, 142.31369400026128 ], "wc_review_avg": [ 518.0, 134.36331344530024 ], "wc_reply_reviewers_avg": [ 105.5, 160.43144953530776 ], "wc_reply_authors_avg": [ 734.25, 370.548495476638 ], "reply_reviewers_avg": [ 1.0, 0.7071067811865476 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 1.0, "gs_citation": 208, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10671962345198545886&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 8, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "Hebrew University of Jerusalem", "aff_unique_dep": "", "aff_unique_url": "https://www.huji.ac.il", "aff_unique_abbr": "HUJI", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Jerusalem;", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "Israel" }, { "title": "Learning Delays in Spiking Neural Networks using Dilated Convolutions with Learnable Spacings", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19447", "id": "4r2ybzJnmN", "author_site": "Ilyass Hammouamri, 
Ismail Khalfaoui Hassani, Timoth\u00e9e Masquelier", "tldr": "", "abstract": "Spiking Neural Networks (SNNs) are a promising research direction for building power-efficient information processing systems, especially for temporal tasks such as speech recognition. In SNNs, delays refer to the time needed for one spike to travel from one neuron to another. These delays matter because they influence the spike arrival times, and it is well-known that spiking neurons respond more strongly to coincident input spikes. More formally, it has been shown theoretically that plastic delays greatly increase the expressivity in SNNs. Yet, efficient algorithms to learn these delays have been lacking. Here, we propose a new discrete-time algorithm that addresses this issue in deep feedforward SNNs using backpropagation, in an offline manner. To simulate delays between consecutive layers, we use 1D convolutions across time. The kernels contain only a few non-zero weights \u2013 one per synapse \u2013 whose positions correspond to the delays. These positions are learned together with the weights using the recently proposed Dilated Convolution with Learnable Spacings (DCLS). We evaluated our method on three datasets: the Spiking Heidelberg Dataset (SHD), the Spiking Speech Commands (SSC) and its non spiking version Google Speech Commands v0.02 (GSC) benchmarks, which require detecting temporal patterns. We used feedforward SNNs with two or three hidden fully connected layers, and vanilla leaky integrate-and-fire neurons. We showed that fixed random delays help and that learning them helps even more. Furthermore, our method outperformed the state-of-the-art in the three datasets without using recurrent connections and with substantially fewer parameters. Our work demonstrates the potential of delay learning in developing accurate and precise models for temporal data processing. 
Our code is based on PyTorch / SpikingJelly and available at: https://github.com/Thvnvtos/SNN-delays", "keywords": "Spiking Neural Networks;Delays;Neuromorphic Computing;Speech Recognition", "primary_area": "applications to neuroscience & cognitive science", "supplementary_material": "", "author": "Ilyass Hammouamri;Ismail Khalfaoui-Hassani;Timoth\u00e9e Masquelier", "authorids": "~Ilyass_Hammouamri1;~Ismail_Khalfaoui-Hassani1;~Timoth\u00e9e_Masquelier1", "gender": "M;;M", "homepage": ";;https://ismakh.com", "dblp": ";07/7226;308/6076", "google_scholar": "https://scholar.google.com/citations?hl=en;fkzUZ-oAAAAJ;sFQlNhIAAAAJ", "orcid": ";0000-0001-8629-9506;0009-0007-8858-4037", "linkedin": "hammouamri-ilyass/;;ismail-khalfaoui-hassani/", "or_profile": "~Ilyass_Hammouamri1;~Timoth\u00e9e_Masquelier1;~Ismail_Khalfaoui_Hassani1", "aff": "Universit\u00e9 de Toulouse;CNRS;University of Toulouse", "aff_domain": "univ-toulouse.fr;cnrs.fr;univ-tlse3.fr", "position": "PhD student;Principal Researcher;PhD student", "bibtex": "@inproceedings{\nhammouamri2024learning,\ntitle={Learning Delays in Spiking Neural Networks using Dilated Convolutions with Learnable Spacings},\nauthor={Ilyass Hammouamri and Ismail Khalfaoui-Hassani and Timoth{\\'e}e Masquelier},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=4r2ybzJnmN}\n}", "github": "", "project": "", "reviewers": "7RCo;Wbur;ybas;sQsE", "pdf_size": 603710, "rating": "6;6;8;8", "confidence": "3;4;5;4", "soundness": "3;2;3;3", "contribution": "2;2;4;2", "presentation": "3;3;3;3", "wc_summary": "104;63;118;65", "wc_strengths": "56;51;64;51", "wc_weaknesses": "145;307;120;847", "wc_questions": "5;66;236;57", "wc_review": "310;487;538;1020", "wc_reply_reviewers": "0;68;0;498", "wc_reply_authors": "244;707;664;701", "reply_reviewers": "0;1;0;3", "reply_authors": "1;1;1;1", "rating_avg": [ 7.0, 1.0 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.8660254037844386 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 87.5, 24.026027553467927 ], "wc_strengths_avg": [ 55.5, 5.315072906367325 ], "wc_weaknesses_avg": [ 354.75, 293.1265724904516 ], "wc_questions_avg": [ 91.0, 86.89361311396829 ], "wc_review_avg": [ 588.75, 262.9670844421408 ], "wc_reply_reviewers_avg": [ 141.5, 207.6890704875921 ], "wc_reply_authors_avg": [ 579.0, 194.1120810253705 ], "reply_reviewers_avg": [ 1.0, 1.224744871391589 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.7071067811865475, "gs_citation": 59, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=18230794924674691098&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=4r2ybzJnmN", "pdf": "https://openreview.net/pdf?id=4r2ybzJnmN", "email": "univ-toulouse.fr;cnrs.fr;univ-tlse3.fr", "author_num": 3, "aff_unique_index": "0;1;2", "aff_unique_norm": "Universit\u00e9 de Toulouse;Centre National de la Recherche Scientifique;University of Toulouse", "aff_unique_dep": ";;", "aff_unique_url": "https://www.univ-toulouse.fr;https://www.cnrs.fr;https://www.univ-toulouse.fr", "aff_unique_abbr": "UT;CNRS;UT", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "France" }, { "title": "Learning 3D Particle-based Simulators from RGB-D Videos", "status": "Poster", "track": "main", "site": 
"https://iclr.cc/virtual/2024/poster/19446", "id": "4rBEgZCubP", "author_site": "William Whitney, Tatiana Lopez-Guevara, Tobias Pfaff, Yulia Rubanova, Thomas Kipf, Kimberly Stachenfeld, Kelsey Allen", "tldr": "", "abstract": "Realistic simulation is critical for applications ranging from robotics to animation. Traditional analytic simulators sometimes struggle to capture sufficiently realistic simulation which can lead to problems including the well known \"sim-to-real\" gap in robotics. Learned simulators have emerged as an alternative for better capturing real-world physical dynamics, but require access to privileged ground truth physics information such as precise object geometry or particle tracks. Here we propose a method for learning simulators directly from observations. Visual Particle Dynamics (VPD) jointly learns a latent particle-based representation of 3D scenes, a neural simulator of the latent particle dynamics, and a renderer that can produce images of the scene from arbitrary views. VPD learns end to end from posed RGB-D videos and does not require access to privileged information. Unlike existing 2D video prediction models, we show that VPD's 3D structure enables scene editing and long-term predictions. These results pave the way for downstream applications ranging from video editing to robotic planning.", "keywords": "simulation;dynamics;nerf;particle dynamics", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "William F Whitney;Tatiana Lopez-Guevara;Tobias Pfaff;Yulia Rubanova;Thomas Kipf;Kim Stachenfeld;Kelsey R Allen", "authorids": "~William_F_Whitney1;~Tatiana_Lopez-Guevara1;~Tobias_Pfaff1;~Yulia_Rubanova2;~Thomas_Kipf2;~Kim_Stachenfeld1;~Kelsey_R_Allen1", "gender": ";F;M;F;F;M;F", "homepage": "http://willwhitney.com;;http://tobiaspfaff.com;https://neurokim.com/;;http://tkipf.github.io/;https://yuliarubanova.github.io/", "dblp": "160/8671;208/0996;67/7591;155/1888;153/9528;186/8206;222/3085", "google_scholar": "aQcYWDMAAAAJ;Op4nexcAAAAJ;3oUgDKQAAAAJ;jNtH2WUAAAAJ;kpcjFekAAAAJ;83HL5FwAAAAJ;u_HzE9wAAAAJ", "orcid": ";;;;;;", "linkedin": ";;;;;thomas-kipf-6b260410a;https://linkedin.com/in/yulia-rubanova-031702100", "or_profile": "~William_F_Whitney1;~Tatiana_Lopez-Guevara1;~Tobias_Pfaff1;~Kim_Stachenfeld1;~Kelsey_R_Allen1;~Thomas_N._Kipf1;~Yulia_Rubanova1", "aff": "Google DeepMind;Google;Deepmind;Google DeepMind;Google;Google;Google DeepMind", "aff_domain": "deepmind.com;google.com;google.com;deepmind.com;deepmind.com;google.com;deepmind.com", "position": "Researcher;Researcher;Research scientist;Research Scientist;Research Scientist;Research Scientist;Research Scientist", "bibtex": "@inproceedings{\nwhitney2024learning,\ntitle={Learning 3D Particle-based Simulators from {RGB}-D Videos},\nauthor={William F Whitney and Tatiana Lopez-Guevara and Tobias Pfaff and Yulia Rubanova and Thomas Kipf and Kim Stachenfeld and Kelsey R Allen},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=4rBEgZCubP}\n}", "github": "", "project": "", "reviewers": "HnBD;CLWA;cZVt;8vFC", "pdf_size": 11133369, "rating": "6;6;6;8", "confidence": "4;3;3;3", "soundness": "3;3;3;3", "contribution": "3;3;2;3", "presentation": "3;2;3;3", "wc_summary": "71;73;138;44", "wc_strengths": "29;46;98;57", "wc_weaknesses": "83;373;121;32", "wc_questions": "12;1;132;161", "wc_review": "195;493;489;294", "wc_reply_reviewers": "0;0;0;0", 
"wc_reply_authors": "444;1041;1004;420", "reply_reviewers": "0;0;0;0", "reply_authors": "1;2;2;1", "rating_avg": [ 6.5, 0.8660254037844386 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 81.5, 34.57238782612506 ], "wc_strengths_avg": [ 57.5, 25.42144763777232 ], "wc_weaknesses_avg": [ 152.25, 131.3037984979871 ], "wc_questions_avg": [ 76.5, 70.85372255569922 ], "wc_review_avg": [ 367.75, 128.13152422413464 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 727.25, 295.6614406715898 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.3333333333333333, "gs_citation": 10, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=1085887278127634261&as_sdt=80000005&sciodt=0,23&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=4rBEgZCubP", "pdf": "https://openreview.net/pdf?id=4rBEgZCubP", "email": "deepmind.com;google.com;google.com;deepmind.com;deepmind.com;google.com;deepmind.com", "author_num": 7, "aff_unique_index": "0;0;1;0;0;0;0", "aff_unique_norm": "Google;DeepMind", "aff_unique_dep": "Google DeepMind;", "aff_unique_url": "https://deepmind.com;https://deepmind.com", "aff_unique_abbr": "DeepMind;DeepMind", "aff_campus_unique_index": "1;1;1", "aff_campus_unique": ";Mountain View", "aff_country_unique_index": "0;1;0;0;1;1;0", "aff_country_unique": "United Kingdom;United States" }, { "id": "4rCDEEnTvX", "title": "From Language Modeling to Instruction Following: Understanding the Behavior Shift in LLMs after Instruction Tuning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Large Language Models (LLMs) have achieved remarkable success, demonstrating powerful instruction-following capabilities across diverse tasks. Instruction fine-tuning is critical in enabling LLMs to align with user intentions and effectively follow instructions. In this work, we investigate how the instruction fine-tuning modifies pre-trained models, focusing on two perspectives: instruction recognition and knowledge evolution. To study the behavior shift of LLMs, we employ a suite of local and global explanation methods, including a gradient-based approach for input-output attribution and techniques for interpreting patterns and concepts in self-attention and feed-forward layers. Our findings reveal three significant impacts of instruction fine-tuning: 1) It empowers LLMs to better recognize the instruction parts from user prompts, thereby facilitating high-quality response generation and addressing the ``lost-in-the-middle'' issue observed in pre-trained models; 2) It aligns the knowledge stored in feed-forward layers with user-oriented tasks, exhibiting minimal shifts across linguistic levels. 3) It facilitates the learning of word-word relations with instruction verbs through the self-attention mechanism, particularly in the lower and middle layers, indicating enhanced recognition of instruction words. 
These insights contribute to a deeper understanding of the behavior shifts in LLMs after instruction fine-tuning and lay the groundwork for future research aimed at interpreting and optimizing LLMs for various applications.", "keywords": "Large Language Model;Instruction Tuning;Interpretation;Instruction Following;Supervised Fine-tuning", "primary_area": "visualization or interpretation of learned representations", "supplementary_material": "", "author": "Xuansheng Wu;Wenlin Yao;Jianshu Chen;Xiaoman Pan;Xiaoyang Wang;Ninghao Liu;Dong Yu", "authorids": "~Xuansheng_Wu1;~Wenlin_Yao1;~Jianshu_Chen1;~Xiaoman_Pan2;~Xiaoyang_Wang1;~Ninghao_Liu2;~Dong_Yu2", "gender": ";M;M;M;M;M;M", "homepage": "https://github.com/JacksonWuxs;https://wenlinyao.github.io/;https://chenjianshu.github.io/;https://sites.google.com/view/dongyu888/;https://cobweb.cs.uga.edu/~ninghaoliu/;https://panx27.github.io/homepage/;https://xyang0.github.io/", "dblp": "304/1261;203/8711;11/3124;71/4598-1;145/4489;148/9210;81/1832-1", "google_scholar": "https://scholar.google.com/citations?hl=en;qwo2A24AAAAJ;jQeFWdoAAAAJ;tMY31_gAAAAJ;Nir-EDYAAAAJ;tRPF03IAAAAJ;EeppWmkAAAAJ", "orcid": "0000-0002-7816-7658;;;0000-0003-0520-6844;0000-0002-9170-2424;;0000-0002-0746-1059", "linkedin": ";;;dongyu/;;;xiaoyang-wang-001", "or_profile": "~Xuansheng_Wu1;~Wenlin_Yao1;~Jianshu_Chen1;~Dong_Yu2;~Ninghao_Liu1;~Xiaoman_Pan1;~Xiaoyang_Wang2", "aff": "University of Georgia;Tencent AI Lab;Amazon;Tencent AI Lab;University of Georgia;Tencent AI Lab;Tencent AI Lab", "aff_domain": "uga.edu;tencent.com;amazon.com;tencent.com;uga.edu;tencent.com;tencent.com", "position": "PhD student;Researcher;Principal Scientist;Distinguished Scientist;Assistant Professor;Researcher;Senior Researcher", "bibtex": "@misc{\nwu2024from,\ntitle={From Language Modeling to Instruction Following: Understanding the Behavior Shift in {LLM}s after Instruction Tuning},\nauthor={Xuansheng Wu and Wenlin Yao and Jianshu Chen and Xiaoman Pan and Xiaoyang Wang and Ninghao Liu and Dong Yu},\nyear={2024},\nurl={https://openreview.net/forum?id=4rCDEEnTvX}\n}", "github": "", "project": "", "reviewers": "e43k;zeP7;QqaN", "site": "https://openreview.net/forum?id=4rCDEEnTvX", "pdf_size": 13402389, "rating": "3;5;6", "confidence": "4;4;3", "soundness": "2;2;2", "contribution": "2;3;2", "presentation": "2;1;2", "wc_summary": "124;133;82", "wc_strengths": "980;71;56", "wc_weaknesses": "2;647;131", "wc_questions": "2;94;236", "wc_review": "1108;945;505", "wc_reply_reviewers": "178;306;0", "wc_reply_authors": "1722;1714;452", "reply_reviewers": "2;2;0", "reply_authors": "5;3;1", "rating_avg": [ 4.666666666666667, 1.247219128924647 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 1.6666666666666667, 0.4714045207910317 ], "wc_summary_avg": [ 113.0, 22.22611077089287 ], "wc_strengths_avg": [ 369.0, 432.0856396595471 ], "wc_weaknesses_avg": [ 260.0, 278.671850031538 ], "wc_questions_avg": [ 110.66666666666667, 96.25429283356088 ], "wc_review_avg": [ 852.6666666666666, 254.68455434561048 ], "wc_reply_reviewers_avg": [ 161.33333333333334, 125.47863917372108 ], "wc_reply_authors_avg": [ 1296.0, 596.8070598331312 ], "reply_reviewers_avg": [ 1.3333333333333333, 0.9428090415820634 ], "reply_authors_avg": [ 3.0, 1.632993161855452 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.7559289460184545, "gs_citation": 29, "gs_cited_by_link": 
"https://scholar.google.com/scholar?cites=1012915126425971164&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 6, "aff_unique_index": "0;1;2;1;0;1;1", "aff_unique_norm": "University of Georgia;Tencent;Amazon", "aff_unique_dep": ";Tencent AI Lab;Amazon.com, Inc.", "aff_unique_url": "https://www.uga.edu;https://ai.tencent.com;https://www.amazon.com", "aff_unique_abbr": "UGA;Tencent AI Lab;Amazon", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;0;1;0;1;1", "aff_country_unique": "United States;China" }, { "id": "4sGoA7Eih8", "title": "Unmasking Transformers: A Theoretical Approach to Data Recovery via Attention Weights", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "In the realm of deep learning, transformers have emerged as a dominant architecture, particularly in natural language processing tasks. However, with their widespread adoption, concerns regarding the security and privacy of the data processed by these models have arisen. In this paper, we address a pivotal question: Can the data fed into transformers be recovered using their attention weights and outputs? We introduce a theoretical framework to tackle this problem. Specifically, we present an algorithm that aims to recover the input data $X \\in \\mathbb{R}^{d \\times n}$ from given attention weights $W = QK^\\top \\in \\mathbb{R}^{d \\times d}$ and output $B \\in \\mathbb{R}^{n \\times n}$ by minimizing the loss function $L(X)$. This loss function captures the discrepancy between the expected output and the actual output of the transformer. Our findings have significant implications for the Localized Layer-wise Mechanism (LLM), suggesting potential vulnerabilities in the model's design from a security and privacy perspective. This work underscores the importance of understanding and safeguarding the internal workings of transformers to ensure the confidentiality of processed data.", "keywords": "Attention;inversion", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/176cb0bc7f4e0761deab33bd6b6ada6eef2bf3ad.pdf", "author": "Yichuan Deng;Zhao Song;Shenghao Xie;Chiwun Yang", "authorids": "~Yichuan_Deng1;~Zhao_Song3;~Shenghao_Xie2;~Chiwun_Yang1", "gender": "M;M;M;M", "homepage": "https://homes.cs.washington.edu/~ycdeng/;https://www.youtube.com/@zhaosong2031;https://sites.google.com/view/shenghaoxie/;https://christianyang37.github.io/", "dblp": "183/7224-2;76/4051-2;;355/2807", "google_scholar": "https://scholar.google.com/citations?hl=en;yDZct7UAAAAJ;JKjz5D8AAAAJ;https://scholar.google.com/citations?hl=en", "orcid": ";;;", "linkedin": ";;;", "or_profile": "~Yichuan_Deng1;~Zhao_Song3;~Shenghao_Xie2;~Chiwun_Yang1", "aff": "Department of Computer Science, University of Washington;Adobe;The Chinese University of Hong Kong, Shenzhen;SUN YAT-SEN UNIVERSITY", "aff_domain": "cs.washington.edu;adobe.com;cuhk.edu.cn;sysu.edu.cn", "position": "PhD student;Researcher;Undergrad student;Undergrad student", "bibtex": "@misc{\ndeng2024unmasking,\ntitle={Unmasking Transformers: A Theoretical Approach to Data Recovery via Attention Weights},\nauthor={Yichuan Deng and Zhao Song and Shenghao Xie and Chiwun Yang},\nyear={2024},\nurl={https://openreview.net/forum?id=4sGoA7Eih8}\n}", "github": "", "project": "", "reviewers": "vHCT;wffn;K9uu;SERj", "site": "https://openreview.net/forum?id=4sGoA7Eih8", "pdf_size": 374694, "rating": "1;3;3;5", "confidence": "1;4;4;4", "soundness": "1;3;2;3", 
"contribution": "1;3;2;3", "presentation": "1;3;2;3", "wc_summary": "17;83;51;48", "wc_strengths": "13;69;15;11", "wc_weaknesses": "35;102;115;82", "wc_questions": "9;4;4;6", "wc_review": "74;258;185;147", "wc_reply_reviewers": "0;57;201;0", "wc_reply_authors": "14;155;243;187", "reply_reviewers": "0;1;1;0", "reply_authors": "1;1;1;1", "rating_avg": [ 3.0, 1.4142135623730951 ], "confidence_avg": [ 3.25, 1.299038105676658 ], "soundness_avg": [ 2.25, 0.82915619758885 ], "contribution_avg": [ 2.25, 0.82915619758885 ], "presentation_avg": [ 2.25, 0.82915619758885 ], "wc_summary_avg": [ 49.75, 23.35995505132662 ], "wc_strengths_avg": [ 27.0, 24.289915602982237 ], "wc_weaknesses_avg": [ 83.5, 30.36856927812043 ], "wc_questions_avg": [ 5.75, 2.0463381929681126 ], "wc_review_avg": [ 166.0, 66.42665127793211 ], "wc_reply_reviewers_avg": [ 64.5, 82.17207554881402 ], "wc_reply_authors_avg": [ 149.75, 84.4670793859951 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 10, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.8164965809277259, "gs_citation": 14, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=17752848074473007675&as_sdt=400005&sciodt=0,14&hl=en", "gs_version_total": 3, "aff_unique_index": "0;1;2;3", "aff_unique_norm": "University of Washington;Adobe;Chinese University of Hong Kong;Sun Yat-sen University", "aff_unique_dep": "Department of Computer Science;Adobe Inc.;;", "aff_unique_url": "https://www.washington.edu;https://www.adobe.com;https://www.cuhk.edu.cn;http://www.sysu.edu.cn", "aff_unique_abbr": "UW;Adobe;CUHK;SYSU", "aff_campus_unique_index": "0;2", "aff_campus_unique": "Seattle;;Shenzhen", "aff_country_unique_index": "0;0;1;1", "aff_country_unique": "United States;China" }, { "id": "4stB7DFLp6", "title": "InstructRetro: Instruction Tuning post Retrieval-Augmented Pretraining", "track": "main", "status": "Reject", "tldr": "", "abstract": "Pretraining auto-regressive large language models (LLMs) with retrieval demonstrates better perplexity and factual accuracy by leveraging external databases. However, the size of existing pretrained retrieval-augmented LLM is still limited (e.g., Retro has 7.5B parameters), which limits the effectiveness of instruction tuning and zero-shot generalization. In this work, we introduce Retro 48B, the largest LLM pretrained with retrieval before instruction tuning. Specifically, we continue to pretrain the 43B GPT model on additional 100 billion tokens using the Retro augmentation method by retrieving from 1.2 trillion tokens. The obtained foundation model, Retro 48B, largely outperforms the original 43B GPT in terms of perplexity. After instruction tuning on Retro, InstructRetro demonstrates significant improvement over the instruction tuned GPT on zero-shot question answering (QA) tasks. Specifically, the average improvement of InstructRetro is 7% over its GPT counterpart across 8 short-form QA tasks, and 10% over GPT across 4 challenging long-form QA tasks. Surprisingly, we find that one can ablate the encoder from InstructRetro architecture and directly use its decoder backbone, while achieving comparable results. We hypothesize that pretraining with retrieval makes its decoder good at incorporating context for QA. 
Our results highlight the promising direction to obtain a better GPT decoder for QA through continued pretraining with retrieval before instruction tuning.", "keywords": "Large Language Models;Pretraining;Retrieval;Instruction Tuning", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Boxin Wang;Wei Ping;Lawrence McAfee;Peng Xu;Bo Li;Mohammad Shoeybi;Bryan Catanzaro", "authorids": "~Boxin_Wang1;~Wei_Ping1;~Lawrence_McAfee1;~Peng_Xu7;~Bo_Li19;~Mohammad_Shoeybi1;~Bryan_Catanzaro1", "gender": ";M;M;M;F;M;M", "homepage": "https://wbx.life;https://wpingnet.github.io/;https://nvidia.com;https://scholar.google.com.hk/citations?user=PQ26NTIAAAAJ&hl=en;http://boli.cs.illinois.edu/;;https://ctnzr.io", "dblp": "236/6319;08/8399.html;;84/586-8;50/3402-26;53/9742;14/4826", "google_scholar": "YOf2ATIAAAAJ;6gKEYRgAAAAJ;;https://scholar.google.com.hk/citations?user=PQ26NTIAAAAJ;K8vJkTcAAAAJ;62ElavIAAAAJ;UZ6kI2AAAAAJ", "orcid": ";;;;;;0000-0003-0034-7728", "linkedin": ";wei-ping/;;;;shoeybi/;bryancatanzaro/", "or_profile": "~Boxin_Wang1;~Wei_Ping1;~Lawrence_McAfee1;~Peng_Xu7;~Bo_Li19;~Mohammad_Shoeybi1;~Bryan_Catanzaro1", "aff": "NVIDIA;NVIDIA;NVIDIA;NVIDIA;University of Illinois, Urbana Champaign;NVIDIA;NVIDIA", "aff_domain": "nvidia.com;nvidia.com;nvidia.com;nvidia.com;illinois.edu;nvidia.com;nvidia.com", "position": "Senior Research Scientist;Principal Researcher;Researcher;Researcher;Assistant Professor;Director of Applied Resesrch;Vice President", "bibtex": "@misc{\nwang2024instructretro,\ntitle={InstructRetro: Instruction Tuning post Retrieval-Augmented Pretraining},\nauthor={Boxin Wang and Wei Ping and Lawrence McAfee and Peng Xu and Bo Li and Mohammad Shoeybi and Bryan Catanzaro},\nyear={2024},\nurl={https://openreview.net/forum?id=4stB7DFLp6}\n}", "github": "", "project": "", "reviewers": "p68m;A1jh;gdXh", "site": "https://openreview.net/forum?id=4stB7DFLp6", "pdf_size": 765842, "rating": "5;6;8", "confidence": "3;3;4", "soundness": "3;3;3", "contribution": "3;3;3", "presentation": "3;3;2", "wc_summary": "97;61;563", "wc_strengths": "14;79;45", "wc_weaknesses": "61;35;659", "wc_questions": "1;39;58", "wc_review": "173;214;1325", "wc_reply_reviewers": "0;0;48", "wc_reply_authors": "604;1187;2791", "reply_reviewers": "0;0;1", "reply_authors": "1;2;5", "rating_avg": [ 6.333333333333333, 1.247219128924647 ], "confidence_avg": [ 3.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 240.33333333333334, 228.63265053112795 ], "wc_strengths_avg": [ 46.0, 26.54555832275273 ], "wc_weaknesses_avg": [ 251.66666666666666, 288.2236785708088 ], "wc_questions_avg": [ 32.666666666666664, 23.697163449568293 ], "wc_review_avg": [ 570.6666666666666, 533.6567769227293 ], "wc_reply_reviewers_avg": [ 16.0, 22.627416997969522 ], "wc_reply_authors_avg": [ 1527.3333333333333, 924.7025948319216 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 2.6666666666666665, 1.699673171197595 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": 0.944911182523068, "gs_citation": 49, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=18383393396082703199&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 8, "aff_unique_index": "0;0;0;0;1;0;0", "aff_unique_norm": "NVIDIA;University of Illinois Urbana-Champaign", "aff_unique_dep": 
"NVIDIA Corporation;", "aff_unique_url": "https://www.nvidia.com;https://illinois.edu", "aff_unique_abbr": "NVIDIA;UIUC", "aff_campus_unique_index": "1", "aff_campus_unique": ";Urbana-Champaign", "aff_country_unique_index": "0;0;0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "4u0ruVk749", "title": "DFITE: Estimation of Individual Treatment Effect Using Diffusion Model", "track": "main", "status": "Reject", "tldr": "", "abstract": "Learning individualized treatment effects (ITE) from observational data is a challenging task due to the absence of unobserved confounders. Previous methods mostly focus on assuming the Ignorability assumption, ignoring the unobserved confounders or overlooking the impact of a priori knowledge on the generation process of the latent variable, which can be quite impractical in real-world scenarios. Motivated by the recent advances in latent variable modeling, we propose to capture the unobserved latent space using a diffusion model, and accordingly to estimate the causal effect. More concretely, we build on the reverse diffusion process for the unobserved confounders as a Markov chain conditioned on a priori knowledge. In order to implement our model in a feasible way, we derive the variational bound in closed form. In the experiments, we compare our model with the state-of-the-art methods based on both synthetic and benchmark datasets, where we can empirically demonstrate consistent improvements of our model on $\\sqrt{\\epsilon_{PEHE}}$ and $\\epsilon_{ATE}$, respectively.", "keywords": "Individual Treatment Effect;Causal inference;diffusion model", "primary_area": "causal reasoning", "supplementary_material": "", "author": "Zhenlei Wang;Xu Chen;Xiaoxiao Xu;Lantao Hu;Peng Jiang;Kun Gai", "authorids": "~Zhenlei_Wang1;~Xu_Chen13;~Xiaoxiao_Xu2;~Lantao_Hu1;~Peng_Jiang6;~Kun_Gai1", "gender": "M;M;F;M;M;M", "homepage": "https://causal-rec.github.io/;https://gsai.ruc.edu.cn/chenxu;https://scholar.google.com/citations?hl=zh-CN&user=1I2OrQEAAAAJ&view_op=list_works&sortby=pubdate;;;", "dblp": "223/8301;83/6331-17;116/1526;;;59/2902", "google_scholar": "7x0kGsUAAAAJ;loPoqy0AAAAJ;https://scholar.google.com/citations?hl=zh-CN;P0EK1y8AAAAJ;https://scholar.google.com/citations?hl=en;PXO4ygEAAAAJ", "orcid": ";0000-0003-0144-1775;0009-0007-5493-5628;;0000-0002-9266-0780;", "linkedin": ";;;;;", "or_profile": "~Zhenlei_Wang1;~Xu_Chen13;~Xiaoxiao_Xu2;~Lantao_Hu1;~Peng_Jiang6;~Kun_Gai1", "aff": "Renmin University of China;Renmin University of China;Kuaishou Technology;;Kuaishou Technology;Kuaishou- \u5feb\u624b\u79d1\u6280", "aff_domain": "ruc.edu.cn;ruc.edu.cn;kuaishou.com;;kuaishou.com;kuaishou.com", "position": "PhD student;Associate Professor;Engineer;;Vice President;Instructor", "bibtex": "@misc{\nwang2024dfite,\ntitle={{DFITE}: Estimation of Individual Treatment Effect Using Diffusion Model},\nauthor={Zhenlei Wang and Xu Chen and Xiaoxiao Xu and Lantao Hu and Peng Jiang and Kun Gai},\nyear={2024},\nurl={https://openreview.net/forum?id=4u0ruVk749}\n}", "github": "", "project": "", "reviewers": "UsZZ;otL9;RF2t;Jxsb;1VfB", "site": "https://openreview.net/forum?id=4u0ruVk749", "pdf_size": 1723154, "rating": "1;3;3;3;5", "confidence": "4;3;4;4;3", "soundness": "2;2;2;1;3", "contribution": "1;2;2;2;2", "presentation": "1;2;2;3;2", "wc_summary": "39;73;67;96;55", "wc_strengths": "10;81;18;68;39", "wc_weaknesses": "247;271;18;285;151", "wc_questions": "144;184;102;79;384", "wc_review": "440;609;205;528;629", "wc_reply_reviewers": "0;0;0;0;0", "wc_reply_authors": 
"0;0;0;0;0", "reply_reviewers": "0;0;0;0;0", "reply_authors": "0;0;0;0;0", "rating_avg": [ 3.0, 1.2649110640673518 ], "confidence_avg": [ 3.6, 0.4898979485566356 ], "soundness_avg": [ 2.0, 0.6324555320336759 ], "contribution_avg": [ 1.8, 0.4000000000000001 ], "presentation_avg": [ 2.0, 0.6324555320336759 ], "wc_summary_avg": [ 66.0, 18.973665961010276 ], "wc_strengths_avg": [ 43.2, 27.56374430297887 ], "wc_weaknesses_avg": [ 194.4, 99.84307687566525 ], "wc_questions_avg": [ 178.6, 108.81470488863167 ], "wc_review_avg": [ 482.2, 153.84849690523467 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 7, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.6454972243679028, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:UYZWJsefyc8J:scholar.google.com/&scioq=DFITE:+Estimation+of+Individual+Treatment+Effect+Using+Diffusion+Model&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;1;1;1", "aff_unique_norm": "Renmin University of China;Kuaishou Technology", "aff_unique_dep": ";", "aff_unique_url": "http://www.ruc.edu.cn;https://www.kuaishou.com", "aff_unique_abbr": "RUC;Kuaishou", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "China" }, { "id": "4uaogMQgNL", "title": "UpFusion: Novel View Diffusion from Unposed Sparse View Observations", "track": "main", "status": "Reject", "tldr": "", "abstract": "We propose UpFusion, a system that can perform novel view synthesis and infer 3D representations for an object given a sparse set of reference images without corresponding pose information. Current sparse-view 3D inference methods typically rely on camera poses to geometrically aggregate information from input views, but are not robust in-the-wild when such information is unavailable/inaccurate. In contrast, UpFusion sidesteps this requirement by learning to implicitly leverage the available images as context in a conditional generative model for synthesizing novel views. We incorporate two complementary forms of conditioning into diffusion models for leveraging the input views: a) via inferring query-view aligned features using a scene-level transformer, b) via intermediate attentional layers that can directly observe the input image tokens. We show that this mechanism allows generating high-fidelity novel views while improving the synthesis quality given additional (unposed) images. 
We evaluate our approach on the Co3D dataset and demonstrate the benefits of our method over pose-reliant alternatives. Finally, we also show that our learned model can generalize beyond the training categories, and hope that this provides a stepping stone to reconstructing generic objects from in-the-wild image collections.", "keywords": "Novel View Synthesis;Diffusion;3D;Generative Models;Transformers", "primary_area": "generative models", "supplementary_material": "", "author": "Bharath Raj Nagoor Kani;Hsin-Ying Lee;Sergey Tulyakov;Shubham Tulsiani", "authorids": "~Bharath_Raj_Nagoor_Kani1;~Hsin-Ying_Lee2;~Sergey_Tulyakov1;~Shubham_Tulsiani1", "gender": "M;M;M;M", "homepage": "https://thatbrguy.github.io;http://hsinyinglee.com/;http://www.stulyakov.com/;https://shubhtuls.github.io/", "dblp": "364/1857;149/7976-1.html;40/6115;135/6623", "google_scholar": "DcZsAGEAAAAJ;;mgzXR0sAAAAJ;06rffEkAAAAJ", "orcid": ";;;", "linkedin": ";;sergeytulyakov/;", "or_profile": "~Bharath_Raj_Nagoor_Kani1;~Hsin-Ying_Lee2;~Sergey_Tulyakov1;~Shubham_Tulsiani1", "aff": "Carnegie Mellon University;Snap Inc.;Snap Inc.;Carnegie Mellon University", "aff_domain": "cmu.edu;snap.com;snapchat.com;cmu.edu", "position": "MS student;Researcher;Director of Research;Assistant Professor", "bibtex": "@misc{\nkani2024upfusion,\ntitle={UpFusion: Novel View Diffusion from Unposed Sparse View Observations},\nauthor={Bharath Raj Nagoor Kani and Hsin-Ying Lee and Sergey Tulyakov and Shubham Tulsiani},\nyear={2024},\nurl={https://openreview.net/forum?id=4uaogMQgNL}\n}", "github": "", "project": "", "reviewers": "rcbB;yMjS;Egt9;UGEs", "site": "https://openreview.net/forum?id=4uaogMQgNL", "pdf_size": 17124243, "rating": "5;5;5;6", "confidence": "5;4;5;4", "soundness": "2;3;2;2", "contribution": "2;2;2;2", "presentation": "3;2;3;2", "wc_summary": "51;71;83;29", "wc_strengths": "110;41;92;17", "wc_weaknesses": "285;220;271;127", "wc_questions": "7;117;97;5", "wc_review": "453;449;543;178", "wc_reply_reviewers": "87;0;0;0", "wc_reply_authors": "300;485;554;91", "reply_reviewers": "1;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 5.25, 0.4330127018922193 ], "confidence_avg": [ 4.5, 0.5 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 58.5, 20.512191496766015 ], "wc_strengths_avg": [ 65.0, 37.52998800959041 ], "wc_weaknesses_avg": [ 225.75, 61.93292742959919 ], "wc_questions_avg": [ 56.5, 50.997548960709864 ], "wc_review_avg": [ 405.75, 136.75776943194123 ], "wc_reply_reviewers_avg": [ 21.75, 37.67210506462308 ], "wc_reply_authors_avg": [ 357.5, 179.71992098818652 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 6, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11188550895155497640&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 6, "aff_unique_index": "0;1;1;0", "aff_unique_norm": "Carnegie Mellon University;Snap Inc.", "aff_unique_dep": ";", "aff_unique_url": "https://www.cmu.edu;https://www.snapinc.com", "aff_unique_abbr": "CMU;Snap", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "title": "PAC Prediction Sets Under Label Shift", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19445", "id": "4vPVBh3fhz", "author_site": "Wenwen Si, Sangdon Park, Insup 
Lee, Edgar Dobriban, Osbert Bastani", "tldr": "", "abstract": "Prediction sets capture uncertainty by predicting sets of labels rather than individual labels, enabling downstream decisions to conservatively account for all plausible outcomes. Conformal inference algorithms construct prediction sets guaranteed to contain the true label with high probability. These guarantees fail to hold in the face of distribution shift, which is precisely when reliable uncertainty quantification can be most useful. We propose a novel algorithm for constructing prediction sets with PAC guarantees in the label shift setting, where the probabilities of labels can differ between the source and target distributions. Our algorithm relies on constructing confidence intervals for importance weights by propagating uncertainty through a Gaussian elimination algorithm. We evaluate our approach on four datasets: the CIFAR-10 and ChestX-Ray image datasets, the tabular CDC Heart Dataset, and the AGNews text dataset. Our algorithm satisfies the PAC guarantee while producing smaller prediction set sizes compared to several baselines.", "keywords": "prediction set;label shift;distribution-free uncertainty quantification;probably approximately correct;Clopper-Pearson binomial interval;rejection sampling", "primary_area": "probabilistic methods (Bayesian methods, variational inference, sampling, UQ, etc.)", "supplementary_material": "", "author": "Wenwen Si;Sangdon Park;Insup Lee;Edgar Dobriban;Osbert Bastani", "authorids": "~Wenwen_Si1;~Sangdon_Park1;~Insup_Lee1;~Edgar_Dobriban2;~Osbert_Bastani1", "gender": "F;M;;;M", "homepage": ";https://sangdon.github.io/;https://www.cis.upenn.edu/~lee/;https://statistics.wharton.upenn.edu/profile/dobriban/;http://obastani.github.io", "dblp": "226/6274;119/1530-1;l/InsupLee.html;99/11269;21/11275", "google_scholar": "IFgBKbIAAAAJ;Vi2E2F4AAAAJ;qPlUgrgAAAAJ;aGvH4yMAAAAJ;cxYepGkAAAAJ", "orcid": ";;0000-0003-2672-1132;;", "linkedin": ";;;edgar-dobriban/;", "or_profile": "~Wenwen_Si1;~Sangdon_Park1;~Insup_Lee1;~Edgar_Dobriban2;~Osbert_Bastani1", "aff": "University of Pennsylvania;POSTECH;University of Pennsylvania;The Wharton School, University of Pennsylvania;University of Pennsylvania", "aff_domain": "upenn.edu;postech.ac.kr;upenn.edu;wharton.upenn.edu;upenn.edu", "position": "PhD student;Assistant Professor;Full Professor;Associate Professor;Assistant Professor", "bibtex": "@inproceedings{\nsi2024pac,\ntitle={{PAC} Prediction Sets Under Label Shift},\nauthor={Wenwen Si and Sangdon Park and Insup Lee and Edgar Dobriban and Osbert Bastani},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=4vPVBh3fhz}\n}", "github": "", "project": "", "reviewers": "2Pyj;onAF;mNQN;y3Aa;tiZb", "pdf_size": 1381636, "rating": "6;6;6;6;8", "confidence": "3;3;3;3;4", "soundness": "3;3;3;2;3", "contribution": "3;2;2;2;3", "presentation": "3;3;3;3;3", "wc_summary": "76;67;84;33;86", "wc_strengths": "48;8;58;27;107", "wc_weaknesses": "62;2;150;59;75", "wc_questions": "223;56;174;20;55", "wc_review": "409;133;466;139;323", "wc_reply_reviewers": "15;279;79;14;10", "wc_reply_authors": "888;516;954;192;508", "reply_reviewers": "1;3;1;1;1", "reply_authors": "2;3;2;1;1", "rating_avg": [ 6.4, 0.7999999999999999 ], "confidence_avg": [ 3.2, 0.39999999999999997 ], "soundness_avg": [ 2.8, 0.39999999999999997 ], "contribution_avg": [ 2.4, 0.4898979485566356 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 69.2, 19.30181338631166 ], 
"wc_strengths_avg": [ 49.6, 33.493880038000974 ], "wc_weaknesses_avg": [ 69.6, 47.39873416031276 ], "wc_questions_avg": [ 105.6, 78.49738849159252 ], "wc_review_avg": [ 294.0, 136.8181274539306 ], "wc_reply_reviewers_avg": [ 79.4, 103.03513963692194 ], "wc_reply_authors_avg": [ 611.6, 279.1312236207193 ], "reply_reviewers_avg": [ 1.4, 0.8000000000000002 ], "reply_authors_avg": [ 1.8, 0.7483314773547883 ], "replies_avg": [ 24, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 1.0, "gs_citation": 12, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11840371556296107071&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=4vPVBh3fhz", "pdf": "https://openreview.net/pdf?id=4vPVBh3fhz", "email": "upenn.edu;postech.ac.kr;upenn.edu;wharton.upenn.edu;upenn.edu", "author_num": 5, "aff_unique_index": "0;1;0;0;0", "aff_unique_norm": "University of Pennsylvania;Pohang University of Science and Technology", "aff_unique_dep": ";", "aff_unique_url": "https://www.upenn.edu;https://www.postech.ac.kr", "aff_unique_abbr": "UPenn;POSTECH", "aff_campus_unique_index": "1", "aff_campus_unique": ";Pohang", "aff_country_unique_index": "0;1;0;0;0", "aff_country_unique": "United States;South Korea" }, { "id": "4w4PDIT3h4", "title": "Focus on Primary: Differential Diverse Data Augmentation for Generalization in Visual Reinforcement Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "In reinforcement learning, it is common for the agent to overfit the training environment, making generalization to unseen environments extremely challenging. Visual reinforcement learning that relies on observed images as input is particularly constrained by generalization and sample efficiency. To address these challenges, various data augmentation methods are consistently attempted to improve the generalization capability and reduce the training cost. However, the naive use of data augmentation can often lead to breakdowns in learning. In this paper, we propose two novel approaches: Diverse Data Augmentation (DDA) and Differential Diverse Data Augmentation (D3A). Leveraging a pre-trained encoder-decoder model, we segment primary pixels to avoid inappropriate data augmentation affecting critical information. DDA improves the generalization capability of the agent in complex environments through consistency of encoding. D3A uses proper data augmentation for primary pixels to further improve generalization while satisfying semantic-invariant state transformation. We extensively evaluate our methods on a series of generalization tasks of DeepMind Control Suite. 
The results demonstrate that our methods significantly improve the generalization performance of the agent in unseen environments, and enable the selection of more diverse data augmentations to improve the sample efficiency of off-policy algorithms.", "keywords": "Visual Reinforcement Learning;Data Augmentation;Generalization", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/746288b2c1978e73fb972b9b6987c3232b790b8d.zip", "author": "Junhong Wu;Jie Liu;Xi Xiong;Daolong An;Shuai L\u00fc", "authorids": "~Junhong_Wu2;~Jie_Liu34;~Xi_Xiong1;~Daolong_An4;~Shuai_L\u00fc1", "gender": ";;M;M;M", "homepage": ";;https://teachers.jlu.edu.cn/lus/en/tdcy/43488/content/1757.htm;;https://lus-jlu.github.io", "dblp": ";https://dblp.uni-trier.de/pid/03/2134-14.html;;371/6068;27/10828-1", "google_scholar": ";;;zvlfGUgAAAAJ;S1T_HV0AAAAJ", "orcid": "0009-0009-9951-0505;;;0009-0005-0020-1990;0000-0002-8081-4498", "linkedin": ";;;andaolong-0a5689179;", "or_profile": "~Junhong_Wu2;~Jie_Liu34;~Xi_Xiong1;~Daolong_An4;~Shuai_L\u00fc1", "aff": "Jilin University;Jilin University;Jilin University;Jilin University;Jilin University", "aff_domain": "jlu.edu.cn;jlu.edu.cn;jlu.edu.cn;jlu.edu.cn;jlu.edu.cn", "position": "MS student;Associate Professor;MS student;MS student;Associate Professor", "bibtex": "@misc{\nwu2024focus,\ntitle={Focus on Primary: Differential Diverse Data Augmentation for Generalization in Visual Reinforcement Learning},\nauthor={Junhong Wu and Jie Liu and Xi Xiong and Daolong An and Shuai L{\\\"u}},\nyear={2024},\nurl={https://openreview.net/forum?id=4w4PDIT3h4}\n}", "github": "", "project": "", "reviewers": "3m8H;XRib;xszw;ziWN", "site": "https://openreview.net/forum?id=4w4PDIT3h4", "pdf_size": 2427548, "rating": "3;3;5;5", "confidence": "4;5;3;3", "soundness": "2;2;3;3", "contribution": "1;2;2;3", "presentation": "2;1;3;3", "wc_summary": "33;168;98;99", "wc_strengths": "10;113;18;34", "wc_weaknesses": "183;354;175;155", "wc_questions": "5;37;5;59", "wc_review": "231;672;296;347", "wc_reply_reviewers": "243;32;0;70", "wc_reply_authors": "1153;1176;680;852", "reply_reviewers": "1;1;0;1", "reply_authors": "3;2;1;2", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 3.75, 0.82915619758885 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 2.25, 0.82915619758885 ], "wc_summary_avg": [ 99.5, 47.74149138851865 ], "wc_strengths_avg": [ 43.75, 40.90461465409496 ], "wc_weaknesses_avg": [ 216.75, 79.89485277538222 ], "wc_questions_avg": [ 26.5, 22.863726730347352 ], "wc_review_avg": [ 386.5, 169.88304800656243 ], "wc_reply_reviewers_avg": [ 86.25, 93.83063199190337 ], "wc_reply_authors_avg": [ 965.25, 208.48186371960512 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 2.0, 0.7071067811865476 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.9045340337332909, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:kzLnSsWpc6cJ:scholar.google.com/&scioq=Focus+on+Primary:+Differential+Diverse+Data+Augmentation+for+Generalization+in+Visual+Reinforcement+Learning&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;0;0;0;0", "aff_unique_norm": "Jilin University", "aff_unique_dep": "", "aff_unique_url": "http://www.jlu.edu.cn", "aff_unique_abbr": "JLU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "China" }, { "id": "4x5SXqqrdv", "title": "Improving Private 
Training via In-distribution Public Data Synthesis and Generalization", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "To alleviate the utility degradation of deep learning classification with differential privacy (DP), employing extra public data or pre-trained models has been widely explored. Recently, the use of in-distribution public data has been investigated, where a tiny subset of data owners share their data publicly. In this paper, to mitigate memorization and overfitting by the limited-sized in-distribution public data, we leverage recent diffusion models and employ various augmentation techniques for improving diversity. We then explore the optimization to discover flat minima to public data and suggest weight multiplicity to enhance the generalization of the private training. While assuming 4\\% of training data as public, our method brings significant performance gain even without using pre-trained models, i.e., achieving 85.78\\% on CIFAR-10 with a privacy budget of $\\varepsilon=2$ and $\\delta=10^{-5}$.", "keywords": "Differential Privacy;Privacy;Optimization;DP-SGD;Diffusion;Synthesis", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/e565f490d512e3062f409456d28c0f7d8b3f3e0a.zip", "author": "Jinseong Park;Yujin Choi;Jaewook Lee", "authorids": "~Jinseong_Park1;~Yujin_Choi1;~Jaewook_Lee1", "gender": "M;F;M", "homepage": "https://github.com/JinseongP;;http://slcf.snu.ac.kr", "dblp": "178/8948-1;251/3065;39/4985-1", "google_scholar": "o4-E5z0AAAAJ;3u0-O2sAAAAJ;teMdzbwAAAAJ", "orcid": "0000-0003-1931-8441;0000-0001-9150-704X;", "linkedin": "jinseong-park-a84740226/;;", "or_profile": "~Jinseong_Park1;~Yujin_Choi1;~Jaewook_Lee1", "aff": "Seoul National University;Seoul National University;Seoul National University", "aff_domain": "snu.ac.kr;snu.ac.kr;snu.ac.kr", "position": "PhD student;PhD student;Full Professor", "bibtex": "@misc{\npark2024improving,\ntitle={Improving Private Training via In-distribution Public Data Synthesis and Generalization},\nauthor={Jinseong Park and Yujin Choi and Jaewook Lee},\nyear={2024},\nurl={https://openreview.net/forum?id=4x5SXqqrdv}\n}", "github": "", "project": "", "reviewers": "9BFG;8NJG;nRz4;jmD4", "site": "https://openreview.net/forum?id=4x5SXqqrdv", "pdf_size": 1125449, "rating": "3;5;5;6", "confidence": "3;4;4;3", "soundness": "2;2;3;3", "contribution": "2;2;3;3", "presentation": "2;2;2;4", "wc_summary": "97;68;51;70", "wc_strengths": "48;76;30;89", "wc_weaknesses": "92;801;340;260", "wc_questions": "21;59;2;4", "wc_review": "258;1004;423;423", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.75, 1.0897247358851685 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.5, 0.8660254037844386 ], "wc_summary_avg": [ 71.5, 16.469669092000604 ], "wc_strengths_avg": [ 60.75, 23.12331074911203 ], "wc_weaknesses_avg": [ 373.25, 262.6798193618992 ], "wc_questions_avg": [ 21.5, 22.874658467395747 ], "wc_review_avg": [ 527.0, 283.5145498911828 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.2294157338705618, "gs_citation": 0, "gs_cited_by_link": 
"https://scholar.google.com/scholar?q=related:9IwEeQN7TZgJ:scholar.google.com/&scioq=Improving+Private+Training+via+In-distribution+Public+Data+Synthesis+and+Generalization&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;0", "aff_unique_norm": "Seoul National University", "aff_unique_dep": "", "aff_unique_url": "https://www.snu.ac.kr", "aff_unique_abbr": "SNU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "South Korea" }, { "id": "4xXOc9nssp", "title": "Patio: Framework for Private Release of Ratios", "track": "main", "status": "Desk Reject", "tldr": "", "abstract": "Averages and ratios are some of the most basic primitives in data analytics, statistics, and machine learning. In this work, we study the differentially private (DP) release of ratios.\nFor tasks for which the numerator $a(\\cdot)$ and denominator $b(\\cdot)$ satisfy a certain general co-monotonicity property, we give a new mechanism \\emph{Patio} (Private rATIO) for privately releasing the ratio $a(\\mathbf{x})/b(\\mathbf{x})$ for an input dataset $\\mathbf{x}$, with strong theoretical guarantees and practical performance.\nWe also prove that under general conditions on $a(\\cdot)$ and $b(\\cdot)$, the variance of our mechanism matches up to a $1+o(1)$ factor the variance of the Laplace distribution scaled with the \\emph{local} sensitivity. This is in contrast with the standard Laplace mechanism, which scales the noise with---the potentially much larger---\\emph{global} sensitivity.\n\nOur algorithm can be applied to a variety of tasks and settings including estimating averages, the Jaccard similarity coefficient, and several metrics quantifying the utility of a classifier such as its precision, sensitivity, specificity and $F$-score. For the above-mentioned statistics, our MSE matches that of the Laplace distribution scaled to the local sensitivity of the given task. 
We perform empirical evaluation showing the better utility of our algorithm compared to natural and state-of-the-art baselines.", "keywords": "privacy;ratio;average", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "Badih Ghazi;Pritish Kamath;Ravi Kumar;Pasin Manurangsi;Adam Sealfon;Jakub Tetek", "authorids": "~Badih_Ghazi1;~Pritish_Kamath2;~Ravi_Kumar1;~Pasin_Manurangsi2;~Adam_Sealfon1;~Jakub_Tetek1", "gender": ";M;M;M;;", "homepage": "https://sites.google.com/view/badihghazi/home;https://pritishkamath.github.io/;https://sites.google.com/site/ravik53/;https://pasin30055.github.io/;https://asealfon.github.io/;https://sites.google.com/view/jakub-tetek/", "dblp": "125/2134;https://dblp.org/pers/k/Kamath:Pritish.html;k/RaviKumar.html;133/2059;150/6253;211/6738", "google_scholar": "GBJLTN8AAAAJ;1JFARhUAAAAJ;J_XhIsgAAAAJ;35hM-PkAAAAJ;nrlhJMcAAAAJ;https://scholar.google.com/citations?view_op=list_works", "orcid": ";;0000-0002-2203-2586;;;0000-0002-2046-1627", "linkedin": "badih-ghazi-608379132/;;ravi-kumar-a3a9631;;;", "or_profile": "~Badih_Ghazi1;~Pritish_Kamath2;~Ravi_Kumar1;~Pasin_Manurangsi2;~Adam_Sealfon1;~Jakub_Tetek1", "aff": "Google;Google Research;Google;Google;Google;University of Copenhagen", "aff_domain": "google.com;google.com;google.com;google.com;google.com;diku.dk", "position": "Researcher;Research Scientist;Research Scientist;Research Scientist;Researcher;PhD student", "bibtex": "@misc{\nghazi2024patio,\ntitle={Patio: Framework for Private Release of Ratios},\nauthor={Badih Ghazi and Pritish Kamath and Ravi Kumar and Pasin Manurangsi and Adam Sealfon and Jakub Tetek},\nyear={2024},\nurl={https://openreview.net/forum?id=4xXOc9nssp}\n}", "github": "", "project": "", "reviewers": "", "site": "https://openreview.net/forum?id=4xXOc9nssp", "pdf_size": 0, "rating": "", "confidence": "", "soundness": "", "contribution": "", "presentation": "", "wc_summary": "", "wc_strengths": "", "wc_weaknesses": "", "wc_questions": "", "wc_review": "", "wc_reply_reviewers": "", "wc_reply_authors": "", "reply_reviewers": "", "reply_authors": "", "rating_avg": [ 0, 0 ], "confidence_avg": [ 0, 0 ], "soundness_avg": [ 0, 0 ], "contribution_avg": [ 0, 0 ], "presentation_avg": [ 0, 0 ], "wc_summary_avg": [ 0, 0 ], "wc_strengths_avg": [ 0, 0 ], "wc_weaknesses_avg": [ 0, 0 ], "wc_questions_avg": [ 0, 0 ], "wc_review_avg": [ 0, 0 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 0, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:zeVd-8HpjGcJ:scholar.google.com/&scioq=Patio:+Framework+for+Private+Release+of+Ratios&hl=en&as_sdt=0,44", "gs_version_total": 0, "aff_unique_index": "0;0;0;0;0;1", "aff_unique_norm": "Google;University of Copenhagen", "aff_unique_dep": "Google;", "aff_unique_url": "https://www.google.com;https://www.ku.dk", "aff_unique_abbr": "Google;UCPH", "aff_campus_unique_index": "0;0;0;0;0", "aff_campus_unique": "Mountain View;", "aff_country_unique_index": "0;0;0;0;0;1", "aff_country_unique": "United States;Denmark" }, { "id": "4y3GDTFv70", "title": "A Latent Space Theory for Emergent Abilities in Large Language Models", "track": "main", "status": "Reject", "tldr": "", "abstract": "Languages are not created randomly but rather to communicate information. 
There is a strong association between languages and their underlying meanings, resulting in a sparse joint distribution that is heavily peaked according to their correlations. Moreover, these peak values happen to match with the marginal distribution of languages due to the sparsity. With the advent of LLMs trained on big data and large models, we can now precisely assess the marginal distribution of languages, providing a convenient means of exploring the sparse structures in the joint distribution for effective inferences. In this paper, we categorize languages as either unambiguous or {\\epsilon}-ambiguous and present quantitative results to demonstrate that the emergent abilities of LLMs, such as language understanding, in-context learning, chain-of-thought prompting, and effective instruction fine-tuning, can all be attributed to Bayesian inference on the sparse joint distribution of languages.", "keywords": "Large Language Model (LLMs); Emergent Abilities; Bayesian Inference; Latent Space", "primary_area": "probabilistic methods (Bayesian methods, variational inference, sampling, UQ, etc.)", "supplementary_material": "/attachment/0f4b531ed89e9be272c73c78c0b0dc0aa2ea6dcd.zip", "author": "Hui Jiang", "authorids": "~Hui_Jiang1", "gender": "M", "homepage": "https://wiki.eecs.yorku.ca/user/hj/", "dblp": "64/3246", "google_scholar": "https://scholar.google.ca/citations?user=lQi05ZkAAAAJ", "orcid": "", "linkedin": "", "or_profile": "~Hui_Jiang1", "aff": "York University", "aff_domain": "yorku.ca", "position": "Full Professor", "bibtex": "@misc{\njiang2024a,\ntitle={A Latent Space Theory for Emergent Abilities in Large Language Models},\nauthor={Hui Jiang},\nyear={2024},\nurl={https://openreview.net/forum?id=4y3GDTFv70}\n}", "github": "", "project": "", "reviewers": "syQW;5EvL;aMxK;Zr2w", "site": "https://openreview.net/forum?id=4y3GDTFv70", "pdf_size": 895127, "rating": "1;3;3;6", "confidence": "4;4;3;3", "soundness": "1;3;2;3", "contribution": "1;2;2;3", "presentation": "2;2;2;3", "wc_summary": "65;31;52;53", "wc_strengths": "6;50;27;46", "wc_weaknesses": "127;279;106;33", "wc_questions": "1;122;2;69", "wc_review": "199;482;187;201", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;218;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;1;0", "rating_avg": [ 3.25, 1.7853571071357126 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.25, 0.82915619758885 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 50.25, 12.234684303242156 ], "wc_strengths_avg": [ 32.25, 17.469616481193857 ], "wc_weaknesses_avg": [ 136.25, 89.49685748672967 ], "wc_questions_avg": [ 48.5, 50.59891303180336 ], "wc_review_avg": [ 267.25, 124.10152094152593 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 54.5, 94.39676901250381 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0.25, 0.4330127018922193 ], "replies_avg": [ 7, 0 ], "authors#_avg": [ 1, 0 ], "corr_rating_confidence": -0.7001400420140049, "gs_citation": 49, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=8083484720921169366&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "aff_unique_index": "0", "aff_unique_norm": "York University", "aff_unique_dep": "", "aff_unique_url": "https://www.yorku.ca", "aff_unique_abbr": "York U", "aff_country_unique_index": "0", "aff_country_unique": "Canada" }, { "title": "Space and time continuous physics simulation from partial observations", "status": "Spotlight", "track": "main", "site": 
"https://iclr.cc/virtual/2024/poster/19444", "id": "4yaFQ7181M", "author_site": "Steeven Janny, Madiha Nadri, Julie Digne, Christian Wolf", "tldr": "", "abstract": "Modern techniques for physical simulations rely on numerical schemes and mesh-refinement methods to address trade-offs between precision and complexity, but these handcrafted solutions are tedious and require high computational power. Data-driven methods based on large-scale machine learning promise high adaptivity by integrating long-range dependencies more directly and efficiently. In this work, we focus on computational fluid dynamics and address the shortcomings of a large part of the literature, which are based on fixed support for computations and predictions in the form of regular or irregular grids. We propose a novel setup to perform predictions in a continuous spatial and temporal domain while being trained on sparse observations. We formulate the task as a double observation problem and propose a solution with two interlinked dynamical systems defined on, respectively, the sparse positions and the continuous domain, which allows to forecast and interpolate a solution from the initial condition. Our practical implementation involves recurrent GNNs and a spatio-temporal attention observer capable of interpolating the solution at arbitrary locations. Our model not only generalizes to new initial conditions (as standard auto-regressive models do) but also performs evaluation at arbitrary space and time locations. We evaluate on three standard datasets in fluid dynamics and compare to strong baselines, which are outperformed in classical settings and the extended new task requiring continuous predictions.", "keywords": "Physics;simulation;interpolation", "primary_area": "applications to physical sciences (physics, chemistry, biology, etc.)", "supplementary_material": "", "author": "Steeven JANNY;Madiha Nadri;Julie Digne;Christian Wolf", "authorids": "~Steeven_JANNY2;~Madiha_Nadri1;~Julie_Digne1;~Christian_Wolf5", "gender": "M;F;F;M", "homepage": "https://steevenjanny.github.io/;;https://perso.liris.cnrs.fr/julie.digne/;https://chriswolfvision.github.io/www/", "dblp": "228/8300;;11/8698;38/2606-1.html", "google_scholar": "IC0ceIgAAAAJ;KOXeslUAAAAJ;https://scholar.google.fr/citations?user=EOBpDNQAAAAJ;idYS1AIAAAAJ", "orcid": ";;0000-0003-0905-0840;", "linkedin": ";;;christian-wolf-522761249/", "or_profile": "~Steeven_JANNY2;~Madiha_Nadri1;~Julie_Digne1;~Christian_Wolf5", "aff": "Naver Labs Europe;Universit\u00e9 Claude Bernard Lyon1 - LAGEPP;LIRIS, CNRS;Naver Labs Europe", "aff_domain": "naverlabs.com;univ-lyon1.fr;liris.cnrs.fr;naverlabs.com", "position": "Researcher;Associate Professor;Researcher;Principal Researcher", "bibtex": "@inproceedings{\njanny2024space,\ntitle={Space and time continuous physics simulation from partial observations},\nauthor={Steeven JANNY and Madiha Nadri and Julie Digne and Christian Wolf},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=4yaFQ7181M}\n}", "github": "", "project": "", "reviewers": "eMKs;VJPj;fAqF;Kpnn;uqXM", "pdf_size": 23760872, "rating": "6;8;8;8;8", "confidence": "2;3;3;3;4", "soundness": "3;4;3;4;3", "contribution": "3;3;3;3;3", "presentation": "4;3;3;4;4", "wc_summary": "71;168;69;44;52", "wc_strengths": "28;112;68;80;32", "wc_weaknesses": "29;250;250;109;141", "wc_questions": "133;176;4;103;195", "wc_review": "261;706;391;336;420", "wc_reply_reviewers": "0;0;65;26;0", "wc_reply_authors": 
"653;433;514;598;630", "reply_reviewers": "0;0;1;1;0", "reply_authors": "1;1;1;1;1", "rating_avg": [ 7.6, 0.7999999999999999 ], "confidence_avg": [ 3.0, 0.6324555320336759 ], "soundness_avg": [ 3.4, 0.4898979485566356 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 3.6, 0.4898979485566356 ], "wc_summary_avg": [ 80.8, 44.77231287302455 ], "wc_strengths_avg": [ 64.0, 31.292171544972714 ], "wc_weaknesses_avg": [ 155.8, 85.12907846323722 ], "wc_questions_avg": [ 122.2, 67.30646328548247 ], "wc_review_avg": [ 422.8, 151.61451117884462 ], "wc_reply_reviewers_avg": [ 18.2, 25.47469332494505 ], "wc_reply_authors_avg": [ 565.6, 81.3402729279906 ], "reply_reviewers_avg": [ 0.4, 0.48989794855663565 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.790569415042095, "gs_citation": 6, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=17782672727549054795&as_sdt=5,48&sciodt=0,48&hl=en", "gs_version_total": 7, "openreview": "https://openreview.net/forum?id=4yaFQ7181M", "pdf": "https://openreview.net/pdf?id=4yaFQ7181M", "email": "naverlabs.com;univ-lyon1.fr;liris.cnrs.fr;naverlabs.com", "author_num": 4, "aff_unique_index": "0;1;2;0", "aff_unique_norm": "NAVER LABS;Universit\u00e9 Claude Bernard Lyon1;CNRS", "aff_unique_dep": ";LAGEPP;LIRIS", "aff_unique_url": "https://labs.naver.com;https://www.universite-lyon1.fr;https://www.cnrs.fr", "aff_unique_abbr": "NLE;UCBL;CNRS", "aff_campus_unique_index": "1", "aff_campus_unique": ";Lyon", "aff_country_unique_index": "0;1;1;0", "aff_country_unique": "Unknown;France" }, { "title": "Beyond Vanilla Variational Autoencoders: Detecting Posterior Collapse in Conditional and Hierarchical Variational Autoencoders", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19443", "id": "4zZFGliCl9", "author_site": "Hien Dang, Tho-Huu Tran, Tan Nguyen, Nhat Ho", "tldr": "", "abstract": "The posterior collapse phenomenon in variational autoencoder (VAE), where the variational posterior distribution closely matches the prior distribution, can hinder the quality of the learned latent variables. As a consequence of posterior collapse, the latent variables extracted by the encoder in VAE preserve less information from the input data and thus fail to produce meaningful representations as input to the reconstruction process in the decoder. While this phenomenon has been an actively addressed topic related to VAE performance, the theory for posterior collapse remains underdeveloped, especially beyond the standard VAE. In this work, we advance the theoretical understanding of posterior collapse to two important and prevalent yet less studied classes of VAE: conditional VAE and hierarchical VAE. Specifically, via a non-trivial theoretical analysis of linear conditional VAE and hierarchical VAE with two levels of latent, we prove that the cause of posterior collapses in these models includes the correlation between the input and output of the conditional VAE and the effect of learnable encoder variance in the hierarchical VAE. 
We empirically validate our theoretical findings for linear conditional and hierarchical VAE and demonstrate that these results are also predictive for non-linear cases with extensive experiments.", "keywords": "variational autoencoders;posterior collapse", "primary_area": "generative models", "supplementary_material": "/attachment/edc531461a86d46ea17a15ff21f0575acc5e5447.zip", "author": "Hien Dang;Tho Tran Huu;Tan Minh Nguyen;Nhat Ho", "authorids": "~Hien_Dang1;~Tho_Tran_Huu1;~Tan_Minh_Nguyen1;~Nhat_Ho1", "gender": ";M;M;M", "homepage": ";;https://tanmnguyen89.github.io/;https://nhatptnk8912.github.io/", "dblp": ";337/2038;255/4725;203/4479", "google_scholar": ";fG3mIYEAAAAJ;OizOh88AAAAJ;https://scholar.google.ca/citations?user=Xs7cKMwAAAAJ", "orcid": ";;;", "linkedin": ";;;nhat-pham-minh-ho-267b8164/", "or_profile": "~Hien_Dang1;~Tho_Tran_Huu1;~Tan_Minh_Nguyen1;~Nhat_Ho1", "aff": ";National University of Singapore;National University of Singapore;University of Texas, Austin", "aff_domain": ";u.nus.edu;nus.edu.sg;utexas.edu", "position": ";PhD student;Assistant Professor;Assistant Professor", "bibtex": "@inproceedings{\ndang2024beyond,\ntitle={Beyond Vanilla Variational Autoencoders: Detecting Posterior Collapse in Conditional and Hierarchical Variational Autoencoders},\nauthor={Hien Dang and Tho Tran Huu and Tan Minh Nguyen and Nhat Ho},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=4zZFGliCl9}\n}", "github": "", "project": "", "reviewers": "1CHE;fUP2;VR5S;Bn1w;vZoP", "pdf_size": 19577412, "rating": "6;6;6;6;8", "confidence": "4;4;3;2;4", "soundness": "3;3;4;4;4", "contribution": "3;3;3;3;4", "presentation": "3;2;3;3;4", "wc_summary": "39;73;71;44;73", "wc_strengths": "21;57;38;92;94", "wc_weaknesses": "95;319;281;295;52", "wc_questions": "27;25;37;137;30", "wc_review": "182;474;427;568;249", "wc_reply_reviewers": "55;6;0;0;0", "wc_reply_authors": "1284;1267;2309;2130;723", "reply_reviewers": "1;1;0;0;0", "reply_authors": "3;2;4;4;1", "rating_avg": [ 6.4, 0.7999999999999999 ], "confidence_avg": [ 3.4, 0.8 ], "soundness_avg": [ 3.6, 0.4898979485566356 ], "contribution_avg": [ 3.2, 0.39999999999999997 ], "presentation_avg": [ 3.0, 0.6324555320336759 ], "wc_summary_avg": [ 60.0, 15.20526224699857 ], "wc_strengths_avg": [ 60.4, 28.959281759049205 ], "wc_weaknesses_avg": [ 208.4, 111.64515215628487 ], "wc_questions_avg": [ 51.2, 43.09245873699945 ], "wc_review_avg": [ 380.0, 143.3555021615843 ], "wc_reply_reviewers_avg": [ 12.2, 21.525798475317934 ], "wc_reply_authors_avg": [ 1542.6, 591.097487729393 ], "reply_reviewers_avg": [ 0.4, 0.48989794855663565 ], "reply_authors_avg": [ 2.8, 1.16619037896906 ], "replies_avg": [ 28, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.37500000000000006, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=15624987190754924422&as_sdt=40005&sciodt=0,10&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=4zZFGliCl9", "pdf": "https://openreview.net/pdf?id=4zZFGliCl9", "email": ";u.nus.edu;nus.edu.sg;utexas.edu", "author_num": 4, "aff_unique_index": "0;0;1", "aff_unique_norm": "National University of Singapore;University of Texas at Austin", "aff_unique_dep": ";", "aff_unique_url": "https://www.nus.edu.sg;https://www.utexas.edu", "aff_unique_abbr": "NUS;UT Austin", "aff_campus_unique_index": "1", "aff_campus_unique": ";Austin", "aff_country_unique_index": "0;0;1", "aff_country_unique": "Singapore;United States" }, { 
"id": "4zfbwpGhd8", "title": "Vision-Language Instruction-enhanced Tuning via Parameter-efficient Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "Instruction tuning has shown promising potential for developing general-purpose AI capabilities in large-scale pretrained models. In multimodal community, this has motivated growing research on enhancing instruction tuning to integrate multimodal information for creative applications. However, existing works have two main limitations: the high training costs and heavy computing resource dependence of full model fine-tuning, and the lack of semantic information in instructions, which hinders multimodal alignment. In this paper, we propose a novel architecture called Vision-Language Instruction-enhanced Tuning via Parameter-efficient Learning (VITAL). Our proposed VITAL first enables lightweight model training using only 2% of parameters through automatic mode approximation. More importantly, VITAL enhances instruction semantics from two perspectives: 1) aggregating more context via enhanced instruction mixture to aid multimodal fusion, and 2) strengthening the connection between the proposed parameter-efficient tuning method and mutual information through our proposed score-based information bottleneck. Validation experiments on six multimodal downstream benchmarks demonstrate that VITAL outperforms state-of-the-art approaches in most cases, even surpassing the performance of full fine-tuning. Besides, extensive experiments on the few-shot setting as well as various visualization analyses have also fully validated our advantages.", "keywords": "Parameter-efficient Learning;Instruction Tuning;MultiModal", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Yihang Zhai;Haixin Wang;Jianlong Chang;Xinlong Yang;Yang Xian;Jinan Sun;Shikun Zhang;Qi Tian", "authorids": "~Yihang_Zhai1;~Haixin_Wang3;~Jianlong_Chang2;~Xinlong_Yang1;~Yang_Xian1;~Jinan_Sun1;~Shikun_Zhang2;~Qi_Tian3", "gender": "M;;M;M;M;M;M;M", "homepage": ";https://willdreamer.github.io/;https://jianlongchange.github.io/;https://xinlong-yang.github.io/;https://github.com/XianYang521225?tab=repositories;;;https://www.qitian1987.com/index.html", "dblp": ";81/5956-3;92/2332;347/2205;https://dblp.org/;16/10588;83/3715.html;78/1467-1.html", "google_scholar": "https://scholar.google.com/citations?hl=zh-CN;RGZUJOkAAAAJ;RDwnNsQAAAAJ;;https://scholar.google.com/;;uiklLscAAAAJ;https://scholar.google.com/citations?hl=en", "orcid": ";0000-0002-5714-0149;;;;;;0000-0002-7252-5047", "linkedin": ";;;;https://www.linkedin.com/?original_referer=https%3A%2F%2Fwww.google.com.hk%2F;;;", "or_profile": "~Yihang_Zhai1;~Haixin_Wang3;~Jianlong_Chang2;~Xinlong_Yang1;~Yang_Xian1;~Jinan_Sun1;~Shikun_Zhang2;~Qi_Tian3", "aff": "Peking University;Peking University;Huawei Technologies Ltd.;Peking University;;Peking University;Peking University;Huawei Technologies Ltd.", "aff_domain": "pku.edu.cn;pku.edu.cn;huawei.com;pku.edu.cn;;pku.edu.cn;pku.edu.cn;huawei.com", "position": "MS student;MS student;Principal Researcher;MS student;;Associate Professor;Full Professor;Principal Researcher", "bibtex": "@misc{\nzhai2024visionlanguage,\ntitle={Vision-Language Instruction-enhanced Tuning via Parameter-efficient Learning},\nauthor={Yihang Zhai and Haixin Wang and Jianlong Chang and Xinlong Yang and Yang Xian and Jinan Sun and Shikun Zhang and Qi Tian},\nyear={2024},\nurl={https://openreview.net/forum?id=4zfbwpGhd8}\n}", 
"github": "", "project": "", "reviewers": "tPPR;GA5A;mPuJ;W366", "site": "https://openreview.net/forum?id=4zfbwpGhd8", "pdf_size": 7959, "rating": "3;3;5;5", "confidence": "5;4;4;3", "soundness": "2;2;3;3", "contribution": "1;2;2;3", "presentation": "2;2;3;2", "wc_summary": "60;56;88;41", "wc_strengths": "11;22;56;80", "wc_weaknesses": "110;331;41;121", "wc_questions": "5;2;43;50", "wc_review": "186;411;228;292", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 61.25, 16.990806337546196 ], "wc_strengths_avg": [ 42.25, 27.38955092731533 ], "wc_weaknesses_avg": [ 150.75, 108.49049497536639 ], "wc_questions_avg": [ 25.0, 21.66794868002045 ], "wc_review_avg": [ 279.25, 84.91576708715526 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 6, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": -0.7071067811865475, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:jgMwmOOqDFcJ:scholar.google.com/&scioq=Vision-Language+Instruction-enhanced+Tuning+via+Parameter-efficient+Learning&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;1;0;0;0;1", "aff_unique_norm": "Peking University;Huawei", "aff_unique_dep": ";Huawei Technologies", "aff_unique_url": "http://www.pku.edu.cn;https://www.huawei.com", "aff_unique_abbr": "Peking U;Huawei", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0;0", "aff_country_unique": "China" }, { "title": "Habitat 3.0: A Co-Habitat for Humans, Avatars, and Robots", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19442", "id": "4znwzG92CE", "author_site": "Xavier Puig, Eric Undersander, Andrew Szot, Mikael Dallaire Cote, Tsung-Yen Yang, Ruslan Partsey, Ruta Desai, Alexander Clegg, Michal Hlavac, So Yeon Min, Vladim\u00edr Vondru\u0161, Theophile Gervet, Vincent-Pierre Berges, John Turner, Oleksandr Maksymets, Zsolt Kira, Mrinal Kalakrishnan, Jitendra Malik, Devendra Singh Chaplot, Unnat Jain, Dhruv Batra, Akshara Rai, Roozbeh Mottaghi", "tldr": "", "abstract": "We present Habitat 3.0: a simulation platform for studying collaborative human-robot tasks in home environments. Habitat 3.0 offers contributions across three dimensions: (1) Accurate humanoid simulation: addressing challenges in modeling complex deformable bodies and diversity in appearance and motion, all while ensuring high simulation speed. (2) Human-in-the-loop infrastructure: enabling real human interaction with simulated robots via mouse/keyboard or a VR interface, facilitating evaluation of robot policies with human input. (3) Collaborative tasks: studying two collaborative tasks, Social Navigation and Social Rearrangement. Social Navigation investigates a robot's ability to locate and follow humanoid avatars in unseen environments, whereas Social Rearrangement addresses collaboration between a humanoid and robot while rearranging a scene. These contributions allow us to study end-to-end learned and heuristic baselines for human-robot collaboration in-depth, as well as evaluate them with humans in the loop. 
Our experiments demonstrate that learned robot policies lead to efficient task completion when collaborating with unseen humanoid agents and human partners that might exhibit behaviors that the robot has not seen before. Additionally, we observe emergent behaviors during collaborative task execution, such as the robot yielding space when obstructing a humanoid agent, thereby allowing the effective completion of the task by the humanoid agent. Furthermore, our experiments using the human-in-the-loop tool demonstrate that our automated evaluation with humanoids can provide an indication of the relative ordering of different policies when evaluated with real human collaborators. Habitat 3.0 unlocks interesting new features in simulators for Embodied AI, and we hope it paves the way for a new frontier of embodied human-AI interaction capabilities. For more details and visualizations, visit: https://aihabitat.org/habitat3.", "keywords": "Embodied AI;Simulation", "primary_area": "datasets and benchmarks", "supplementary_material": "/attachment/ac36aa06501b2d84b16e4f776320cf4bb0a6b707.zip", "author": "Xavier Puig;Eric Undersander;Andrew Szot;Mikael Dallaire Cote;Tsung-Yen Yang;Ruslan Partsey;Ruta Desai;Alexander Clegg;Michal Hlavac;So Yeon Min;Vladim\u00edr Vondru\u0161;Theophile Gervet;Vincent-Pierre Berges;John M Turner;Oleksandr Maksymets;Zsolt Kira;Mrinal Kalakrishnan;Jitendra Malik;Devendra Singh Chaplot;Unnat Jain;Dhruv Batra;Akshara Rai;Roozbeh Mottaghi", "authorids": "~Xavier_Puig1;~Eric_Undersander2;~Andrew_Szot1;~Mikael_Dallaire_Cote1;~Tsung-Yen_Yang2;~Ruslan_Partsey1;~Ruta_Desai1;~Alexander_Clegg1;~Michal_Hlavac1;~So_Yeon_Min2;~Vladim\u00edr_Vondru\u01611;~Theophile_Gervet1;~Vincent-Pierre_Berges1;~John_M_Turner1;~Oleksandr_Maksymets1;~Zsolt_Kira1;~Mrinal_Kalakrishnan1;~Jitendra_Malik2;~Devendra_Singh_Chaplot2;~Unnat_Jain1;~Dhruv_Batra1;~Akshara_Rai1;~Roozbeh_Mottaghi1", "gender": "M;;M;Not Specified;;M;;M;M;F;M;M;;;M;M;M;M;;;Not Specified;;", "homepage": "https://people.csail.mit.edu/xavierpuig/;https://www.ericundersander.com/;https://www.andrewszot.com;https://github.com/0mdc;https://sites.google.com/view/tyjimmyyang;;;;http://hlavac.design;;https://magnum.graphics;https://theophilegervet.github.io;;http://johnmturner.com/;https://research.fb.com/people/maksymets-oleksandr/;https://faculty.cc.gatech.edu/~zk15;;https://people.eecs.berkeley.edu/~malik/;;;https://dhruvbatra.com;https://ai.facebook.com/people/akshara-rai;http://roozbehm.info", "dblp": "50/8429;209/9989;;;204/7980;;;165/9761;;78/84;;;227/3339.html;;239/4227;36/4127;46/4195;58/2944;;;67/6586;;36/633", "google_scholar": ";;IwIWKPYAAAAJ;;g-hQdY8AAAAJ;6h1O4AMAAAAJ;;https://scholar.google.com/citations?hl=en;;dkRTvvcAAAAJ;;-o8kQPwAAAAJ;JEr3qVwAAAAJ;;https://scholar.google.com.ua/citations?user=ZKDLDQoAAAAJ;2a5XgNAAAAAJ;DMTuJzAAAAAJ;oY9R5YQAAAAJ;;;_bs7PqgAAAAJ;;CCV58dgAAAAJ", "orcid": ";;;;;0000-0003-3694-7506;;;;;;;;;;0000-0002-2626-2004;;0000-0003-3695-1580;;;;;", "linkedin": ";ericu;;https://linkedin.com/in/mdcote;tsung-yen-yang;;;alexander-clegg-68336839;michalhlavac;;;theophile-gervet/;vincentpierreberges/;;maksymets/;;mrinalkalakrishnan/;;;;;;roozbeh-mottaghi-63397aa0", "or_profile": 
"~Xavier_Puig1;~Eric_Undersander2;~Andrew_Szot1;~Mikael_Dallaire_Cote1;~Tsung-Yen_Yang2;~Ruslan_Partsey1;~Ruta_Desai1;~Alexander_Clegg1;~Michal_Hlavac1;~So_Yeon_Min2;~Vladim\u00edr_Vondru\u01611;~Theophile_Gervet1;~Vincent-Pierre_Berges1;~John_M_Turner1;~Oleksandr_Maksymets1;~Zsolt_Kira1;~Mrinal_Kalakrishnan1;~Jitendra_Malik2;~Devendra_Singh_Chaplot2;~Unnat_Jain1;~Dhruv_Batra1;~Akshara_Rai1;~Roozbeh_Mottaghi1", "aff": "Meta;Meta ;Georgia Institute of Technology;;Meta AI;Ukrainian Catholic University;;Meta AI;Meta;Carnegie Mellon University;Magnum Engine;;Meta;;Meta;Georgia Institute of Technology;Meta;University of California, Berkeley;;;Georgia Institute of Technology;FAIR, Meta AI;University of Washington", "aff_domain": "fb.com;meta.com;gatech.edu;;meta.com;ucu.edu.ua;;meta.com;meta.com;andrew.cmu.edu;magnum.graphics;;meta.com;;meta.com;gatech.edu;meta.com;berkeley.edu;;;gatech.edu;meta.com;cs.washington.edu", "position": "Researcher;Research Engineer;PhD student;;Researcher;Researcher;;Researcher;Designer;PhD student;Founder;;Researcher;;Researcher;Assistant Professor;Researcher;Full Professor;;;Associate Professor;Researcher;Affiliate Professor ", "bibtex": "@inproceedings{\npuig2024habitat,\ntitle={Habitat 3.0: A Co-Habitat for Humans, Avatars, and Robots},\nauthor={Xavier Puig and Eric Undersander and Andrew Szot and Mikael Dallaire Cote and Tsung-Yen Yang and Ruslan Partsey and Ruta Desai and Alexander Clegg and Michal Hlavac and So Yeon Min and Vladim{\\'\\i}r Vondru{\\v{s}} and Theophile Gervet and Vincent-Pierre Berges and John M Turner and Oleksandr Maksymets and Zsolt Kira and Mrinal Kalakrishnan and Jitendra Malik and Devendra Singh Chaplot and Unnat Jain and Dhruv Batra and Akshara Rai and Roozbeh Mottaghi},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=4znwzG92CE}\n}", "github": "", "project": "", "reviewers": "ndxG;FYWe;HoUA", "pdf_size": 8674247, "rating": "6;6;8", "confidence": "3;4;5", "soundness": "2;3;4", "contribution": "2;3;4", "presentation": "3;3;4", "wc_summary": "300;89;102", "wc_strengths": "276;66;215", "wc_weaknesses": "230;93;120", "wc_questions": "193;272;2", "wc_review": "999;520;439", "wc_reply_reviewers": "70;193;0", "wc_reply_authors": "1781;2020;428", "reply_reviewers": "1;1;0", "reply_authors": "4;4;1", "rating_avg": [ 6.666666666666667, 0.9428090415820634 ], "confidence_avg": [ 4.0, 0.816496580927726 ], "soundness_avg": [ 3.0, 0.816496580927726 ], "contribution_avg": [ 3.0, 0.816496580927726 ], "presentation_avg": [ 3.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 163.66666666666666, 96.54820327461074 ], "wc_strengths_avg": [ 185.66666666666666, 88.20556797743679 ], "wc_weaknesses_avg": [ 147.66666666666666, 59.25275427259807 ], "wc_questions_avg": [ 155.66666666666666, 113.34411713401313 ], "wc_review_avg": [ 652.6666666666666, 247.1171562010394 ], "wc_reply_reviewers_avg": [ 87.66666666666667, 79.77607550025397 ], "wc_reply_authors_avg": [ 1409.6666666666667, 700.9671097055046 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 3.0, 1.4142135623730951 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 23, 0 ], "corr_rating_confidence": 0.8660254037844385, "gs_citation": 111, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=4645667612256940045&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=4znwzG92CE", "pdf": 
"https://openreview.net/pdf?id=4znwzG92CE", "email": "fb.com;meta.com;gatech.edu;;meta.com;ucu.edu.ua;;meta.com;meta.com;andrew.cmu.edu;magnum.graphics;;meta.com;;meta.com;gatech.edu;meta.com;berkeley.edu;;;gatech.edu;meta.com;cs.washington.edu", "author_num": 23, "aff_unique_index": "0;0;1;0;2;0;0;3;4;0;0;1;0;5;1;0;6", "aff_unique_norm": "Meta;Georgia Institute of Technology;Ukrainian Catholic University;Carnegie Mellon University;Magnum Engine;University of California, Berkeley;University of Washington", "aff_unique_dep": "Meta Platforms, Inc.;;;;;;", "aff_unique_url": "https://meta.com;https://www.gatech.edu;https://ucu.edu.ua;https://www.cmu.edu;;https://www.berkeley.edu;https://www.washington.edu", "aff_unique_abbr": "Meta;Georgia Tech;UCU;CMU;;UC Berkeley;UW", "aff_campus_unique_index": "1", "aff_campus_unique": ";Berkeley", "aff_country_unique_index": "0;0;0;0;1;0;0;0;0;0;0;0;0;0;0;0", "aff_country_unique": "United States;Ukraine;" }, { "id": "506Sxc0Adp", "title": "Beyond Scale: the Diversity Coefficient as a Data Quality Metric Demonstrates LLMs are Pre-trained on Formally Diverse Data", "track": "main", "status": "Reject", "tldr": "", "abstract": "Current trends to pre-train capable Large Language Models (LLMs) mostly focus on scaling of model and dataset size. However, the of pre-training data is an important factor for training powerful LLMs, yet it is a nebulous concept that has not been fully characterized. Therefore, we use the recently proposed Task2Vec diversity coefficient to understand formal aspects of data \\textit{quality} that go beyond scale alone. Specifically, we measure the diversity coefficient of publicly available pre-training datasets to demonstrate that their formal diversity is high when compared to theoretical lower and upper bounds. In addition, to build confidence in the diversity coefficient, we conduct interpretability experiments and find that the coefficient aligns with intuitive properties of diversity, e.g., it increases as the number of latent concepts increases. 
We conclude the diversity coefficient is reliable and conjecture it can be used to build useful diverse datasets for LLMs.", "keywords": "machine learning;large language models;metrics;data diversity;data;data quality", "primary_area": "generative models", "supplementary_material": "/attachment/e6f362b9be0e39c559d4f1f7e49f1e2d1661d1d1.pdf", "author": "Brando Miranda;Alycia Lee;Sudharsan Sundar;Sanmi Koyejo", "authorids": "~Brando_Miranda1;~Alycia_Lee1;sjsundar@stanford.edu;~Sanmi_Koyejo1", "gender": "M;;;", "homepage": "https://cbmm.mit.edu/about/people/miranda;;;", "dblp": ";;;", "google_scholar": "_NQJoBkAAAAJ;;;", "orcid": ";;;", "linkedin": "brando-miranda-40821046/;;;", "or_profile": "~Brando_Miranda1;~Alycia_Lee1;sjsundar@stanford.edu;~Sanmi_Koyejo1", "aff": "Stanford University;;;", "aff_domain": "stanford.edu;;;", "position": "PhD student;;;", "bibtex": "@misc{\nmiranda2024beyond,\ntitle={Beyond Scale: the Diversity Coefficient as a Data Quality Metric Demonstrates {LLM}s are Pre-trained on Formally Diverse Data},\nauthor={Brando Miranda and Alycia Lee and Sudharsan Sundar and Sanmi Koyejo},\nyear={2024},\nurl={https://openreview.net/forum?id=506Sxc0Adp}\n}", "github": "", "project": "", "reviewers": "FQiZ;kREU;Z6o3;H6fT", "site": "https://openreview.net/forum?id=506Sxc0Adp", "pdf_size": 476111, "rating": "1;3;6;6", "confidence": "4;4;4;2", "soundness": "1;2;3;4", "contribution": "1;2;3;3", "presentation": "1;3;2;3", "wc_summary": "65;115;83;101", "wc_strengths": "63;28;57;87", "wc_weaknesses": "185;143;336;80", "wc_questions": "283;125;202;1", "wc_review": "596;411;678;269", "wc_reply_reviewers": "183;28;51;14", "wc_reply_authors": "2281;2430;2380;1220", "reply_reviewers": "1;1;1;1", "reply_authors": "3;4;5;3", "rating_avg": [ 4.0, 2.1213203435596424 ], "confidence_avg": [ 3.5, 0.8660254037844386 ], "soundness_avg": [ 2.5, 1.118033988749895 ], "contribution_avg": [ 2.25, 0.82915619758885 ], "presentation_avg": [ 2.25, 0.82915619758885 ], "wc_summary_avg": [ 91.0, 18.81488772222678 ], "wc_strengths_avg": [ 58.75, 21.00446381129497 ], "wc_weaknesses_avg": [ 186.0, 94.32125953357493 ], "wc_questions_avg": [ 152.75, 103.90951592611718 ], "wc_review_avg": [ 488.5, 159.41533803244906 ], "wc_reply_reviewers_avg": [ 69.0, 67.1304699819687 ], "wc_reply_authors_avg": [ 2077.75, 498.11664045683113 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 3.75, 0.82915619758885 ], "replies_avg": [ 26, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.5443310539518174, "gs_citation": 30, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=9241919353973672522&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 6, "aff_unique_index": "0", "aff_unique_norm": "Stanford University", "aff_unique_dep": "", "aff_unique_url": "https://www.stanford.edu", "aff_unique_abbr": "Stanford", "aff_campus_unique_index": "0", "aff_campus_unique": "Stanford", "aff_country_unique_index": "0", "aff_country_unique": "United States" }, { "id": "50P9TDPEsh", "title": "Critique Ability of Large Language Models", "track": "main", "status": "Reject", "tldr": "", "abstract": "Critical thinking is essential for rational decision-making and problem-solving. This skill hinges on the ability to provide precise and reasoned critiques and is a hallmark of human intelligence. In the era of large language models (LLMs), this study explores the ability of LLMs to deliver accurate critiques across various tasks. 
We are interested in this topic as a capable critic model could not only serve as a reliable evaluator, but also as a source of supervised signals for model tuning. Particularly, if a model can self-critique, it has the potential for autonomous self-improvement. To examine this, we introduce a unified evaluation framework for assessing the critique abilities of LLMs. We develop a benchmark called CriticBench, which comprises $3$K high-quality natural language queries and corresponding model responses; and annotate the correctness of these responses. The benchmark covers tasks such as math problem-solving, code completion, and question answering. We evaluate multiple LLMs on the collected dataset and our analysis reveals several noteworthy insights: (1) Critique is generally challenging for most LLMs, and this capability often emerges only when models are sufficiently large. (2) In particular, self-critique is especially difficult. Even top-performing LLMs struggle to achieve satisfactory performance. (3) Models tend to have lower critique accuracy on problems where they are most uncertain. To this end, we introduce a simple yet effective baseline named self-check, which leverages self-critique to improve task performance for various models. We hope this study serves as an initial exploration into understanding the critique abilities of LLMs, and aims to inform future research, including the development of more proficient critic models and the application of critiques across diverse tasks.", "keywords": "LLM;Large Language Models;Critique;Self-Critique;Emergent Ability;Reasoning", "primary_area": "datasets and benchmarks", "supplementary_material": "/attachment/0a07401ab8e4b7b35d1688974279a382f8ddc398.pdf", "author": "Liangchen Luo;Zi Lin;Yinxiao Liu;Lei Shu;Yun Zhu;Jingbo Shang;Lei Meng", "authorids": "~Liangchen_Luo1;~Zi_Lin1;~Yinxiao_Liu2;~Lei_Shu1;~Yun_Zhu5;~Jingbo_Shang2;~Lei_Meng2", "gender": "M;F;M;F;;M;F", "homepage": "https://www.luolc.com;https://zi-lin.com/;;https://leishu02.github.io/;;https://shangjingbo1226.github.io/;https://scholar.google.com/citations?user=7XxgNUsAAAAJ&hl=en&oi=ao", "dblp": "225/6429;81/2999;;19/2932-4;;151/3145.html;", "google_scholar": "8ei4_E4AAAAJ;kgZYttUAAAAJ;https://scholar.google.com/citations?hl=en;Q0zkC-kAAAAJ;;0SkFI4MAAAAJ;", "orcid": ";;;;;;", "linkedin": ";zi-lin/;;shu-lei-8b361642/;;;", "or_profile": "~Liangchen_Luo1;~Zi_Lin1;~Yinxiao_Liu2;~Lei_Shu1;~Yun_Zhu5;~Jingbo_Shang2;~Lei_Meng2", "aff": "Google DeepMind;University of California, San Diego;Research, Google;Google;;University of California, San Diego;", "aff_domain": "google.com;ucsd.edu;research.google.com;google.com;;ucsd.edu;", "position": "Researcher;Graduate student;Researcher;Researcher;;Assistant Professor;", "bibtex": "@misc{\nluo2024critique,\ntitle={Critique Ability of Large Language Models},\nauthor={Liangchen Luo and Zi Lin and Yinxiao Liu and Lei Shu and Yun Zhu and Jingbo Shang and Lei Meng},\nyear={2024},\nurl={https://openreview.net/forum?id=50P9TDPEsh}\n}", "github": "", "project": "", "reviewers": "qpMo;WsbC;qunD", "site": "https://openreview.net/forum?id=50P9TDPEsh", "pdf_size": 1144366, "rating": "3;5;6", "confidence": "4;3;4", "soundness": "3;3;3", "contribution": "3;3;2", "presentation": "2;3;3", "wc_summary": "37;77;103", "wc_strengths": "57;69;57", "wc_weaknesses": "153;162;201", "wc_questions": "72;1;51", "wc_review": "319;309;412", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "796;357;862", "reply_reviewers": "0;0;0", "reply_authors": "1;1;2", "rating_avg": [ 
4.666666666666667, 1.247219128924647 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 72.33333333333333, 27.145697428669774 ], "wc_strengths_avg": [ 61.0, 5.656854249492381 ], "wc_weaknesses_avg": [ 172.0, 20.83266665599966 ], "wc_questions_avg": [ 41.333333333333336, 29.78067979225607 ], "wc_review_avg": [ 346.6666666666667, 46.37767662236745 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 671.6666666666666, 224.1284354015696 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.3333333333333333, 0.4714045207910317 ], "replies_avg": [ 10, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.18898223650461363, "gs_citation": 14, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=17074660022459503280&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 3, "aff_unique_index": "0;1;0;0;1", "aff_unique_norm": "Google;University of California, San Diego", "aff_unique_dep": "Google DeepMind;", "aff_unique_url": "https://deepmind.com;https://www.ucsd.edu", "aff_unique_abbr": "DeepMind;UCSD", "aff_campus_unique_index": "1;2;2;1", "aff_campus_unique": ";San Diego;Mountain View", "aff_country_unique_index": "0;1;1;1;1", "aff_country_unique": "United Kingdom;United States" }, { "id": "50vyPuz0iv", "title": "Iteratively Refined Behavior Regularization for Offline Reinforcement Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "One of the fundamental challenges for offline reinforcement learning (RL) is ensuring robustness to data distribution. \nWhether the data originates from a near-optimal policy or not, we anticipate that an algorithm should demonstrate its ability to learn an effective control policy that seamlessly aligns with the inherent distribution of offline data. Unfortunately, behavior regularization, a simple yet effective offline RL algorithm, tends to struggle in this regard. In this paper, we propose a new algorithm that substantially enhances behavior-regularization based on conservative policy iteration. Our key observation is that by iteratively refining the reference policy used for behavior regularization, conservative policy update guarantees gradual improvement, while also implicitly avoiding querying out-of-sample actions to prevent catastrophic learning failures. We prove that in the tabular setting this algorithm is capable of learning the optimal policy covered by the offline dataset, commonly referred to as the in-sample optimal policy. We then explore several implementation details of the algorithm when function approximations are applied. The resulting algorithm is easy to implement, requiring only a few lines of code modification to existing methods. 
Experimental results on the D4RL benchmark indicate that our method outperforms previous state-of-the-art baselines in most tasks, clearly demonstrating its superiority over behavior regularization.", "keywords": "Offline Reinforcement Learning", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Xiaohan Hu;Yi Ma;Chenjun Xiao;YAN ZHENG;Jianye HAO", "authorids": "~Xiaohan_Hu1;~Yi_Ma5;~Chenjun_Xiao1;~YAN_ZHENG1;~Jianye_HAO1", "gender": "M;;;M;M", "homepage": ";https://mayi1996.top/;https://chenjun-x.github.io/;https://yanzzzzz.github.io;http://www.icdai.org/jianye.html", "dblp": ";69/1112-5.html;178/8641;10/2381-2;21/7664.html", "google_scholar": ";TdVWzqgAAAAJ;;https://scholar.google.com.hk/citations?user=tJuhd1kAAAAJ;", "orcid": "0000-0001-7645-201X;0000-0001-9375-6605;0000-0002-5493-1500;;0000-0002-0422-8235", "linkedin": ";;;;", "or_profile": "~Xiaohan_Hu1;~Yi_Ma5;~Chenjun_Xiao1;~YAN_ZHENG1;~Jianye_HAO1", "aff": "Tianjin University;Tianjin University;Huawei Technologies Ltd.;Tianjin University, China;Tianjin University", "aff_domain": "tju.edu.cn;tju.edu.cn;huawei.com;tju.edu.cn;tju.edu.cn", "position": "MS student;PhD student;Researcher;Associate Professor;Associate Professor", "bibtex": "@misc{\nhu2024iteratively,\ntitle={Iteratively Refined Behavior Regularization for Offline Reinforcement Learning},\nauthor={Xiaohan Hu and Yi Ma and Chenjun Xiao and YAN ZHENG and Jianye HAO},\nyear={2024},\nurl={https://openreview.net/forum?id=50vyPuz0iv}\n}", "github": "", "project": "", "reviewers": "cTmM;JFNQ;ByMR", "site": "https://openreview.net/forum?id=50vyPuz0iv", "pdf_size": 565586, "rating": "3;3;6", "confidence": "4;5;3", "soundness": "3;2;3", "contribution": "2;2;2", "presentation": "3;2;4", "wc_summary": "48;74;139", "wc_strengths": "53;9;45", "wc_weaknesses": "100;158;205", "wc_questions": "1;116;62", "wc_review": "202;357;451", "wc_reply_reviewers": "142;0;197", "wc_reply_authors": "454;775;1280", "reply_reviewers": "2;0;2", "reply_authors": "3;2;3", "rating_avg": [ 4.0, 1.4142135623730951 ], "confidence_avg": [ 4.0, 0.816496580927726 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 3.0, 0.816496580927726 ], "wc_summary_avg": [ 87.0, 38.27096375408734 ], "wc_strengths_avg": [ 35.666666666666664, 19.136933459209764 ], "wc_weaknesses_avg": [ 154.33333333333334, 42.94440850939994 ], "wc_questions_avg": [ 59.666666666666664, 46.977536002741665 ], "wc_review_avg": [ 336.6666666666667, 102.66558440988014 ], "wc_reply_reviewers_avg": [ 113.0, 82.99799194358059 ], "wc_reply_authors_avg": [ 836.3333333333334, 339.9905227437311 ], "reply_reviewers_avg": [ 1.3333333333333333, 0.9428090415820634 ], "reply_authors_avg": [ 2.6666666666666665, 0.4714045207910317 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.8660254037844387, "gs_citation": 7, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6920572114126102147&as_sdt=80000005&sciodt=0,23&hl=en", "gs_version_total": 4, "aff_unique_index": "0;0;1;0;0", "aff_unique_norm": "Tianjin University;Huawei", "aff_unique_dep": ";Huawei Technologies", "aff_unique_url": "http://www.tju.edu.cn;https://www.huawei.com", "aff_unique_abbr": "TJU;Huawei", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "China" }, { "id": "51cjeYcXjs", "title": "Search and Retrieval in Semantic-Structural Representations of Novel Malware", "track": "main", "status": 
"Reject", "tldr": "", "abstract": "In this study we present a novel representation for binary programs, which captures semantic similarity and structural properties. Our representation is composed in a bottom-up approach and enables new methods of analysis. We show that we can perform search and retrieval of binary executable programs based on similarity of behavioral properties, with an adjustable level of feature resolution. We begin by extracting data dependency graphs (DDG), which are representative of both program structure and operational semantics. We then encode each program as a set of graph hashes representing isomorphic uniqueness, a method we have labeled DDG Fingerprinting. Next, we use k-Nearest Neighbors to search in a metric space constructed from examples. This approach allows us to perform a quantitative analysis of patterns of program operation. By evaluating similarity of behavior we are able to recognize patterns in novel malware with functionality not previously identified. We present experimental results from search based on program semantics and structural properties in a dataset of binary executables with features extracted using our method of representation. We show that the associated metric space allows an adjustable level of resolution. Resolution of the features may be decreased for breadth of search and retrieval, or as the search space is reduced, the resolution may be increased for accuracy and fine-grained analysis of malware behavior.", "keywords": "Malware Analysis;Explainability", "primary_area": "visualization or interpretation of learned representations", "supplementary_material": "", "author": "John Musgrave;Alina Campan;Anca L Ralescu", "authorids": "~John_Musgrave1;~Alina_Campan1;~Anca_L_Ralescu1", "gender": ";F;F", "homepage": "https://johnmusgrave.com;;https://www.ceas3.uc.edu/profiles/ralescal", "dblp": ";63/4876;", "google_scholar": "_CQx1CwAAAAJ;;https://scholar.google.com/citations?hl=en", "orcid": "0000-0001-7646-4328;;", "linkedin": ";;anca-ralescu-97292b7/", "or_profile": "~John_Musgrave1;~Alina_Campan1;~Anca_L_Ralescu1", "aff": ";Northern Kentucky University;University of Cincinnati", "aff_domain": ";nku.edu;uc.edu", "position": ";Full Professor;Full Professor", "bibtex": "@misc{\nmusgrave2024search,\ntitle={Search and Retrieval in Semantic-Structural Representations of Novel Malware},\nauthor={John Musgrave and Alina Campan and Anca L Ralescu},\nyear={2024},\nurl={https://openreview.net/forum?id=51cjeYcXjs}\n}", "github": "", "project": "", "reviewers": "PPca;5Qou;Qcjm;pKB5", "site": "https://openreview.net/forum?id=51cjeYcXjs", "pdf_size": 337727, "rating": "1;3;3;3", "confidence": "4;4;3;4", "soundness": "1;2;2;2", "contribution": "1;2;2;2", "presentation": "1;1;2;2", "wc_summary": "77;83;79;50", "wc_strengths": "3;20;35;49", "wc_weaknesses": "141;253;35;151", "wc_questions": "52;37;206;5", "wc_review": "273;393;355;255", "wc_reply_reviewers": "0;57;0;0", "wc_reply_authors": "0;534;749;783", "reply_reviewers": "0;1;0;0", "reply_authors": "0;2;1;1", "rating_avg": [ 2.5, 0.8660254037844386 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 1.75, 0.4330127018922193 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 1.5, 0.5 ], "wc_summary_avg": [ 72.25, 13.026415470113028 ], "wc_strengths_avg": [ 26.75, 17.122718826167766 ], "wc_weaknesses_avg": [ 145.0, 77.1621668954417 ], "wc_questions_avg": [ 75.0, 77.51451476981585 ], "wc_review_avg": [ 319.0, 56.97367813297646 ], "wc_reply_reviewers_avg": [ 
14.25, 24.681724007856502 ], "wc_reply_authors_avg": [ 516.5, 313.1122003371954 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.0, 0.7071067811865476 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.3333333333333333, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=2866760772493619036&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "aff_unique_index": "0;1", "aff_unique_norm": "Northern Kentucky University;University of Cincinnati", "aff_unique_dep": ";", "aff_unique_url": "https://nku.edu;https://www.uc.edu", "aff_unique_abbr": "NKU;UC", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "title": "Be Aware of the Neighborhood Effect: Modeling Selection Bias under Interference", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19441", "id": "52fz5sUAy2", "author_site": "Haoxuan Li, Chunyuan Zheng, Sihao Ding, Peng Wu, Zhi Geng, Fuli Feng, Xiangnan He", "tldr": "", "abstract": "Selection bias in recommender systems arises from the recommendation process of system filtering and the interactive process of user selection. Many previous studies have focused on addressing selection bias to achieve unbiased learning of the prediction model, but ignore the fact that potential outcomes for a given user-item pair may vary with the treatments assigned to other user-item pairs, named the neighborhood effect. To fill the gap, this paper formally formulates the neighborhood effect as an interference problem from the perspective of causal inference, and introduces a treatment representation to capture the neighborhood effect. On this basis, we propose a novel ideal loss that can be used to deal with selection bias in the presence of neighborhood effect. We further develop two new estimators for estimating the proposed ideal loss. We theoretically establish the connection between the proposed and previous debiasing methods ignoring the neighborhood effect, showing that the proposed methods can achieve unbiased learning when both selection bias and neighborhood effects are present, while the existing methods are biased. 
Extensive semi-synthetic and real-world experiments are conducted to demonstrate the effectiveness of the proposed methods.", "keywords": "Selection Bias;Neighborhood effect;Recommender system", "primary_area": "causal reasoning", "supplementary_material": "/attachment/c41c6251cb39606f501706bb9c93e3e8467f0795.zip", "author": "Haoxuan Li;Chunyuan Zheng;Sihao Ding;Peng Wu;Zhi Geng;Fuli Feng;Xiangnan He", "authorids": "~Haoxuan_Li6;~Chunyuan_Zheng1;~Sihao_Ding2;~Peng_Wu5;~Zhi_Geng1;~Fuli_Feng1;~Xiangnan_He1", "gender": "M;M;M;M;M;M;M", "homepage": "https://haoxuanli-pku.github.io/;;;https://pengwu.site/;https://stxy.btbu.edu.cn/szdw/bssds/34339356074b408c8650309f05f24558.htm;https://fulifeng.github.io/;http://staff.ustc.edu.cn/~hexn", "dblp": "145/4965-1.html;;https://dblp.uni-trier.de/pid/133/4721-3;15/6146-12;;183/9198;59/1007", "google_scholar": "gtDqiucAAAAJ;https://scholar.google.com/citations?hl=en;https://scholar.google.com/citations?hl=en;https://scholar.google.com/citations?view_op=list_works;;https://scholar.google.com.sg/citations?user=QePM4u8AAAAJ;https://scholar.google.com.sg/citations?user=X45Go24AAAAJ", "orcid": "0000-0003-3620-3769;0000-0002-0306-7310;0000-0003-1796-8504;0000-0001-7154-8880;;0000-0002-5828-9842;0000-0001-8472-7992", "linkedin": ";;;;;;", "or_profile": "~Haoxuan_Li6;~Chunyuan_Zheng1;~Sihao_Ding2;~Peng_Wu5;~Zhi_Geng1;~Fuli_Feng1;~Xiangnan_He1", "aff": "Peking University;Peking University;;Beijing Technology and Business University;School of mathematical Science, Peking University, Peking University;University of Science and Technology of China;University of Science and Technology of China", "aff_domain": "pku.edu.cn;stu.pku.edu.cn;;btbu.edu.cn;math.pku.edu.cn;ustc.edu.cn;ustc.edu.cn", "position": "PhD student;PhD student;;Associate Professor;Full Professor;Full Professor;Professor", "bibtex": "@inproceedings{\nli2024be,\ntitle={Be Aware of the Neighborhood Effect: Modeling Selection Bias under Interference for Recommendation},\nauthor={Haoxuan Li and Chunyuan Zheng and Sihao Ding and Peng Wu and Zhi Geng and Fuli Feng and Xiangnan He},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=52fz5sUAy2}\n}", "github": "", "project": "", "reviewers": "TJ54;g9eU;1Wkk;qJ35", "pdf_size": 662651, "rating": "5;6;8;8", "confidence": "4;2;3;3", "soundness": "2;3;3;3", "contribution": "2;3;3;3", "presentation": "3;3;3;3", "wc_summary": "73;107;92;86", "wc_strengths": "105;16;245;41", "wc_weaknesses": "201;10;82;144", "wc_questions": "5;1;218;5", "wc_review": "384;134;637;276", "wc_reply_reviewers": "0;0;0;20", "wc_reply_authors": "1109;274;861;713", "reply_reviewers": "0;0;0;1", "reply_authors": "2;1;2;2", "rating_avg": [ 6.75, 1.299038105676658 ], "confidence_avg": [ 3.0, 0.7071067811865476 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 89.5, 12.216791722870616 ], "wc_strengths_avg": [ 101.75, 88.84642648975816 ], "wc_weaknesses_avg": [ 109.25, 71.09632550279937 ], "wc_questions_avg": [ 57.25, 92.82342107464042 ], "wc_review_avg": [ 357.75, 183.99507466233982 ], "wc_reply_reviewers_avg": [ 5.0, 8.660254037844387 ], "wc_reply_authors_avg": [ 739.25, 303.5970808489436 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.75, 0.4330127018922193 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.2721655269759087, "gs_citation": 13, 
"gs_cited_by_link": "https://scholar.google.com/scholar?cites=2439006638808384385&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=52fz5sUAy2", "pdf": "https://openreview.net/pdf?id=52fz5sUAy2", "email": "pku.edu.cn;stu.pku.edu.cn;;btbu.edu.cn;math.pku.edu.cn;ustc.edu.cn;ustc.edu.cn", "author_num": 7, "aff_unique_index": "0;0;1;0;2;2", "aff_unique_norm": "Peking University;Beijing Technology and Business University;University of Science and Technology of China", "aff_unique_dep": ";;", "aff_unique_url": "http://www.pku.edu.cn;http://www.btbu.edu.cn;http://www.ustc.edu.cn", "aff_unique_abbr": "Peking U;BTBU;USTC", "aff_campus_unique_index": "1", "aff_campus_unique": ";Peking", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "China" }, { "id": "52igC7K5Mf", "title": "GC-Mixer: A Novel Architecture for Time-varying Granger Causality Inference", "track": "main", "status": "Reject", "tldr": "", "abstract": "The neural network has emerged as a practical approach to evaluate the Granger causality in multivariate time series. However, most existing studies on Granger causality inference are based on time-invariance. In this paper, we propose a novel MLP architecture, Granger Causality Mixer (GC-Mixer), which extracts parameters from the weight matrix and imposes the hierarchical group lasso penalty on these parameters to infer time-invariant Granger causality and automatically select time lags. Furthermore, we extend GC-Mixer by introducing a multi-level fine-tuning algorithm to split time series automatically and infer time-varying Granger causality. We conduct experiments on the VAR and Lorenz-96 datasets, and the results show that GC-Mixer achieves outstanding performances in Granger causality inference.", "keywords": "Granger causality;Time-varying;Time series;Neural network", "primary_area": "causal reasoning", "supplementary_material": "/attachment/9b7ed64ea0567b5351ea85345669a64d4767c037.zip", "author": "Meiliang Liu;Junhao Huang;Yixiao Wang;Zhengye Si;Zhiwen Zhao", "authorids": "~Meiliang_Liu1;~Junhao_Huang4;~Yixiao_Wang2;~Zhengye_Si1;~Zhiwen_Zhao2", "gender": "M;M;F;M;M", "homepage": ";;;;https://cist.bnu.edu.cn/xygk/szdw/zgj/110688.html", "dblp": "381/8230.html;;;;03/10847.html", "google_scholar": "iOwkIcoAAAAJ;;https://scholar.google.com.hk/citations?user=pPac-I4AAAAJ;;", "orcid": "0009-0005-6795-1518;0000-0003-4477-3358;;0000-0003-4176-2717;", "linkedin": ";;;;", "or_profile": "~Meiliang_Liu1;~Junhao_Huang4;~Yixiao_Wang2;~Zhengye_Si1;~Zhiwen_Zhao2", "aff": "Beijing Normal University;;Beijing Normal University;Beijing Normal University;Beijing Normal University", "aff_domain": "bnu.edu.cn;;bnu.edu.cn;bnu.edu.cn;bnu.edu.cn", "position": "PhD student;;MS student;PhD student;Full Professor", "bibtex": "@misc{\nliu2024gcmixer,\ntitle={{GC}-Mixer: A Novel Architecture for Time-varying Granger Causality Inference},\nauthor={Meiliang Liu and Junhao Huang and Yixiao Wang and Zhengye Si and Zhiwen Zhao},\nyear={2024},\nurl={https://openreview.net/forum?id=52igC7K5Mf}\n}", "github": "", "project": "", "reviewers": "KhHm;1qK9;NC5z;mLYv", "site": "https://openreview.net/forum?id=52igC7K5Mf", "pdf_size": 2936574, "rating": "3;3;5;6", "confidence": "4;4;4;2", "soundness": "3;2;2;3", "contribution": "2;2;2;3", "presentation": "3;2;2;2", "wc_summary": "74;39;61;39", "wc_strengths": "89;25;11;47", "wc_weaknesses": "776;120;154;72", "wc_questions": "9;18;1;484", "wc_review": "948;202;227;642", "wc_reply_reviewers": "289;0;0;371", 
"wc_reply_authors": "935;301;260;1043", "reply_reviewers": "1;0;0;3", "reply_authors": "2;1;1;3", "rating_avg": [ 4.25, 1.299038105676658 ], "confidence_avg": [ 3.5, 0.8660254037844386 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 53.25, 14.972892172189045 ], "wc_strengths_avg": [ 43.0, 29.49576240750525 ], "wc_weaknesses_avg": [ 280.5, 287.5565161842103 ], "wc_questions_avg": [ 128.0, 205.62465805442693 ], "wc_review_avg": [ 504.75, 309.88334498646424 ], "wc_reply_reviewers_avg": [ 165.0, 167.52760966479525 ], "wc_reply_authors_avg": [ 634.75, 356.5966734281182 ], "reply_reviewers_avg": [ 1.0, 1.224744871391589 ], "reply_authors_avg": [ 1.75, 0.82915619758885 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.7777777777777777, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:PWy9XEi2yEsJ:scholar.google.com/&scioq=GC-Mixer:+A+Novel+Architecture+for+Time-varying+Granger+Causality+Inference&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "Beijing Normal University", "aff_unique_dep": "", "aff_unique_url": "https://www.bnu.edu.cn", "aff_unique_abbr": "BNU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "China" }, { "id": "532tcx7IHF", "title": "RLLTE: Long-Term Evolution Project of Reinforcement Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "We present RLLTE: a long-term evolution, extremely modular, and open-source framework for reinforcement learning (RL) research and application. Beyond delivering top-notch algorithm implementations, RLLTE also serves as a toolkit for developing algorithms. More specifically, RLLTE decouples the RL algorithms completely from the exploitation-exploration perspective, providing a large number of prototypes to accelerate algorithm development and evolution. In particular, RLLTE is the first RL framework to build a complete and luxuriant ecosystem, which includes model training, evaluation, deployment, benchmark hub, and large language model (LLM)-empowered copilot. 
RLLTE is expected to set standards for RL engineering practice and be highly stimulative for industry and academia.", "keywords": "reinforcement learning;framework;benchmark;open-source;library;intrinsic reward;data augmentation;copilot;LLM", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Mingqi Yuan;Zequn Zhang;Yang Xu;Jake Shihao Luo;Bo Li;Xin Jin;Wenjun Zeng", "authorids": "~Mingqi_Yuan1;~Zequn_Zhang1;~Yang_Xu18;~Jake_Shihao_Luo1;~Bo_Li27;~Xin_Jin8;~Wenjun_Zeng3", "gender": "M;M;M;M;M;M;M", "homepage": "https://github.com/yuanmingqi;;;https://github.com/ShihaoLuo;https://www4.comp.polyu.edu.hk/~bo2li/;http://home.ustc.edu.cn/~jinxustc/;https://www.eias.ac.cn/h-col-187.html", "dblp": "282/4291;;;;50/3402-37;68/3340-14;57/145", "google_scholar": "https://scholar.google.com.hk/citations?user=xtj9MIMAAAAJ;ElVJU4MAAAAJ;https://scholar.google.com.hk/citations?user=3IpmW68AAAAJ;;;byaSC-kAAAAJ;_cUfvYQAAAAJ", "orcid": ";0000-0001-5566-761X;;;;0000-0002-1820-8358;", "linkedin": ";;;;;;", "or_profile": "~Mingqi_Yuan1;~Zequn_Zhang1;~Yang_Xu18;~Jake_Shihao_Luo1;~Bo_Li27;~Xin_Jin8;~Wenjun_Zeng3", "aff": "The Hong Kong Polytechnic University;University of Science and Technology of China;Purdue University;;The Hong Kong Polytechnic University;Eastern Institute of Technology, Ningbo;Eastern Institute for Advanced Study", "aff_domain": "polyu.edu.hk;ustc.edu.cn;purdue.edu;;polyu.edu.hk;eitech.edu.cn;eias.ac.cn", "position": "PhD student;PhD student;PhD student;;Assistant Professor;Assistant Professor;Full Professor", "bibtex": "@misc{\nyuan2024rllte,\ntitle={{RLLTE}: Long-Term Evolution Project of Reinforcement Learning},\nauthor={Mingqi Yuan and Zequn Zhang and Yang Xu and Jake Shihao Luo and Bo Li and Xin Jin and Wenjun Zeng},\nyear={2024},\nurl={https://openreview.net/forum?id=532tcx7IHF}\n}", "github": "", "project": "", "reviewers": "N3a2;ZtLn;gfMY", "site": "https://openreview.net/forum?id=532tcx7IHF", "pdf_size": 1160382, "rating": "3;5;6", "confidence": "4;4;3", "soundness": "2;3;3", "contribution": "1;2;3", "presentation": "2;2;3", "wc_summary": "34;43;91", "wc_strengths": "34;37;57", "wc_weaknesses": "123;174;49", "wc_questions": "16;36;73", "wc_review": "207;290;270", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 4.666666666666667, 1.247219128924647 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.816496580927726 ], "presentation_avg": [ 2.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 56.0, 25.019992006393608 ], "wc_strengths_avg": [ 42.666666666666664, 10.208928554075703 ], "wc_weaknesses_avg": [ 115.33333333333333, 51.31817958146562 ], "wc_questions_avg": [ 41.666666666666664, 23.612614331233114 ], "wc_review_avg": [ 255.66666666666666, 35.3679076125361 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.7559289460184545, "gs_citation": 4, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=13945585868051426758&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "aff_unique_index": "0;1;2;0;3;4", "aff_unique_norm": "Hong Kong Polytechnic University;University of Science and Technology of China;Purdue University;Eastern Institute of Technology;Eastern Institute for Advanced Study", 
"aff_unique_dep": ";;;;", "aff_unique_url": "https://www.polyu.edu.hk;http://www.ustc.edu.cn;https://www.purdue.edu;https://www.eit.edu.cn;", "aff_unique_abbr": "PolyU;USTC;Purdue;;", "aff_campus_unique_index": "0;0;2", "aff_campus_unique": "Hong Kong SAR;;Ningbo", "aff_country_unique_index": "0;0;1;0;0", "aff_country_unique": "China;United States;" }, { "id": "53gU1BASrd", "title": "Evaluating and Finetuning Models For Financial Time Series Forecasting", "track": "main", "status": "Reject", "tldr": "", "abstract": "Time series forecasting is a challenging task as it is subject to a lot of noise, and the predictions often depend on external events. Still, recent deep learning techniques advanced the state-of-the-art on certain datasets, while they keep failing on other noisy datasets. This paper studies the case of financial time series forecasting, a problem that exhibits both a high noise and many unknown dependencies. We will show that the current evaluation pipelines are imperfect and forget a trivial baseline that can beat most models. We propose a new evaluation pipeline that is better suited for our task, and we run this pipeline on recent models. This pipeline is based on the idea of deciding which assets to buy and sell rather than predicting exact prices. Next, as the small datasets used in current approaches limit the size of the models, we train a general model on a massive dataset (containing a hundred times more data points than existing datasets) and show this model can be finetuned to improve the performance on small datasets. All our code and models will be published to help the community bootstrap and evaluate their future models.", "keywords": "time series forecasting;finance;metrics", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/2775d165775e689a4e0d2dea6ef36c81f3cfd422.zip", "author": "Tom Djaaleb;Julien Romero", "authorids": "~Tom_Djaaleb1;~Julien_Romero1", "gender": "M;M", "homepage": ";https://julienromero.fr", "dblp": ";241/9678", "google_scholar": ";nCgiv6YAAAAJ", "orcid": ";0000-0002-7382-9077", "linkedin": "tom-djaaleb/;romerojulien/", "or_profile": "~Tom_Djaaleb1;~Julien_Romero1", "aff": "Ecole Nationale de la Statistique et de l'Administration Economique;T\u00e9l\u00e9com SudParis", "aff_domain": "ensae.fr;telecom-sudparis.eu", "position": "MS student;Associate Professor", "bibtex": "@misc{\ndjaaleb2024evaluating,\ntitle={Evaluating and Finetuning Models For Financial Time Series Forecasting},\nauthor={Tom Djaaleb and Julien Romero},\nyear={2024},\nurl={https://openreview.net/forum?id=53gU1BASrd}\n}", "github": "", "project": "", "reviewers": "pP2m;BmfC;Zb2D;9z9f", "site": "https://openreview.net/forum?id=53gU1BASrd", "pdf_size": 237796, "rating": "3;5;5;5", "confidence": "3;4;4;3", "soundness": "2;2;3;3", "contribution": "1;2;1;1", "presentation": "2;3;3;2", "wc_summary": "40;59;115;126", "wc_strengths": "39;72;149;32", "wc_weaknesses": "260;65;174;317", "wc_questions": "70;30;91;60", "wc_review": "409;226;529;535", "wc_reply_reviewers": "0;0;0;294", "wc_reply_authors": "1123;538;561;810", "reply_reviewers": "0;0;0;1", "reply_authors": "2;2;2;2", "rating_avg": [ 4.5, 0.8660254037844386 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 1.25, 0.4330127018922193 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 85.0, 36.33868462121325 ], "wc_strengths_avg": [ 73.0, 46.40581860068843 ], "wc_weaknesses_avg": [ 204.0, 
95.03420436874295 ], "wc_questions_avg": [ 62.75, 21.970150204311302 ], "wc_review_avg": [ 424.75, 125.27245307728272 ], "wc_reply_reviewers_avg": [ 73.5, 127.30573435631248 ], "wc_reply_authors_avg": [ 758.0, 236.18742557553736 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 2.0, 0.0 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.5773502691896257, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:Vv05zUyAGaEJ:scholar.google.com/&scioq=Evaluating+and+Finetuning+Models+For+Financial+Time+Series+Forecasting&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1", "aff_unique_norm": "Ecole Nationale de la Statistique et de l'Administration Economique;T\u00e9l\u00e9com SudParis", "aff_unique_dep": ";", "aff_unique_url": "https://ensae.fr;https://www.telecom-sudparis.eu", "aff_unique_abbr": "ENSAE;TSP", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "France" }, { "id": "53kW6e1uNN", "title": "AFDGCF: Adaptive Feature De-correlation Graph Collaborative Filtering for Recommendations", "track": "main", "status": "Reject", "tldr": "", "abstract": "Collaborative filtering methods based on graph neural networks (GNNs) have witnessed significant success in recommender systems (RS), capitalizing on their ability to capture collaborative signals within intricate user-item relationships via message-passing mechanisms. However, these GNN-based RS inadvertently introduce a linear correlation between user and item embeddings, contradicting the goal of providing personalized recommendations. While existing research predominantly ascribes this flaw to the over-smoothing problem, this paper underscores the critical, often overlooked role of the over-correlation issue in diminishing the effectiveness of GNN representations and subsequent recommendation performance. The unclear relationship between over-correlation and over-smoothing in RS, coupled with the challenge of adaptively minimizing the impact of over-correlation while preserving collaborative filtering signals, is quite challenging. To this end, this paper aims to address the aforementioned gap by undertaking a comprehensive study of the over-correlation issue in graph collaborative filtering models. Empirical evidence substantiates the widespread prevalence of over-correlation in these models. Furthermore, a theoretical analysis establishes a pivotal connection between the over-correlation and over-smoothing predicaments. Leveraging these insights, we introduce the Adaptive Feature De-correlation Graph Collaborative Filtering (AFDGCF) Framework, which dynamically applies correlation penalties to the feature dimensions of the representation matrix, effectively alleviating both over-correlation and over-smoothing challenges. 
The efficacy of the proposed framework is corroborated through extensive experiments conducted with four different graph collaborative filtering models across four publicly available datasets, demonstrating the superiority of AFDGCF in enhancing the performance landscape of graph collaborative filtering models.", "keywords": "Collaborative Filtering;Graph Neural Networks;Over-correlation;Over-smoothing", "primary_area": "applications to robotics, autonomy, planning", "supplementary_material": "/attachment/3de2578def7d9ce93546f43854f9f782f7d86eeb.zip", "author": "Wei Wu;Chao Wang;Dazhong Shen;Chuan Qin;Hui Xiong", "authorids": "~Wei_Wu25;~Chao_Wang14;~Dazhong_Shen1;~Chuan_Qin1;~Hui_Xiong1", "gender": "M;M;M;M;M", "homepage": "https://github.com/U-rara;https://chaowang-ustc.github.io/;http://www.shendazhong.com/;https://dylan-qin.github.io;https://www.hkust-gz.edu.cn/people/hui-xiong/", "dblp": "95/6985-45.html;188/7759-86;222/7906;24/2771-2;262/1686-1.html", "google_scholar": ";j08V64UAAAAJ;5vSh09YAAAAJ;0KTz65wAAAAJ;cVDF1tkAAAAJ", "orcid": "0009-0009-1590-601X;0000-0001-7717-447X;0000-0002-3947-4153;0000-0002-5354-8630;0000-0001-6016-6465", "linkedin": ";;;;", "or_profile": "~Wei_Wu25;~Chao_Wang14;~Dazhong_Shen1;~Chuan_Qin1;~Hui_Xiong1", "aff": "University of Science and Technology of China;HKUST Fok Ying Tung Research Institute, The Hong Kong University of Science and Technology\u00a0(Guangzhou);Shanghai Artificial Intelligence Laboratory;BOSS Zhipin;Hong Kong University of Science and Technology (Guangzhou)", "aff_domain": "ustc.edu.cn;ust.hk;pjlab.org.cn;kanzhun.com;hkust.edu", "position": "PhD student;Postdoc;Researcher;Senior Researcher;Full Professor", "bibtex": "@misc{\nwu2024afdgcf,\ntitle={{AFDGCF}: Adaptive Feature De-correlation Graph Collaborative Filtering for Recommendations},\nauthor={Wei Wu and Chao Wang and Dazhong Shen and Chuan Qin and Hui Xiong},\nyear={2024},\nurl={https://openreview.net/forum?id=53kW6e1uNN}\n}", "github": "", "project": "", "reviewers": "vpbW;HBXd;TKXS;Xkxj", "site": "https://openreview.net/forum?id=53kW6e1uNN", "pdf_size": 6094555, "rating": "5;5;8;8", "confidence": "4;4;5;5", "soundness": "3;3;4;3", "contribution": "2;2;3;3", "presentation": "2;3;4;4", "wc_summary": "73;81;157;210", "wc_strengths": "57;52;87;56", "wc_weaknesses": "228;163;76;37", "wc_questions": "4;71;15;165", "wc_review": "362;367;335;468", "wc_reply_reviewers": "206;60;37;78", "wc_reply_authors": "859;485;507;574", "reply_reviewers": "1;1;1;1", "reply_authors": "2;1;1;1", "rating_avg": [ 6.5, 1.5 ], "confidence_avg": [ 4.5, 0.5 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.25, 0.82915619758885 ], "wc_summary_avg": [ 130.25, 56.52156668033893 ], "wc_strengths_avg": [ 63.0, 13.982131454109563 ], "wc_weaknesses_avg": [ 126.0, 74.48825410761081 ], "wc_questions_avg": [ 63.75, 63.73921477395215 ], "wc_review_avg": [ 383.0, 50.5618433208284 ], "wc_reply_reviewers_avg": [ 95.25, 65.57200240956502 ], "wc_reply_authors_avg": [ 606.25, 149.56165116767065 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 1.0, "gs_citation": 15, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14752669949639676240&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 5, "aff_unique_index": "0;1;2;3;1", "aff_unique_norm": "University of Science and Technology of China;Hong Kong University of Science and Technology;Shanghai 
Artificial Intelligence Laboratory;BOSS Zhipin", "aff_unique_dep": ";Fok Ying Tung Research Institute;;", "aff_unique_url": "http://www.ustc.edu.cn;https://www.ust.hk;http://www.shailab.org/;https://www.zhipin.com", "aff_unique_abbr": "USTC;HKUST;Shanghai AI Lab;BOSS\u76f4\u8058", "aff_campus_unique_index": "1;2", "aff_campus_unique": ";Guangzhou;Hong Kong SAR", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "China" }, { "id": "5451cIQdWp", "title": "On Synthetic Data and Iterative Magnitude Pruning: a Linear Mode Connectivity Study", "track": "main", "status": "Reject", "tldr": "", "abstract": "Recent works have shown that distilled data representations can be leveraged for accelerating the training of DNNs. However, to date, very little is understood about the effect of these synthetic data representations in the area of architectural optimization, specifically with Iterative Magnitude Pruning (IMP) and pruning at initialization. We push the boundaries of pruning with distilled data, matching the performance of traditional IMP on ResNet-18 \\& CIFAR-10 while using 150x less training points to find a sparsity mask. We find that distilled data guides IMP to discard parameters contributing to the sharpness of the loss landscape, fostering smoother landscapes. These synthetic subnetworks are stable to SGD noise at initialization in settings when the dense model or subnetworks found with standard IMP are not, such as ResNet-10 on ImageNet-10. In other words, training from initialization across different shuffling of data will result in linear mode connectivity, a phenomenon which rarely happens without some pretraining. We visualize these loss landscapes and quantitatively measure sharpness through hessian approximations to understand these effects. This behavior is heavily linked to the compressed representation of the data, highlighting the importance of synthetic data in neural architectural validation. 
In order to find both a high performing and robust sparse architecture, a more optimal synthetic data representation is needed that can compress irrelevant noise like distilled data, yet better maintain task-specific information from the real data as dataset complexity increases.", "keywords": "Neural Network Pruning;Linear Mode Connectivity;Dataset Distillation;Sparse Neural Networks", "primary_area": "visualization or interpretation of learned representations", "supplementary_material": "", "author": "Luke McDermott;Daniel Cummings", "authorids": "~Luke_McDermott2;~Daniel_Cummings2", "gender": "M;", "homepage": "https://lukemcdermotttt.github.io/;", "dblp": ";", "google_scholar": "l_z4cj0AAAAJ;", "orcid": ";", "linkedin": "lukemcdermott;", "or_profile": "~Luke_McDermott2;~Daniel_Cummings2", "aff": "Modern Intelligence;", "aff_domain": "modernintelligence.ai;", "position": "Researcher;", "bibtex": "@misc{\nmcdermott2024on,\ntitle={On Synthetic Data and Iterative Magnitude Pruning: a Linear Mode Connectivity Study},\nauthor={Luke McDermott and Daniel Cummings},\nyear={2024},\nurl={https://openreview.net/forum?id=5451cIQdWp}\n}", "github": "", "project": "", "reviewers": "rRcD;6HLj;mHnL;qh7B", "site": "https://openreview.net/forum?id=5451cIQdWp", "pdf_size": 2297302, "rating": "3;5;5;6", "confidence": "5;3;3;3", "soundness": "2;3;2;3", "contribution": "1;2;2;3", "presentation": "1;1;2;2", "wc_summary": "88;56;70;79", "wc_strengths": "47;42;24;75", "wc_weaknesses": "404;228;344;157", "wc_questions": "39;37;2;36", "wc_review": "578;363;440;347", "wc_reply_reviewers": "186;0;61;0", "wc_reply_authors": "813;411;776;521", "reply_reviewers": "1;0;1;0", "reply_authors": "1;1;1;1", "rating_avg": [ 4.75, 1.0897247358851685 ], "confidence_avg": [ 3.5, 0.8660254037844386 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 1.5, 0.5 ], "wc_summary_avg": [ 73.25, 11.818946653572814 ], "wc_strengths_avg": [ 47.0, 18.289341158171883 ], "wc_weaknesses_avg": [ 283.25, 96.51780923746664 ], "wc_questions_avg": [ 28.5, 15.337861650177967 ], "wc_review_avg": [ 432.0, 91.3318126394084 ], "wc_reply_reviewers_avg": [ 61.75, 75.93541663808791 ], "wc_reply_authors_avg": [ 630.25, 169.29762993025037 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.9271726499455306, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:vgEn7HRo_i0J:scholar.google.com/&scioq=On+Synthetic+Data+and+Iterative+Magnitude+Pruning:+a+Linear+Mode+Connectivity+Study&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0", "aff_unique_norm": "Modern Intelligence", "aff_unique_dep": "", "aff_unique_url": "", "aff_unique_abbr": "" }, { "id": "54AwQUaDZo", "title": "Bounding the Robustness and Generalization for Individual Treatment Effect", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Individual treatment effect (ITE) estimation has important applications in fields such as healthcare, economics and education, hence attracted increasing attention from both research and industrial community. However, most existing models may not perform well in practice due to the lack of robustness of the ITE estimation predicted by deep neural networks when an imperceptible perturbation has been added to the covariate. 
To alleviate this problem, in this paper, we first derive an informative generalization bound that demonstrate the expected ITE estimation error is bounded by one of the most important term, the Lipschitz constant of ITE model. In addition, in order to use Integral Probability Metrics (IPM) to measure distances between distributions, we also obtain explicit bounds for the Wasserstein (WASS) and Maximum Mean Discrepancy (MMD) distances. More specifically, we propose two types of regularizations called Lipschitz Regularization and reproducing kernel Hilbert space (RKHS) Regularization for encouraging robustness in estimating ITE from observational data. Extensive experiments on both synthetic examples and standard benchmarks demonstrate our framework\u2019s effectiveness and generality. To benefit this research direction, we release our project at https://github-rite.github.io/rite/.", "keywords": "Individual Treatment Effect;Causal inference", "primary_area": "causal reasoning", "supplementary_material": "", "author": "Zhenlei Wang;Xu Chen;Xiaoxiao Xu;Lantao Hu;Peng Jiang;Kun Gai", "authorids": "~Zhenlei_Wang1;~Xu_Chen13;~Xiaoxiao_Xu2;~Lantao_Hu1;~Peng_Jiang6;~Kun_Gai1", "gender": "M;M;F;M;M;M", "homepage": "https://causal-rec.github.io/;https://gsai.ruc.edu.cn/chenxu;https://scholar.google.com/citations?hl=zh-CN&user=1I2OrQEAAAAJ&view_op=list_works&sortby=pubdate;;;", "dblp": "223/8301;83/6331-17;116/1526;;;59/2902", "google_scholar": "7x0kGsUAAAAJ;loPoqy0AAAAJ;https://scholar.google.com/citations?hl=zh-CN;P0EK1y8AAAAJ;https://scholar.google.com/citations?hl=en;PXO4ygEAAAAJ", "orcid": ";0000-0003-0144-1775;0009-0007-5493-5628;;0000-0002-9266-0780;", "linkedin": ";;;;;", "or_profile": "~Zhenlei_Wang1;~Xu_Chen13;~Xiaoxiao_Xu2;~Lantao_Hu1;~Peng_Jiang6;~Kun_Gai1", "aff": "Renmin University of China;Renmin University of China;Kuaishou Technology;;Kuaishou Technology;Kuaishou- \u5feb\u624b\u79d1\u6280", "aff_domain": "ruc.edu.cn;ruc.edu.cn;kuaishou.com;;kuaishou.com;kuaishou.com", "position": "PhD student;Associate Professor;Engineer;;Vice President;Instructor", "bibtex": "@misc{\nanonymous2024bounding,\ntitle={Bounding the Robustness and Generalization for Individual Treatment Effect},\nauthor={Anonymous},\nyear={2024},\nurl={https://openreview.net/forum?id=54AwQUaDZo}\n}", "github": "", "project": "", "reviewers": "FvrM;nExb;UoGx;WUez", "site": "https://openreview.net/forum?id=54AwQUaDZo", "pdf_size": 1120565, "rating": "3;5;5;5", "confidence": "3;3;4;3", "soundness": "2;3;1;2", "contribution": "2;2;3;1", "presentation": "2;3;2;2", "wc_summary": "86;117;179;119", "wc_strengths": "76;58;106;55", "wc_weaknesses": "66;192;432;375", "wc_questions": "52;2;102;54", "wc_review": "280;369;819;603", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.5, 0.8660254037844386 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 2.0, 0.7071067811865476 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 125.25, 33.677700337166726 ], "wc_strengths_avg": [ 73.75, 20.27775875189366 ], "wc_weaknesses_avg": [ 266.25, 145.69896190433204 ], "wc_questions_avg": [ 52.5, 35.36594407053204 ], "wc_review_avg": [ 517.75, 210.16109892175572 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 6, 0 ], 
"corr_rating_confidence": 0.3333333333333333, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:V_yve7ojoRIJ:scholar.google.com/&scioq=Bounding+the+Robustness+and+Generalization+for+Individual+Treatment+Effect&hl=en&as_sdt=0,23", "gs_version_total": 0, "aff_unique_index": "0;0;1;1;1", "aff_unique_norm": "Renmin University of China;Kuaishou Technology", "aff_unique_dep": ";", "aff_unique_url": "http://www.ruc.edu.cn;https://www.kuaishou.com", "aff_unique_abbr": "RUC;Kuaishou", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "China" }, { "title": "Towards Identifiable Unsupervised Domain Translation: A Diversified Distribution Matching Approach", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19440", "id": "55uj7mU7Cv", "author_site": "Sagar Shrestha, Xiao Fu", "tldr": "", "abstract": "Unsupervised domain translation (UDT) aims to find functions that convert samples from one domain (e.g., sketches) to another domain (e.g., photos) without changing the high-level semantic meaning (also referred to as \"content\"). The translation functions are often sought by probability distribution matching of the transformed source domain and target domain. CycleGAN stands as arguably the most representative approach among this line of work. However, it was noticed in the literature that CycleGAN and variants could fail to identify the desired translation functions and produce content-misaligned translations.\nThis limitation arises due to the presence of multiple translation functions---referred to as ``measure-preserving automorphism\" (MPA)---in the solution space of the learning criteria. Despite awareness of such identifiability issues, solutions have remained elusive. This study delves into the core identifiability inquiry and introduces an MPA elimination theory. Our analysis shows that MPA is unlikely to exist, if multiple pairs of diverse cross-domain conditional distributions are matched by the learning function.\nOur theory leads to a UDT learner using distribution matching over auxiliary variable-induced subsets of the domains---other than over the entire data domains as in the classical approaches. 
The proposed framework is the first to rigorously establish translation identifiability under reasonable UDT settings, to our best knowledge.\nExperiments corroborate with our theoretical claims.", "keywords": "unsupervised domain translation;translation identifiability;distribution matching;unpaired image to image translation", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/bba6017fc2dc8543fc915d43386eaa33f05f7b0a.zip", "author": "Sagar Shrestha;Xiao Fu", "authorids": "~Sagar_Shrestha1;~Xiao_Fu1", "gender": "M;M", "homepage": ";https://web.engr.oregonstate.edu/~fuxia/", "dblp": "292/3689;60/4601-1", "google_scholar": "qIBTvlAAAAAJ;pDnpH1MAAAAJ", "orcid": ";", "linkedin": ";", "or_profile": "~Sagar_Shrestha1;~Xiao_Fu1", "aff": "Oregon State University;Oregon State University", "aff_domain": "oregonstate.edu;oregonstate.edu", "position": "PhD student;Associate Professor", "bibtex": "@inproceedings{\nshrestha2024towards,\ntitle={Towards Identifiable Unsupervised Domain Translation: A Diversified Distribution Matching Approach},\nauthor={Sagar Shrestha and Xiao Fu},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=55uj7mU7Cv}\n}", "github": "", "project": "", "reviewers": "4LhS;rKLC;bENZ;siTh", "pdf_size": 38400638, "rating": "5;6;6;8", "confidence": "4;5;4;4", "soundness": "3;3;3;3", "contribution": "2;2;3;3", "presentation": "3;3;3;4", "wc_summary": "39;107;54;90", "wc_strengths": "52;51;174;59", "wc_weaknesses": "58;180;107;33", "wc_questions": "312;60;68;106", "wc_review": "461;398;403;288", "wc_reply_reviewers": "0;38;11;38", "wc_reply_authors": "3117;1083;427;1575", "reply_reviewers": "0;1;1;1", "reply_authors": "5;2;1;3", "rating_avg": [ 6.25, 1.0897247358851685 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 72.5, 27.207535720825582 ], "wc_strengths_avg": [ 84.0, 52.052857750559674 ], "wc_weaknesses_avg": [ 94.5, 56.082528473669946 ], "wc_questions_avg": [ 136.5, 102.80442597476045 ], "wc_review_avg": [ 387.5, 62.5559749344537 ], "wc_reply_reviewers_avg": [ 21.75, 16.708904811506947 ], "wc_reply_authors_avg": [ 1550.5, 991.8834356919164 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 2.75, 1.479019945774904 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.13245323570650439, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5429720305334156891&as_sdt=40005&sciodt=0,10&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=55uj7mU7Cv", "pdf": "https://openreview.net/pdf?id=55uj7mU7Cv", "email": "oregonstate.edu;oregonstate.edu", "author_num": 2, "aff_unique_index": "0;0", "aff_unique_norm": "Oregon State University", "aff_unique_dep": "", "aff_unique_url": "https://oregonstate.edu", "aff_unique_abbr": "OSU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "title": "How to Catch an AI Liar: Lie Detection in Black-Box LLMs by Asking Unrelated Questions", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19439", "id": "567BjxgaTp", "author_site": "Lorenzo Pacchiardi, Alex Chan, S\u00f6ren Mindermann, Ilan Moscovitz, Alexa Pan, Yarin Gal, Owain 
Evans, Jan Brauner", "tldr": "", "abstract": "Large language models (LLMs) can \u201clie\u201d, which we define as outputting false statements when incentivised to, despite \u201cknowing\u201d the truth in a demonstrable sense. LLMs might \u201clie\u201d, for example, when instructed to output misinformation. Here, we develop a simple lie detector that requires neither access to the LLM\u2019s activations (black-box) nor ground-truth knowledge of the fact in question. The detector works by asking a predefined set of unrelated follow-up questions after a suspected lie, and feeding the LLM\u2019s yes/no answers into a logistic regression classifier. Despite its simplicity, this lie detector is highly accurate and surprisingly general. When trained on examples from a single setting\u2014prompting GPT-3.5 to lie about factual questions\u2014the detector generalises out-of-distribution to (1) other LLM architectures, (2) LLMs fine-tuned to lie, (3) sycophantic lies, and (4) lies emerging in real-life scenarios such as sales. These results indicate that LLMs have distinctive lie-related behavioural patterns, consistent across architectures and contexts, which could enable general-purpose lie detection.", "keywords": "language models;lying;deception;alignment;safety;truthfulness;honesty", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/3b63a2c68f1a0b002920ca2526f715d3513508c9.pdf", "author": "Lorenzo Pacchiardi;Alex James Chan;S\u00f6ren Mindermann;Ilan Moscovitz;Alexa Yue Pan;Yarin Gal;Owain Evans;Jan M. Brauner", "authorids": "~Lorenzo_Pacchiardi1;~Alex_James_Chan1;~S\u00f6ren_Mindermann1;~Ilan_Moscovitz1;~Alexa_Yue_Pan1;~Yarin_Gal1;~Owain_Evans1;~Jan_M._Brauner1", "gender": "M;M;M;M;F;;;M", "homepage": "http://lorenzopacchiardi.me/;https://alexjchan.com;https://www.soren-mindermann.com/;;;http://www.cs.ox.ac.uk/people/yarin.gal/website//;https://owainevans.github.io/;", "dblp": "308/9068;268/6948;211/7976;;;67/9076;52/10432;271/0265", "google_scholar": "9EAb0uEAAAAJ;yfy_BGIAAAAJ;slBPlrQAAAAJ;;;https://scholar.google.co.uk/citations?user=SIayDoQAAAAJ;4VpTwzIAAAAJ;https://scholar.google.de/citations?user=tNZUnjcAAAAJ", "orcid": "0000-0003-4760-7638;;0000-0002-0315-9821;;;;;0000-0002-1588-5724", "linkedin": ";alex-chan-040081131/;;ilan-moscovitz/;alexa-pan-5678ab163/;;;", "or_profile": "~Lorenzo_Pacchiardi1;~Alex_James_Chan1;~S\u00f6ren_Mindermann1;~Ilan_Moscovitz1;~Alexa_Yue_Pan1;~Yarin_Gal1;~Owain_Evans1;~Jan_M._Brauner1", "aff": "University of Cambridge;Spotify;Mila - Quebec Artificial Intelligence Institute;Independent;Yale University;University of Oxford;Truthful AI;University of Oxford", "aff_domain": "cam.ac.uk;spotify.com;mila.quebec;openreview.net;yale.edu;ox.ac.uk;owainevans.com;ox.ac.uk", "position": "Postdoc;Researcher;Postdoc;Researcher;Undergrad student;Associate Professor;Principal Researcher;PhD student", "bibtex": "@inproceedings{\npacchiardi2024how,\ntitle={How to Catch an {AI} Liar: Lie Detection in Black-Box {LLM}s by Asking Unrelated Questions},\nauthor={Lorenzo Pacchiardi and Alex James Chan and S{\\\"o}ren Mindermann and Ilan Moscovitz and Alexa Yue Pan and Yarin Gal and Owain Evans and Jan M. 
Brauner},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=567BjxgaTp}\n}", "github": "", "project": "", "reviewers": "eJWS;fhKw;cT55;Y6rc", "pdf_size": 3769151, "rating": "5;6;8;8", "confidence": "3;3;4;4", "soundness": "3;3;3;4", "contribution": "2;3;3;4", "presentation": "1;2;2;3", "wc_summary": "377;122;70;120", "wc_strengths": "2;214;222;67", "wc_weaknesses": "2;88;329;18", "wc_questions": "2;27;64;68", "wc_review": "383;451;685;273", "wc_reply_reviewers": "40;4;122;0", "wc_reply_authors": "1618;735;1205;386", "reply_reviewers": "1;1;2;0", "reply_authors": "4;2;2;1", "rating_avg": [ 6.75, 1.299038105676658 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 3.0, 0.7071067811865476 ], "presentation_avg": [ 2.0, 0.7071067811865476 ], "wc_summary_avg": [ 172.25, 120.03410973552477 ], "wc_strengths_avg": [ 126.25, 94.62656867920342 ], "wc_weaknesses_avg": [ 109.25, 130.93008630563108 ], "wc_questions_avg": [ 40.25, 27.261465477849864 ], "wc_review_avg": [ 448.0, 150.8542342793201 ], "wc_reply_reviewers_avg": [ 41.5, 49.01785389018985 ], "wc_reply_authors_avg": [ 986.0, 466.4724000409885 ], "reply_reviewers_avg": [ 1.0, 0.7071067811865476 ], "reply_authors_avg": [ 2.25, 1.0897247358851685 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": 0.9622504486493761, "gs_citation": 59, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=4094771018704741638&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=567BjxgaTp", "pdf": "https://openreview.net/pdf?id=567BjxgaTp", "email": "cam.ac.uk;spotify.com;mila.quebec;openreview.net;yale.edu;ox.ac.uk;owainevans.com;ox.ac.uk", "author_num": 8, "aff_unique_index": "0;1;2;3;4;5;6;5", "aff_unique_norm": "University of Cambridge;Spotify;Quebec Artificial Intelligence Institute;Independent;Yale University;University of Oxford;Truthful AI", "aff_unique_dep": ";;Artificial Intelligence;;;;", "aff_unique_url": "https://www.cam.ac.uk;https://www.spotify.com;https://mila.quebec;;https://www.yale.edu;https://www.ox.ac.uk;", "aff_unique_abbr": "Cambridge;Spotify;Mila;;Yale;Oxford;", "aff_campus_unique_index": "0", "aff_campus_unique": "Cambridge;", "aff_country_unique_index": "0;1;2;4;0;0", "aff_country_unique": "United Kingdom;Sweden;Canada;;United States" }, { "id": "56jIlazr6a", "title": "Unified Uncertainty Estimation", "track": "main", "status": "Reject", "tldr": "", "abstract": "In order to build robust, fair, and safe AI systems, we would like our classifiers to recognize and say \u201cI don\u2019t know\u201d when facing test examples that do not belong to any of the in-domain classes observed during training. Perhaps surprisingly, the ubiquitous strategy to predict under uncertainty is the simplistic reject-or-classify rule: abstain from prediction if epistemic uncertainty is high, classify otherwise. We argue that this recipe has several problems: it does not allow different sources of uncertainty to communicate with each other, produces miscalibrated predictions, and it does not allow to correct for misspecifications in our uncertainty estimates. To address these issues, we introduce unified uncertainty calibration (U2C), a framework for the unified, non-linear calibration of aleatoric and epistemic uncertainties. 
Unified uncertainty calibration enables a clean analysis of uncertainty estimation via learning theory, and significantly outperforms reject-or-classify across a variety of standard benchmarks.", "keywords": "uncertainty estimation;calibration;epistemic;aleatoric", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/cc2447edc90f7aa164e8dd60dd601d1be54d499b.zip", "author": "Kamalika Chaudhuri;David Lopez-Paz", "authorids": "~Kamalika_Chaudhuri1;~David_Lopez-Paz2", "gender": "F;", "homepage": "http://cseweb.ucsd.edu/users/kamalika;http://lopezpaz.org", "dblp": "56/6435;74/10481", "google_scholar": "I-DJ7EsAAAAJ;", "orcid": ";", "linkedin": ";", "or_profile": "~Kamalika_Chaudhuri1;~David_Lopez-Paz2", "aff": "University of California, San Diego;Meta Facebook", "aff_domain": "ucsd.edu;fb.com", "position": "Associate Professor;Research Scientist", "bibtex": "@misc{\nchaudhuri2024unified,\ntitle={Unified Uncertainty Estimation},\nauthor={Kamalika Chaudhuri and David Lopez-Paz},\nyear={2024},\nurl={https://openreview.net/forum?id=56jIlazr6a}\n}", "github": "", "project": "", "reviewers": "WQhb;LfhH;Pdw3;3np5", "site": "https://openreview.net/forum?id=56jIlazr6a", "pdf_size": 1719767, "rating": "3;5;5;8", "confidence": "4;3;4;4", "soundness": "1;3;3;3", "contribution": "2;2;3;3", "presentation": "1;3;4;3", "wc_summary": "60;135;152;118", "wc_strengths": "33;86;56;97", "wc_weaknesses": "439;201;23;209", "wc_questions": "51;4;103;5", "wc_review": "583;426;334;429", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "179;148;110;118", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 5.25, 1.7853571071357126 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.8660254037844386 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.75, 1.0897247358851685 ], "wc_summary_avg": [ 116.25, 34.629286738250904 ], "wc_strengths_avg": [ 68.0, 25.16942589730644 ], "wc_weaknesses_avg": [ 218.0, 147.6787053031005 ], "wc_questions_avg": [ 40.75, 40.64710936831794 ], "wc_review_avg": [ 443.0, 89.39519002720448 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 138.75, 27.215574585152524 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 10, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.08084520834544431, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:VIZBaUc9khQJ:scholar.google.com/&scioq=Unified+Uncertainty+Estimation&hl=en&as_sdt=0,44", "gs_version_total": 0, "aff_unique_index": "0;1", "aff_unique_norm": "University of California, San Diego;Meta", "aff_unique_dep": ";Meta Platforms, Inc.", "aff_unique_url": "https://www.ucsd.edu;https://meta.com", "aff_unique_abbr": "UCSD;Meta", "aff_campus_unique_index": "0", "aff_campus_unique": "San Diego;", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "id": "56l30xVDW7", "title": "Semantic Attribution For Explainable Uncertainty Quantification", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Bayesian deep learning, with an emphasis on uncertainty quantification, is receiving growing interest in building reliable models. Nonetheless, interpreting and explaining the origins and reasons for uncertainty presents a significant challenge. In this paper, we present semantic uncertainty attribution as a tool for pinpointing the primary factors contributing to uncertainty. 
This approach allows us to explain why a particular image carries high uncertainty, thereby making our models more interpretable. Specifically, we utilize the variational autoencoder to disentangle different semantic factors within the latent space and link the uncertainty to corresponding semantic factors for an explanation. The proposed techniques can also enhance explainable out-of-distribution (OOD) detection. We can not only identify OOD samples via their uncertainty, but also provide reasoning rooted in a semantic concept.", "keywords": "Uncertainty Quantification;Model Explanability", "primary_area": "probabilistic methods (Bayesian methods, variational inference, sampling, UQ, etc.)", "supplementary_material": "", "author": "Hanjing Wang;Shiqiang Wang;Qiang Ji", "authorids": "~Hanjing_Wang2;~Shiqiang_Wang1;~Qiang_Ji1", "gender": "M;M;M", "homepage": "https://www.ecse.rpi.edu/~cvrl/people_zw.html;https://shiqiang.wang;https://www.ecse.rpi.edu/~qji/", "dblp": "234/8752;87/5094-1;", "google_scholar": ";kA_vmOcAAAAJ;vAXmpVIAAAAJ", "orcid": ";;", "linkedin": ";;", "or_profile": "~Hanjing_Wang2;~Shiqiang_Wang1;~Qiang_Ji1", "aff": "Rensselaer Polytechnic Institute;IBM, International Business Machines;Rensselaer Polytechnic Institute", "aff_domain": "rpi.edu;us.ibm.com;rpi.edu", "position": "PhD student;Research Staff Member;Professor", "bibtex": "@misc{\nwang2024semantic,\ntitle={Semantic Attribution For Explainable Uncertainty Quantification},\nauthor={Hanjing Wang and Shiqiang Wang and Qiang Ji},\nyear={2024},\nurl={https://openreview.net/forum?id=56l30xVDW7}\n}", "github": "", "project": "", "reviewers": "", "site": "https://openreview.net/forum?id=56l30xVDW7", "pdf_size": 0, "rating": "", "confidence": "", "soundness": "", "contribution": "", "presentation": "", "wc_summary": "", "wc_strengths": "", "wc_weaknesses": "", "wc_questions": "", "wc_review": "", "wc_reply_reviewers": "", "wc_reply_authors": "", "reply_reviewers": "", "reply_authors": "", "rating_avg": [ 0, 0 ], "confidence_avg": [ 0, 0 ], "soundness_avg": [ 0, 0 ], "contribution_avg": [ 0, 0 ], "presentation_avg": [ 0, 0 ], "wc_summary_avg": [ 0, 0 ], "wc_strengths_avg": [ 0, 0 ], "wc_weaknesses_avg": [ 0, 0 ], "wc_questions_avg": [ 0, 0 ], "wc_review_avg": [ 0, 0 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 0, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=16783044059365412257&as_sdt=4005&sciodt=0,6&hl=en", "gs_version_total": 5, "aff_unique_index": "0;1;0", "aff_unique_norm": "Rensselaer Polytechnic Institute;International Business Machines", "aff_unique_dep": ";", "aff_unique_url": "https://www.rpi.edu;https://www.ibm.com", "aff_unique_abbr": "RPI;IBM", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "59nCKifDtm", "title": "Improve Temporal Consistency In Diffusion Models through Noise Correlations", "track": "main", "status": "Reject", "tldr": "", "abstract": "Diffusion models have emerged as a powerful tool for generating diverse types of data, including sequential data such as audio, video, and motion. 
As the temporal consistency in sequential data is crucial for maintaining fidelity and realism, this paper introduce the AutoRegressive Temporal diffusion (ARTDiff) approach to address the challenge of temporal consistency in diffusion models. ARTDiff offers a straightforward and efficient solution that requires minimal computational overhead. Our proposed ARTDiff method leverages the inherent autoregressive dependence structure in time by introducing a Gaussian noise distribution whose correlations between time frames have a functional form in terms of time difference. This design explicitly captures the temporal dependencies and enhances the consistency in generated sequences. We evaluate the effectiveness of ARTDiff on audio and motion generation tasks. Experimental results demonstrate that ARTDiff significantly improves the fidelity and realism of generated samples compared to baseline diffusion models. The simplicity and efficiency of ARTDiff make it a practical choice for incorporating temporal consistency in diffusion-based generation models.", "keywords": "diffusion model;temporal consistency;sequential data generation", "primary_area": "generative models", "supplementary_material": "", "author": "Kexin Lu;Yuxi CAI;Lan Li;Dafei Qin;Guodong Li", "authorids": "~Kexin_Lu1;~Yuxi_CAI1;~Lan_Li4;~Dafei_Qin1;~Guodong_Li1", "gender": ";;F;M;M", "homepage": "https://github.com/neithen-Lu;;;https://dafei-qin.github.io/;https://saasweb.hku.hk/staff/gdli/", "dblp": ";;;347/3368;", "google_scholar": ";;;https://scholar.google.com/citations?hl=en;whNuLsEAAAAJ", "orcid": ";0000-0003-4065-1193;0009-0005-4711-9740;0009-0001-4992-4760;", "linkedin": ";;;dafei-qin-134151292;", "or_profile": "~Kexin_Lu1;~Yuxi_CAI1;~Lan_Li4;~Dafei_Qin1;~Guodong_Li1", "aff": "University of Hong Kong;University of Hong Kong;University of Hong Kong;University of Hong Kong;The University of Hong Kong", "aff_domain": "hku.hk;hku.hk;hku.hk;hku.hk;hku.hk", "position": "PhD student;PhD student;PhD student;PhD student;Professor", "bibtex": "@misc{\nlu2024improve,\ntitle={Improve Temporal Consistency In Diffusion Models through Noise Correlations},\nauthor={Kexin Lu and Yuxi CAI and Lan Li and Dafei Qin and Guodong Li},\nyear={2024},\nurl={https://openreview.net/forum?id=59nCKifDtm}\n}", "github": "", "project": "", "reviewers": "zRzD;jkr1;uW7w;kucM", "site": "https://openreview.net/forum?id=59nCKifDtm", "pdf_size": 2453954, "rating": "6;6;6;6", "confidence": "4;4;3;3", "soundness": "3;3;3;2", "contribution": "3;3;3;2", "presentation": "3;3;3;3", "wc_summary": "39;63;95;65", "wc_strengths": "34;43;28;43", "wc_weaknesses": "161;44;91;32", "wc_questions": "50;3;4;42", "wc_review": "284;153;218;182", "wc_reply_reviewers": "29;29;14;0", "wc_reply_authors": "2069;1248;2200;772", "reply_reviewers": "1;1;1;0", "reply_authors": "6;4;6;3", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 65.5, 19.868316486305527 ], "wc_strengths_avg": [ 37.0, 6.363961030678928 ], "wc_weaknesses_avg": [ 82.0, 50.66063560596136 ], "wc_questions_avg": [ 24.75, 21.44032415799724 ], "wc_review_avg": [ 209.25, 48.91510502901941 ], "wc_reply_reviewers_avg": [ 18.0, 12.062338081814818 ], "wc_reply_authors_avg": [ 1572.25, 588.7208060702459 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 4.75, 1.299038105676658 ], "replies_avg": [ 28, 0 ], "authors#_avg": [ 5, 0 ], 
"corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:h-qXsHj7ayAJ:scholar.google.com/&scioq=Improve+Temporal+Consistency+In+Diffusion+Models+through+Noise+Correlations&hl=en&as_sdt=0,14", "gs_version_total": 0, "aff_unique_index": "0;0;0;0;0", "aff_unique_norm": "University of Hong Kong", "aff_unique_dep": "", "aff_unique_url": "https://www.hku.hk", "aff_unique_abbr": "HKU", "aff_campus_unique_index": "0;0;0;0;0", "aff_campus_unique": "Hong Kong SAR", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "China" }, { "id": "5AbtYdHlr3", "title": "Stochastic Safe Action Model Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "Hand-crafting models of interactive domains is challenging, especially when the dynamics of the domain are stochastic. Therefore, it's useful to be able to automatically learn such models instead. In this work, we propose an algorithm to learn stochastic planning models where the distribution over the sets of effects for each action has a small support, but the sets may set values to an arbitrary number of state attributes (a.k.a. fluents). This class captures the benchmark domains used in stochastic planning, in contrast to the prior work that assumed independence of the effects on individual fluents. Our algorithm has polynomial time and sample complexity when the size of the support is bounded by a constant. Importantly, our learning is safe in that we learn offline from example trajectories and we guarantee that actions are only permitted in states where our model of the dynamics is guaranteed to be accurate. Moreover, we guarantee approximate completeness of the model, in the sense that if the examples are achieving goals from some distribution, then with high probability there will exist plans in our learned model that achieve goals from the same distribution.", "keywords": "offline learning;planning;action model learning;method of moments", "primary_area": "applications to robotics, autonomy, planning", "supplementary_material": "", "author": "Zihao Deng;Brendan Juba", "authorids": "~Zihao_Deng1;~Brendan_Juba1", "gender": ";M", "homepage": ";http://www.cse.wustl.edu/~bjuba/", "dblp": "188/6173;62/6079", "google_scholar": ";https://scholar.google.com.tw/citations?user=5wppdUoAAAAJ", "orcid": ";", "linkedin": ";", "or_profile": "~Zihao_Deng1;~Brendan_Juba1", "aff": "Washington University, St. Louis;Washington University in St. 
Louis", "aff_domain": "wustl.edu;cse.wustl.edu", "position": "PhD student;Associate Professor", "bibtex": "@misc{\ndeng2024stochastic,\ntitle={Stochastic Safe Action Model Learning},\nauthor={Zihao Deng and Brendan Juba},\nyear={2024},\nurl={https://openreview.net/forum?id=5AbtYdHlr3}\n}", "github": "", "project": "", "reviewers": "Ksk7;cva7;YR2D;bFXN", "site": "https://openreview.net/forum?id=5AbtYdHlr3", "pdf_size": 280752, "rating": "3;3;3;3", "confidence": "3;3;4;2", "soundness": "2;3;2;3", "contribution": "2;2;2;2", "presentation": "1;2;1;1", "wc_summary": "42;166;95;134", "wc_strengths": "12;26;16;26", "wc_weaknesses": "114;93;295;154", "wc_questions": "34;130;64;80", "wc_review": "202;415;470;394", "wc_reply_reviewers": "0;44;194;133", "wc_reply_authors": "123;180;619;395", "reply_reviewers": "0;1;1;1", "reply_authors": "1;1;2;2", "rating_avg": [ 3.0, 0.0 ], "confidence_avg": [ 3.0, 0.7071067811865476 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 1.25, 0.4330127018922193 ], "wc_summary_avg": [ 109.25, 46.25675626327467 ], "wc_strengths_avg": [ 20.0, 6.164414002968976 ], "wc_weaknesses_avg": [ 164.0, 78.74325367928354 ], "wc_questions_avg": [ 77.0, 34.77067730142742 ], "wc_review_avg": [ 370.25, 101.02567742905761 ], "wc_reply_reviewers_avg": [ 92.75, 75.58232266872989 ], "wc_reply_authors_avg": [ 329.25, 195.63534317704458 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5267497173215605354&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 2, "aff_unique_index": "0;0", "aff_unique_norm": "Washington University in St. Louis", "aff_unique_dep": "", "aff_unique_url": "https://wustl.edu", "aff_unique_abbr": "WUSTL", "aff_campus_unique_index": "0;0", "aff_campus_unique": "St. Louis", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "id": "5BBEFotHkJ", "title": "Symmetry-preserving graph attention network to solve routing problems at multiple resolutions", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Travelling Salesperson Problems (TSPs) and Vehicle Routing Problems (VRPs) have achieved reasonable improvement in accuracy and computation time with the adaptation of Machine Learning (ML) methods. However, none of the previous works completely respects the symmetries arising from TSPs and VRPs including rotation, translation, permutation, and scaling. In this work, we introduce the first-ever completely equivariant model and training to solve combinatorial problems. Furthermore, it is essential to capture the multiscale structure (i.e. from local to global information) of the input graph, especially for the cases of large and long-range graphs, while previous methods are limited to extracting only local information that can lead to a local or sub-optimal solution. To tackle the above limitation, we propose a Multiresolution scheme in combination with Equivariant Graph Attention network (mEGAT) architecture, which can learn the optimal route based on low-level and high-level graph resolutions in an efficient way. In particular, our approach constructs a hierarchy of coarse-graining graphs from the input graph, in which we try to solve the routing problems on simple low-level graphs first, then utilize that knowledge for the more complex high-level graphs. 
Experimentally, we have shown that our model outperforms existing baselines and proved that symmetry preservation and multiresolution are important recipes for solving combinatorial problems in a data-driven manner. Our source code is publicly available at [anonymous url].", "keywords": "Symmetry;group equivariant;graph neural networks;multiresolution;multiscale;routing problems;NP-hard;combinatorics;TSP;VRP", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/a3e732803f2cc15aa40c6da99c5389f6f1ee3c57.pdf", "author": "Cong Dao Tran;Thong Bach;Truong Son Hy", "authorids": "~Cong_Dao_Tran1;~Thong_Bach1;~Truong_Son_Hy1", "gender": "M;M;M", "homepage": ";https://hytruongson.github.io/HySonLab/;https://daotranbk.github.io", "dblp": "318/9182.html;213/7552;", "google_scholar": "yFLbTtkAAAAJ;JiKBo6UAAAAJ;", "orcid": ";0000-0002-5092-3757;0009-0001-1920-7568", "linkedin": ";truong-son-h-4a9185b6/;", "or_profile": "~Thong_Bach1;~Truong_Son_Hy1;~Dao_Cong_Tran1", "aff": "Deakin University;Indiana State University;", "aff_domain": "deakin.edu.au;indstate.edu;", "position": "PhD student;Assistant Professor;", "bibtex": "@misc{\ntran2024symmetrypreserving,\ntitle={Symmetry-preserving graph attention network to solve routing problems at multiple resolutions},\nauthor={Cong Dao Tran and Thong Bach and Truong Son Hy},\nyear={2024},\nurl={https://openreview.net/forum?id=5BBEFotHkJ}\n}", "github": "", "project": "", "reviewers": "JHgM;aD1V;UYvA;sqmm", "site": "https://openreview.net/forum?id=5BBEFotHkJ", "pdf_size": 1345581, "rating": "3;3;3;5", "confidence": "5;4;3;4", "soundness": "3;3;3;3", "contribution": "2;2;2;2", "presentation": "3;4;3;3", "wc_summary": "86;102;51;64", "wc_strengths": "18;45;54;85", "wc_weaknesses": "115;185;101;317", "wc_questions": "5;286;104;6", "wc_review": "224;618;310;472", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 3.5, 0.8660254037844386 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 75.75, 19.651653874419832 ], "wc_strengths_avg": [ 50.5, 23.921747427811372 ], "wc_weaknesses_avg": [ 179.5, 85.52631174089059 ], "wc_questions_avg": [ 100.25, 114.53465632724446 ], "wc_review_avg": [ 406.0, 151.36049682793725 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=13152145194466231369&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "aff_unique_index": "0;1", "aff_unique_norm": "Deakin University;Indiana State University", "aff_unique_dep": ";", "aff_unique_url": "https://www.deakin.edu.au;https://www.indstate.edu", "aff_unique_abbr": "Deakin;ISU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1", "aff_country_unique": "Australia;United States" }, { "title": "Demystifying CLIP Data", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19438", "id": "5BCFlnfE1g", "author_site": "Hu Xu, Saining Xie, Xiaoqing Tan, Po-Yao Huang, Russell Howes, Vasu Sharma, Shang-Wen Li, Gargi Ghosh, Luke Zettlemoyer, Christoph Feichtenhofer", "tldr": "", "abstract": "Contrastive Language-Image Pre-training (CLIP) is an approach 
that has advanced research and applications in computer vision, fueling modern recognition systems and generative models. We believe that the main ingredient to the success of CLIP is its \\textit{data} and \\textit{not} the \\textit{model} architecture or pre-training {objective}. However, CLIP only provides very limited information about its data and how it has been collected, leading to works that aim to reproduce CLIP's data by filtering with its model parameters. In this work, we intend to reveal CLIP's data curation approach and in our pursuit of making it open to the community introduce Metadata-Curated Language-Image Pre-training (MetaCLIP). MetaCLIP takes a raw data pool and metadata (derived from CLIP's concepts) and yields a balanced subset over the metadata distribution. Our experimental study rigorously isolates the model and training settings, concentrating solely on data. MetaCLIP applied to CommonCrawl with 400M image-text data pairs outperforms CLIP's data on multiple standard benchmarks. In zero-shot ImageNet classification, MetaCLIP achieves 70.8\\% accuracy, surpassing CLIP's 68.3\\% on \\mbox{ViT-B} models. Scaling to 1B data, while maintaining the same training budget, attains \\textbf{72.4\\%}. Our observations hold across various model sizes, exemplified by ViT-H achieving \\textbf{80.5\\%}, without any bells-and-whistles. Curation code and training data distribution over metadata will be made available.", "keywords": "multi-modal pretraining;CLIP;image;text", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Hu Xu;Saining Xie;Xiaoqing Tan;Po-Yao Huang;Russell Howes;Vasu Sharma;Shang-Wen Li;Gargi Ghosh;Luke Zettlemoyer;Christoph Feichtenhofer", "authorids": "~Hu_Xu1;~Saining_Xie2;~Xiaoqing_Tan1;~Po-Yao_Huang2;~Russell_Howes1;~Vasu_Sharma1;~Shang-Wen_Li1;~Gargi_Ghosh3;~Luke_Zettlemoyer1;~Christoph_Feichtenhofer4", "gender": "M;F;M;M;M;F;M;M;M;M", "homepage": "https://howardhsu.github.io/;http://ellenxtan.github.io/;;http://vasusharma.github.io;https://swdanielli.github.io/;https://www.linkedin.com/in/gargi-ghosh-5b1087b;https://www.cs.washington.edu/people/faculty/lsz/;http://feichtenhofer.github.io/;https://berniebear.github.io/;", "dblp": ";;;165/0762;35/9232-1.html;;21/6793;127/1937;154/3943-1;126/0960", "google_scholar": "SaH2yWMAAAAJ;_zvwtKAAAAAJ;76IWQk8AAAAJ;PLUB4dIAAAAJ;wFI97HUAAAAJ;k5akwCcAAAAJ;https://scholar.google.com.tw/citations?user=UjpbO6IAAAAJ;UxuqG1EAAAAJ;E8K25LIAAAAJ;https://scholar.google.co.uk/citations?user=Y2GtJkAAAAAJ", "orcid": ";;;;;;;;;", "linkedin": ";xiaoqing-tan/;;vasu-sharma-6b460592?utm_source=share&utm_campaign=share_via&utm_content=profile&utm_medium=ios_app;shang-wen-daniel-li-0109b579/;gargi-ghosh-5b1087b;luke-zettlemoyer-a0109b226/;christoph-feichtenhofer-549433a1;;", "or_profile": "~Hu_Xu1;~Xiaoqing_Tan1;~Russell_Howes1;~Vasu_Sharma1;~Shang-Wen_Li1;~Gargi_Ghosh3;~Luke_Zettlemoyer1;~Christoph_Feichtenhofer4;~Po-Yao_Huang1;~Saining_Xie1", "aff": "FAIR, AMI Foundation;Meta AI;Meta AI;Meta Facebook;Meta Facebook;Meta AI;Meta;Meta FAIR;Meta;New York University", "aff_domain": "meta.com;meta.com;fb.com;fb.com;fb.com;meta.com;meta.com;meta.com;meta.com;nyu.edu", "position": "Research Scientist;Researcher;Researcher;Researcher;Research Manager;Researcher;Researcher;Principal Researcher;Researcher;Assistant Professor", "bibtex": "@inproceedings{\nxu2024demystifying,\ntitle={Demystifying {CLIP} Data},\nauthor={Hu Xu and Saining Xie and Xiaoqing Tan 
and Po-Yao Huang and Russell Howes and Vasu Sharma and Shang-Wen Li and Gargi Ghosh and Luke Zettlemoyer and Christoph Feichtenhofer},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=5BCFlnfE1g}\n}", "github": "", "project": "", "reviewers": "7LK5;f2FV;Smdn;33mj", "pdf_size": 452854, "rating": "5;6;8;8", "confidence": "3;5;4;4", "soundness": "3;3;3;3", "contribution": "3;2;3;4", "presentation": "3;3;2;4", "wc_summary": "55;52;55;95", "wc_strengths": "67;71;45;144", "wc_weaknesses": "68;139;71;298", "wc_questions": "91;51;39;271", "wc_review": "281;313;210;808", "wc_reply_reviewers": "0;19;34;172", "wc_reply_authors": "631;542;882;1226", "reply_reviewers": "0;1;1;1", "reply_authors": "1;1;2;3", "rating_avg": [ 6.75, 1.299038105676658 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 3.0, 0.7071067811865476 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 64.25, 17.795715776557007 ], "wc_strengths_avg": [ 81.75, 37.278512577623054 ], "wc_weaknesses_avg": [ 144.0, 93.3354166434157 ], "wc_questions_avg": [ 113.0, 93.23089616645332 ], "wc_review_avg": [ 403.0, 236.77943322847955 ], "wc_reply_reviewers_avg": [ 56.25, 67.9057250900099 ], "wc_reply_authors_avg": [ 820.25, 265.3699069223939 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 1.75, 0.82915619758885 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 10, 0 ], "corr_rating_confidence": 0.2721655269759087, "gs_citation": 166, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=448420599387582073&as_sdt=80000005&sciodt=0,23&hl=en", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=5BCFlnfE1g", "pdf": "https://openreview.net/pdf?id=5BCFlnfE1g", "email": "meta.com;meta.com;fb.com;fb.com;fb.com;meta.com;meta.com;meta.com;meta.com;nyu.edu", "author_num": 10, "aff_unique_index": "0;1;1;1;1;1;1;1;1;2", "aff_unique_norm": "FAIR;Meta;New York University", "aff_unique_dep": "AMI Foundation;Meta AI;", "aff_unique_url": "https://www.fair.iai.uni-sb.de/;https://meta.com;https://www.nyu.edu", "aff_unique_abbr": "FAIR;Meta;NYU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;1;1;1;1;1;1;1;1", "aff_country_unique": "France;United States" }, { "title": "Image2Sentence based Asymmetrical Zero-shot Composed Image Retrieval", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19437", "id": "5BXAXOpaWu", "author_site": "Yongchao Du, Min Wang, Wengang Zhou, Shuping Hui, Houqiang Li", "tldr": "", "abstract": "The task of composed image retrieval (CIR) aims to retrieve images based on the query image and the text describing the users' intent. \nExisting methods have made great progress with the advanced large vision-language (VL) model in CIR task, however, they generally suffer from two main issues: lack of labeled triplets for model training and difficulty of deployment on resource-restricted environments when deploying the large vision-language model. To tackle the above problems, we propose Image2Sentence based Asymmetric zero-shot composed image retrieval (ISA), which takes advantage of the VL model and only relies on unlabeled images for composition learning. In the framework, we propose a new adaptive token learner that maps an image to a sentence in the word embedding space of VL model. 
The sentence adaptively captures discriminative visual information and is further integrated with the text modifier. An asymmetric structure is devised for flexible deployment, in which the lightweight model is adopted for the query side while the large VL model is deployed on the gallery side. The global contrastive distillation and the local alignment regularization are adopted for the alignment between the light model and the VL model for CIR task. Our experiments demonstrate that the proposed ISA could better cope with the real retrieval scenarios and further improve retrieval accuracy and efficiency.", "keywords": "zero-shot;composed image retrieval;asymmetrical", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Yongchao Du;Min Wang;Wengang Zhou;Shuping Hui;Houqiang Li", "authorids": "~Yongchao_Du1;~Min_Wang9;~Wengang_Zhou1;~Shuping_Hui1;~Houqiang_Li1", "gender": "M;F;M;;M", "homepage": "https://github.com/duyc168;;http://staff.ustc.edu.cn/~zhwg/index.html;https://github.com/huisp;https://staff.ustc.edu.cn/~lihq/", "dblp": ";181/2695-19;22/4544-1;;59/7017.html", "google_scholar": ";FFDionEAAAAJ;8s1JF8YAAAAJ;;7sFMIKoAAAAJ", "orcid": ";;0000-0003-1690-9836;;0000-0003-2188-3028", "linkedin": ";;;;", "or_profile": "~Yongchao_Du1;~Min_Wang9;~Wengang_Zhou1;~Shuping_Hui1;~Houqiang_Li1", "aff": "University of Science and Technology of China;Institute of Artificial Intelligence, Hefei Comprehensive National Science Center;University of Science and Technology of China;University of Science and Technology of China;University of Science and Technology of China", "aff_domain": "ustc.edu.cn;iai.ustc.edu.cn;ustc.edu.cn;ustc.edu.cn;ustc.edu.cn", "position": "PhD student;Researcher;Full Professor;MS student;Professor", "bibtex": "@inproceedings{\ndu2024imagesentence,\ntitle={Image2Sentence based Asymmetrical Zero-shot Composed Image Retrieval},\nauthor={Yongchao Du and Min Wang and Wengang Zhou and Shuping Hui and Houqiang Li},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=5BXAXOpaWu}\n}", "github": "", "project": "", "reviewers": "ZKF9;zR31;K4T5;WHDg", "pdf_size": 3457534, "rating": "6;8;8;8", "confidence": "4;5;5;2", "soundness": "3;3;3;3", "contribution": "3;3;3;3", "presentation": "3;3;2;2", "wc_summary": "102;143;96;168", "wc_strengths": "75;83;32;116", "wc_weaknesses": "163;86;42;144", "wc_questions": "5;93;26;78", "wc_review": "345;405;196;506", "wc_reply_reviewers": "0;35;13;67", "wc_reply_authors": "733;1719;1078;1723", "reply_reviewers": "0;1;1;1", "reply_authors": "1;3;3;4", "rating_avg": [ 7.5, 0.8660254037844386 ], "confidence_avg": [ 4.0, 1.224744871391589 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 127.25, 29.67637949615822 ], "wc_strengths_avg": [ 76.5, 29.937434759845406 ], "wc_weaknesses_avg": [ 108.75, 47.8506792010312 ], "wc_questions_avg": [ 50.5, 36.16973873281365 ], "wc_review_avg": [ 363.0, 112.27867117133155 ], "wc_reply_reviewers_avg": [ 28.75, 25.380849079571785 ], "wc_reply_authors_avg": [ 1313.25, 425.60567136728804 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 2.75, 1.0897247358851685 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 12, "gs_cited_by_link": 
"https://scholar.google.com/scholar?cites=10372206563830069030&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=5BXAXOpaWu", "pdf": "https://openreview.net/pdf?id=5BXAXOpaWu", "email": "ustc.edu.cn;iai.ustc.edu.cn;ustc.edu.cn;ustc.edu.cn;ustc.edu.cn", "author_num": 5, "aff_unique_index": "0;1;0;0;0", "aff_unique_norm": "University of Science and Technology of China;Hefei Comprehensive National Science Center", "aff_unique_dep": ";Institute of Artificial Intelligence", "aff_unique_url": "http://www.ustc.edu.cn;http://www.hfcn.edu.cn", "aff_unique_abbr": "USTC;", "aff_campus_unique_index": "1", "aff_campus_unique": ";Hefei", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "China" }, { "id": "5BoXZXTJvL", "title": "Beyond Size: How Gradients Shape Pruning Decisions in Large Language Models", "track": "main", "status": "Reject", "tldr": "", "abstract": "Large Language Models (LLMs) with a billion or more parameters are prime targets for network pruning, which aims to reduce a portion of the network weights without compromising performance. Prior approaches such as Weights Magnitude, SparseGPT, and Wanda, either concentrated solely on weights or integrated weights with activations for sparsity. However, they overlooked the informative gradients derived from pretrained large language models. In this paper, we present a novel sparsity-centric pruning method for pretrained LLMs, termed **G**radient-**b**ased **L**anguage **M**odel **P**runer (**GBLM-Pruner**). Distinctively, GBLM-Pruner operates in a training-free manner by harnessing normalized gradients, and substantially outperforms competitive counterparts like SparseGPT and Wanda in multiple benchmarks. Intriguing, after incorporating gradients, the unstructured pruning method tends to reveal some structural patterns post-pruning, which mirrors the geometric interdependence inherent in the LLMs' parameter structure. Additionally, GBLM-Pruner functions without any subsequent retraining or weight updates to maintain its simplicity as other counterparts. Extensive evaluations on LLaMA-1 and LLaMA-2 across various language benchmarks and perplexity show that GBLM-Pruner surpasses magnitude pruning, Wanda (*weights+activations*), and SparseGPT (*weights+activations+weight update*) by significant margins. 
Our code and models will be publicly available.", "keywords": "Large Language Models;Gradient-based Language Model Pruner;Sparsity-centric Pruning", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/7003005c708248982f147f0891366e9f1720f860.zip", "author": "Rocktim Jyoti Das;Liqun Ma;Zhiqiang Shen", "authorids": "~Rocktim_Jyoti_Das2;~Liqun_Ma1;~Zhiqiang_Shen1", "gender": ";M;", "homepage": ";;", "dblp": ";18/2859;", "google_scholar": ";;", "orcid": ";;", "linkedin": ";;", "or_profile": "~Rocktim_Jyoti_Das2;~Liqun_Ma1;~Zhiqiang_Shen1", "aff": ";Mohamed bin Zayed University of Artificial Intelligence;", "aff_domain": ";mbzuai.ac.ae;", "position": ";PhD student;", "bibtex": "@misc{\ndas2024beyond,\ntitle={Beyond Size: How Gradients Shape Pruning Decisions in Large Language Models},\nauthor={Rocktim Jyoti Das and Liqun Ma and Zhiqiang Shen},\nyear={2024},\nurl={https://openreview.net/forum?id=5BoXZXTJvL}\n}", "github": "", "project": "", "reviewers": "B7C2;dK5u;gsUn;k6s5", "site": "https://openreview.net/forum?id=5BoXZXTJvL", "pdf_size": 2882889, "rating": "3;5;5;5", "confidence": "4;4;5;4", "soundness": "2;3;3;2", "contribution": "2;2;2;2", "presentation": "2;3;3;4", "wc_summary": "30;74;25;39", "wc_strengths": "37;56;64;63", "wc_weaknesses": "232;96;149;164", "wc_questions": "9;5;45;1", "wc_review": "308;231;283;267", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "1511;484;1100;735", "reply_reviewers": "0;0;0;0", "reply_authors": "4;1;3;1", "rating_avg": [ 4.5, 0.8660254037844386 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 42.0, 19.144189719076646 ], "wc_strengths_avg": [ 55.0, 10.8397416943394 ], "wc_weaknesses_avg": [ 160.25, 48.51997011540712 ], "wc_questions_avg": [ 15.0, 17.549928774784245 ], "wc_review_avg": [ 272.25, 27.94078560098123 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 957.5, 387.41999174023016 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 2.25, 1.299038105676658 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.3333333333333333, "gs_citation": 25, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=1523552247744558102&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 2, "aff_unique_index": "0", "aff_unique_norm": "Mohamed bin Zayed University of Artificial Intelligence", "aff_unique_dep": "", "aff_unique_url": "https://mbzuai.ac.ae", "aff_unique_abbr": "MBZUAI", "aff_country_unique_index": "0", "aff_country_unique": "United Arab Emirates" }, { "id": "5CBxA1l5RO", "title": "TimewarpVAE: Simultaneous Time-Warping and Representation Learning of Trajectories", "track": "main", "status": "Reject", "tldr": "", "abstract": "Human demonstrations of trajectories are an important source of training data for many machine learning problems. However, the difficulty of collecting human demonstration data for complex tasks makes learning efficient representations of those trajectories challenging. For many problems, such as for handwriting or for quasistatic dexterous manipulation, the exact timings of the trajectories should be factored from their spatial path characteristics. 
In this work, we propose TimewarpVAE, a fully differentiable manifold-learning algorithm that incorporates Dynamic Time Warping (DTW) to simultaneously learn both timing variations and latent factors of spatial variation. We show how the TimewarpVAE algorithm learns appropriate time alignments and meaningful representations of spatial variations in small handwriting and fork manipulation datasets. Our results have lower spatial reconstruction test error than baseline approaches and the learned low-dimensional representations can be used to efficiently generate semantically meaningful novel trajectories.", "keywords": "Representation Learning;Variational Auto-Encoder;Trajectory Data;Dynamic Time Warping", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Travers Rhodes;Daniel Lee", "authorids": "~Travers_Rhodes1;~Daniel_Lee1", "gender": "M;M", "homepage": "https://www.traversrhodes.com/;", "dblp": "223/0175;", "google_scholar": "Bf66PJEAAAAJ;J0l7wWwAAAAJ", "orcid": "0000-0002-2142-5388;", "linkedin": "travers-rhodes/;", "or_profile": "~Travers_Rhodes1;~Daniel_Lee1", "aff": "Cornell University;Cornell University", "aff_domain": "cornell.edu;cornell.edu", "position": "PhD student;Full Professor", "bibtex": "@misc{\nrhodes2024timewarpvae,\ntitle={Timewarp{VAE}: Simultaneous Time-Warping and Representation Learning of Trajectories},\nauthor={Travers Rhodes and Daniel Lee},\nyear={2024},\nurl={https://openreview.net/forum?id=5CBxA1l5RO}\n}", "github": "", "project": "", "reviewers": "qQMc;sdX1;joWW;ui6D", "site": "https://openreview.net/forum?id=5CBxA1l5RO", "pdf_size": 1662677, "rating": "3;5;6;6", "confidence": "4;3;3;4", "soundness": "4;3;3;2", "contribution": "2;2;3;3", "presentation": "4;4;4;3", "wc_summary": "93;169;68;127", "wc_strengths": "23;36;37;81", "wc_weaknesses": "193;134;77;121", "wc_questions": "3;31;94;150", "wc_review": "312;370;276;479", "wc_reply_reviewers": "76;0;40;115", "wc_reply_authors": "694;357;735;792", "reply_reviewers": "1;0;1;1", "reply_authors": "1;1;1;1", "rating_avg": [ 5.0, 1.224744871391589 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.75, 0.4330127018922193 ], "wc_summary_avg": [ 114.25, 37.91684981640748 ], "wc_strengths_avg": [ 44.25, 21.924586655168667 ], "wc_weaknesses_avg": [ 131.25, 41.43896113562694 ], "wc_questions_avg": [ 69.5, 56.97587208634897 ], "wc_review_avg": [ 359.25, 76.84196444651842 ], "wc_reply_reviewers_avg": [ 57.75, 42.60501731017135 ], "wc_reply_authors_avg": [ 644.5, 169.59731719576226 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.40824829046386296, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=4503611427123033463&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "aff_unique_index": "0;0", "aff_unique_norm": "Cornell University", "aff_unique_dep": "", "aff_unique_url": "https://www.cornell.edu", "aff_unique_abbr": "Cornell", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "id": "5COCYDObes", "title": "Ask more, know better: Reinforce-Learned Prompt Questions for Decision Making with Large Language Models", "track": "main", "status": "Reject", "tldr": "", "abstract": "Large language models (LLMs) 
demonstrate their promise in tackling complicated\npractical challenges by combining action-based policies with chain of thought\n(CoT) reasoning. Having high-quality prompts on hand, however, is vital to the\nframework\u2019s effectiveness. Currently, these prompts are handcrafted utilising\nextensive human labor, resulting in CoT policies that frequently fail to generalise.\nHuman intervention is also required in order to develop grounding functions that\nensure low-level controllers appropriately process CoT reasoning. In this paper, we\ntake the first step towards a fully integrated end-to-end framework for task-solving\nin real settings employing complicated reasoning. To that purpose, we offer a new\nleader-follower bilevel framework capable of learning to ask relevant questions\n(prompts) and subsequently undertaking reasoning to guide the learning of actions\nto be performed in an environment. A good prompt should make introspective\nrevisions based on historical findings, leading the CoT to consider the anticipated\ngoals. A prompt-generator policy has its own aim in our system, allowing it to\nadapt to the action policy and automatically root the CoT process towards outputs\nthat lead to decisive, high-performing actions. Meanwhile, the action policy is\nlearning how to use the CoT outputs to take specific actions. Our empirical data\nreveal that our system outperforms leading methods in agent learning benchmarks\nsuch as Overcooked and FourRoom.", "keywords": "Large language models;reinforcement learning;machine learning", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/3b7a587091358a68219ffb7923459f90d1251bd7.pdf", "author": "Xue Yan;Yan Song;Xinyu Cui;Filippos Christianos;Haifeng Zhang;David Henry Mguni;Jun Wang", "authorids": "~Xue_Yan2;~Yan_Song5;~Xinyu_Cui3;~Filippos_Christianos1;~Haifeng_Zhang3;~David_Henry_Mguni1;~Jun_Wang2", "gender": "F;M;M;M;;M;M", "homepage": ";;;;https://pkuzhf.github.io;;http://www0.cs.ucl.ac.uk/staff/jun.wang/", "dblp": ";;;184/8334;93/7133-2;217/2369;w/JunWang12", "google_scholar": "5d0Upv8AAAAJ;;;q09VRMkAAAAJ;;K-_yzBsAAAAJ;https://scholar.google.co.uk/citations?user=wIE1tY4AAAAJ", "orcid": ";;;;;;", "linkedin": "\u96ea-\u95eb-48926a188/;yan-song-079477173/;%E6%96%B0%E5%AE%87-%E5%B4%94-a8506b293/;;;;", "or_profile": "~Xue_Yan2;~Yan_Song5;~Xinyu_Cui3;~Filippos_Christianos1;~Haifeng_Zhang3;~David_Henry_Mguni1;~Jun_Wang2", "aff": "Institute of Automation, Chinese Academy of Sciences;University College London, University of London;Institute of Automation, Chinese Academy of Sciences;Huawei Technologies Ltd.;Institute of Automation, Chinese Academy of Sciences;Queen Mary University, London;University College London", "aff_domain": "ia.ac.cn;ucl.ac.uk;ia.ac.cn;huawei.com;ia.ac.cn;qmul.ac.uk;ucl.ac.uk", "position": "PhD student;PhD student;PhD student;Researcher;Associate Professor;Lecturer;Professor", "bibtex": "@misc{\nyan2024ask,\ntitle={Ask more, know better: Reinforce-Learned Prompt Questions for Decision Making with Large Language Models},\nauthor={Xue Yan and Yan Song and Xinyu Cui and Filippos Christianos and Haifeng Zhang and David Henry Mguni and Jun Wang},\nyear={2024},\nurl={https://openreview.net/forum?id=5COCYDObes}\n}", "github": "", "project": "", "reviewers": "UBnq;5KxL;g6Ja;WqYj", "site": "https://openreview.net/forum?id=5COCYDObes", "pdf_size": 1083443, "rating": "3;5;6;6", "confidence": "5;4;3;4", "soundness": "1;3;3;2", "contribution": "1;2;3;2", "presentation": "1;2;4;3", "wc_summary": "31;63;63;76", 
"wc_strengths": "17;34;88;36", "wc_weaknesses": "226;144;124;136", "wc_questions": "368;16;57;186", "wc_review": "642;257;332;434", "wc_reply_reviewers": "260;76;0;160", "wc_reply_authors": "1878;752;507;1527", "reply_reviewers": "1;1;0;1", "reply_authors": "5;2;2;5", "rating_avg": [ 5.0, 1.224744871391589 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.25, 0.82915619758885 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 2.5, 1.118033988749895 ], "wc_summary_avg": [ 58.25, 16.60383991732033 ], "wc_strengths_avg": [ 43.75, 26.592997198510737 ], "wc_weaknesses_avg": [ 157.5, 40.18395202067612 ], "wc_questions_avg": [ 156.75, 137.15205977308543 ], "wc_review_avg": [ 416.25, 144.686514575478 ], "wc_reply_reviewers_avg": [ 124.0, 96.78842906050289 ], "wc_reply_authors_avg": [ 1166.0, 557.4365434737841 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 3.5, 1.5 ], "replies_avg": [ 24, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.8660254037844386, "gs_citation": 8, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10287892105655605990&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "aff_unique_index": "0;1;0;2;0;3;1", "aff_unique_norm": "Chinese Academy of Sciences;University College London;Huawei;Queen Mary University of London", "aff_unique_dep": "Institute of Automation;;Huawei Technologies;", "aff_unique_url": "http://www.ia.cas.cn;https://www.ucl.ac.uk;https://www.huawei.com;https://www.qmul.ac.uk", "aff_unique_abbr": "CAS;UCL;Huawei;QMUL", "aff_campus_unique_index": "1", "aff_campus_unique": ";London", "aff_country_unique_index": "0;1;0;0;0;1;1", "aff_country_unique": "China;United Kingdom" }, { "title": "Interpreting CLIP's Image Representation via Text-Based Decomposition", "status": "Oral", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19436", "id": "5Ca9sSzuDp", "author_site": "Yossi Gandelsman, Alexei Efros, Jacob Steinhardt", "tldr": "", "abstract": "We investigate the CLIP image encoder by analyzing how individual model components affect the final representation. We decompose the image representation as a sum across individual image patches, model layers, and attention heads, and use CLIP's text representation to interpret the summands. Interpreting the attention heads, we characterize each head's role by automatically finding text representations that span its output space, which reveals property-specific roles for many heads (e.g. location or shape). Next, interpreting the image patches, we uncover an emergent spatial localization within CLIP. Finally, we use this understanding to remove spurious features from CLIP and to create a strong zero-shot image segmenter. 
Our results indicate that scalable understanding of transformer models is attainable and can be used to repair and improve models.", "keywords": "CLIP;interpretability;explainability", "primary_area": "visualization or interpretation of learned representations", "supplementary_material": "", "author": "Yossi Gandelsman;Alexei A Efros;Jacob Steinhardt", "authorids": "~Yossi_Gandelsman2;~Alexei_A_Efros1;~Jacob_Steinhardt1", "gender": ";M;M", "homepage": ";http://www.eecs.berkeley.edu/~efros/;https://yossi.gandelsman.com", "dblp": "35/10625;40/6158;232/1765", "google_scholar": ";https://scholar.google.com.tw/citations?user=d97bGd8AAAAJ;https://scholar.google.co.il/citations?user=71L4yYMAAAAJ", "orcid": ";0000-0001-5720-8070;0000-0003-1259-3387", "linkedin": ";alexei-efros-890736a3/;yossi-gandelsman-26582981/", "or_profile": "~Jacob_Steinhardt1;~Alyosha_Efros1;~Yossi_Gandelsman1", "aff": "University of California, Berkeley;University of California, Berkeley;University of California, Berkeley", "aff_domain": "berkeley.edu;berkeley.edu;berkeley.edu", "position": "Assistant Professor;Professor;PhD student", "bibtex": "@inproceedings{\ngandelsman2024interpreting,\ntitle={Interpreting {CLIP}'s Image Representation via Text-Based Decomposition},\nauthor={Yossi Gandelsman and Alexei A Efros and Jacob Steinhardt},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=5Ca9sSzuDp}\n}", "github": "", "project": "", "reviewers": "bDCR;eYDd;uT2r;ETim", "pdf_size": 24318917, "rating": "8;8;8;8", "confidence": "4;4;2;4", "soundness": "4;3;3;3", "contribution": "4;3;3;3", "presentation": "4;4;3;4", "wc_summary": "70;97;121;131", "wc_strengths": "109;71;28;149", "wc_weaknesses": "68;209;23;104", "wc_questions": "85;51;84;8", "wc_review": "332;428;256;392", "wc_reply_reviewers": "27;20;0;70", "wc_reply_authors": "408;561;453;279", "reply_reviewers": "1;1;0;2", "reply_authors": "1;1;2;2", "rating_avg": [ 8.0, 0.0 ], "confidence_avg": [ 3.5, 0.8660254037844386 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 3.25, 0.4330127018922193 ], "presentation_avg": [ 3.75, 0.4330127018922193 ], "wc_summary_avg": [ 104.75, 23.562417108607512 ], "wc_strengths_avg": [ 89.25, 44.846265173367556 ], "wc_weaknesses_avg": [ 101.0, 68.6403671318853 ], "wc_questions_avg": [ 57.0, 31.424512724941337 ], "wc_review_avg": [ 352.0, 65.1766829472013 ], "wc_reply_reviewers_avg": [ 29.25, 25.52817071393875 ], "wc_reply_authors_avg": [ 425.25, 101.09988872397437 ], "reply_reviewers_avg": [ 1.0, 0.7071067811865476 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 91, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6302865657616014104&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=5Ca9sSzuDp", "pdf": "https://openreview.net/pdf?id=5Ca9sSzuDp", "email": "berkeley.edu;berkeley.edu;berkeley.edu", "author_num": 3, "aff_unique_index": "0;0;0", "aff_unique_norm": "University of California, Berkeley", "aff_unique_dep": "", "aff_unique_url": "https://www.berkeley.edu", "aff_unique_abbr": "UC Berkeley", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Berkeley", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "title": "Physics-Regulated Deep Reinforcement Learning: Invariant Embeddings", "status": "Spotlight", "track": "main", "site": 
"https://iclr.cc/virtual/2024/poster/19435", "id": "5Dwqu5urzs", "author_site": "Hongpeng Cao, Yanbing Mao, Lui Sha, Marco Caccamo", "tldr": "", "abstract": "This paper proposes the Phy-DRL: a physics-regulated deep reinforcement learning (DRL) framework for safety-critical autonomous systems. The Phy-DRL has three distinguished invariant-embedding designs: i) residual action policy (i.e., integrating data-driven-DRL action policy and physics-model-based action policy), ii) automatically constructed safety-embedded reward, and iii) physics-model-guided neural network (NN) editing, including link editing and activation editing. Theoretically, the Phy-DRL exhibits 1) a mathematically provable safety guarantee and 2) strict compliance of critic and actor networks with physics knowledge about the action-value function and action policy. Finally, we evaluate the Phy-DRL on a cart-pole system and a quadruped robot. The experiments validate our theoretical results and demonstrate that Phy-DRL features guaranteed safety compared to purely data-driven DRL and solely model-based design while offering remarkably fewer learning parameters and fast training towards safety guarantee.", "keywords": "Physics-informed deep reinforcement learning;Safety-critical autonomous systems", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/289020ab57bf742ddf172c907d97beacd14306b7.zip", "author": "Hongpeng Cao;Yanbing Mao;Lui Sha;Marco Caccamo", "authorids": "~Hongpeng_Cao1;~Yanbing_Mao1;~Lui_Sha1;~Marco_Caccamo2", "gender": "M;M;M;", "homepage": "https://rtsl.cps.mw.tum.de/view_member?id=15;https://ymao578.github.io/index.html;https://ece.illinois.edu/directory/profile/lrs;https://rtsl.cps.mw.tum.de/personal_page/mcaccamo/", "dblp": "285/4627;141/4975;67/5282.html;86/450", "google_scholar": "47WX07UAAAAJ;kN1IRpsAAAAJ;https://scholar.google.com.tw/citations?user=SlXqNooAAAAJ;", "orcid": "0000-0003-4717-8714;;;", "linkedin": "hongpeng-cao-195299206/?originalSubdomain=de;;;", "or_profile": "~Hongpeng_Cao1;~Yanbing_Mao1;~Lui_Sha1;~Marco_Caccamo2", "aff": "Technische Universit\u00e4t M\u00fcnchen;Wayne State University;Department of Computer Science;Technische Universit\u00e4t M\u00fcnchen", "aff_domain": "tum.de;wayne.edu;cs.illinois.edu;tum.de", "position": "PhD student;Assistant Professor;Full Professor;Full Professor", "bibtex": "@inproceedings{\ncao2024physicsregulated,\ntitle={Physics-Regulated Deep Reinforcement Learning: Invariant Embeddings},\nauthor={Hongpeng Cao and Yanbing Mao and Lui Sha and Marco Caccamo},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=5Dwqu5urzs}\n}", "github": "", "project": "", "reviewers": "GsDG;bsXP;BXs3;4Lie", "pdf_size": 8326933, "rating": "6;8;8;8", "confidence": "3;2;3;2", "soundness": "2;3;3;2", "contribution": "3;3;3;2", "presentation": "2;3;3;1", "wc_summary": "106;63;49;109", "wc_strengths": "31;45;69;81", "wc_weaknesses": "121;51;137;103", "wc_questions": "44;4;47;56", "wc_review": "302;163;302;349", "wc_reply_reviewers": "299;73;83;15", "wc_reply_authors": "3313;2024;1690;1374", "reply_reviewers": "2;2;2;1", "reply_authors": "8;8;6;4", "rating_avg": [ 7.5, 0.8660254037844386 ], "confidence_avg": [ 2.5, 0.5 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 2.25, 0.82915619758885 ], "wc_summary_avg": [ 81.75, 26.242856170775315 ], "wc_strengths_avg": [ 56.5, 19.615045245933032 ], "wc_weaknesses_avg": [ 103.0, 
32.341923257592455 ], "wc_questions_avg": [ 37.75, 19.97967717456916 ], "wc_review_avg": [ 279.0, 69.6670653896086 ], "wc_reply_reviewers_avg": [ 117.5, 107.9571674322738 ], "wc_reply_authors_avg": [ 2100.25, 736.9397448231435 ], "reply_reviewers_avg": [ 1.75, 0.4330127018922193 ], "reply_authors_avg": [ 6.5, 1.6583123951777 ], "replies_avg": [ 41, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 7, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14670243720961949725&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=5Dwqu5urzs", "pdf": "https://openreview.net/pdf?id=5Dwqu5urzs", "email": "tum.de;wayne.edu;cs.illinois.edu;tum.de", "author_num": 4, "aff_unique_index": "0;1;2;0", "aff_unique_norm": "Technische Universit\u00e4t M\u00fcnchen;Wayne State University;Unknown Institution", "aff_unique_dep": ";;Department of Computer Science", "aff_unique_url": "https://www.tum.de;https://wayne.edu;", "aff_unique_abbr": "TUM;WSU;", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;0", "aff_country_unique": "Germany;United States;" }, { "id": "5E1HnzEBSf", "title": "Local Superior Soups: A Catalyst for Reducing Communication Rounds in Federated Learning with Pre-trained Model", "track": "main", "status": "Reject", "tldr": "", "abstract": "Federated learning (FL) is a learning paradigm that enables collaborative training of models using decentralized data. \nRecently, the utilization of pre-trained weight initialization in FL has been demonstrated to effectively improve model performance. \nHowever, the current pre-trained models have become increasingly parameter-rich. \nThe sheer scale of model parameters introduces substantial communication rounds challenges during their adaptation to FL.\nTo address these communication cost issues and elevate the performance of pre-trained model adaptation in FL, we propose an innovative model interpolation-based local training technique called ``Local Superior Soups.''\nOur method promotes local training across different clients, encouraging the exploration of a connected low-loss basin within a few communication rounds through regularized model interpolation. 
\nThis approach serves as a facilitator for pre-trained model adaptation in FL.\nWe demonstrated its effectiveness and efficiency across diverse widely-used FL datasets.", "keywords": "Federated Learning; Model Soup; Pre-Trained Model Fine-Tuning", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/17a08d39903392bcd1e2b91833dc56cabe3d9c3c.pdf", "author": "Minghui Chen;Meirui Jiang;Qi Dou;Zehua Wang;Xiaoxiao Li", "authorids": "~Minghui_Chen1;~Meirui_Jiang2;~Qi_Dou2;~Zehua_Wang1;~Xiaoxiao_Li1", "gender": "M;F;M;Unspecified;M", "homepage": "https://chenminghui.com/;https://www.cse.cuhk.edu.hk/~qdou;https://people.ece.ubc.ca/zwang/;https://xxlya.github.io/;https://meiruijiang.github.io/MeiruiJiang/", "dblp": ";165/7846;90/10799;71/8042;285/5480", "google_scholar": "aDKyh4cAAAAJ;https://scholar.google.com.hk/citations?user=iHh7IJQAAAAJ;https://scholar.google.ca/citations?user=pquTtPYAAAAJ;sdENOQ4AAAAJ;https://scholar.google.com/citations?hl=en", "orcid": ";0000-0002-3416-9950;;;0000-0003-4228-8420", "linkedin": "minghui-chen-75a046210/;;wangzehua/;;", "or_profile": "~Minghui_Chen1;~Qi_Dou2;~Zehua_Wang1;~Xiaoxiao_Li1;~Meirui_JIANG1", "aff": "University of British Columbia;The Chinese University of Hong Kong;University of British Columbia;University of British Columbia;Department of Computer Science and Engineering, The Chinese University of Hong Kong", "aff_domain": "ubc.ca;cuhk.edu.hk;ubc.ca;ece.ubc.ca;cse.cuhk.edu.hk", "position": "PhD student;Assistant Professor;Researcher;Assistant Professor;PhD student", "bibtex": "@misc{\nchen2024local,\ntitle={Local Superior Soups: A Catalyst for Reducing Communication Rounds in Federated Learning with Pre-trained Model},\nauthor={Minghui Chen and Meirui Jiang and Qi Dou and Zehua Wang and Xiaoxiao Li},\nyear={2024},\nurl={https://openreview.net/forum?id=5E1HnzEBSf}\n}", "github": "", "project": "", "reviewers": "gxja;w5Zc;w8kd;qnQ5", "site": "https://openreview.net/forum?id=5E1HnzEBSf", "pdf_size": 1010806, "rating": "3;3;5;6", "confidence": "4;5;4;4", "soundness": "3;3;2;3", "contribution": "2;2;2;3", "presentation": "4;3;2;2", "wc_summary": "46;117;165;51", "wc_strengths": "24;21;105;32", "wc_weaknesses": "130;80;411;274", "wc_questions": "4;11;282;3", "wc_review": "204;229;963;360", "wc_reply_reviewers": "0;43;0;0", "wc_reply_authors": "306;400;586;297", "reply_reviewers": "0;1;0;0", "reply_authors": "1;2;1;1", "rating_avg": [ 4.25, 1.299038105676658 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.82915619758885 ], "wc_summary_avg": [ 94.75, 49.29693195321591 ], "wc_strengths_avg": [ 45.5, 34.586847211042524 ], "wc_weaknesses_avg": [ 223.75, 129.46114281899415 ], "wc_questions_avg": [ 75.0, 119.55124424279322 ], "wc_review_avg": [ 439.0, 308.27828337396716 ], "wc_reply_reviewers_avg": [ 10.75, 18.619546181365433 ], "wc_reply_authors_avg": [ 397.25, 116.20106496930224 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.5555555555555555, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:yMmn_TLjQpYJ:scholar.google.com/&scioq=Local+Superior+Soups:+A+Catalyst+for+Reducing+Communication+Rounds+in+Federated+Learning+with+Pre-trained+Model&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": 
"0;1;0;0;1", "aff_unique_norm": "University of British Columbia;Chinese University of Hong Kong", "aff_unique_dep": ";", "aff_unique_url": "https://www.ubc.ca;https://www.cuhk.edu.hk", "aff_unique_abbr": "UBC;CUHK", "aff_campus_unique_index": "1;1", "aff_campus_unique": ";Hong Kong SAR", "aff_country_unique_index": "0;1;0;0;1", "aff_country_unique": "Canada;China" }, { "title": "The Effective Horizon Explains Deep RL Performance in Stochastic Environments", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19434", "id": "5ES5Hdlbxw", "author_site": "Cassidy Laidlaw, Banghua Zhu, Stuart Russell, Anca Dragan", "tldr": "", "abstract": "Reinforcement learning (RL) theory has largely focused on proving minimax sample complexity bounds. These require strategic exploration algorithms that use relatively limited function classes for representing the policy or value function. Our goal is to explain why deep RL algorithms often perform well in practice, despite using random exploration and much more expressive function classes like neural networks. Our work arrives at an explanation by showing that many stochastic MDPs can be solved by performing only a few steps of value iteration on the random policy\u2019s Q function and then acting greedily. When this is true, we find that it is possible to separate the exploration and learning components of RL, making it much easier to analyze. We introduce a new RL algorithm, SQIRL, that iteratively learns a near-optimal policy by exploring randomly to collect rollouts and then performing a limited number of steps of fitted-Q iteration over those roll- outs. We find that any regression algorithm that satisfies basic in-distribution generalization properties can be used in SQIRL to efficiently solve common MDPs. This can explain why deep RL works with complex function approximators like neural networks, since it is empirically established that neural networks generalize well in-distribution. Furthermore, SQIRL explains why random exploration works well in practice, since we show many environments can be solved by effectively estimating the random policy\u2019s Q-function and then applying zero or a few steps of value iteration. We leverage SQIRL to derive instance-dependent sample complexity bounds for RL that are exponential only in an \u201ceffective horizon\u201d of lookahead\u2014which is typically much smaller than the full horizon\u2014and on the complexity of the class used for function approximation. Empirically, we also find that SQIRL performance strongly correlates with PPO and DQN performance in a variety of stochastic environments, supporting that our theoretical analysis is predictive of practical performance. 
Our code and data are available at https://github.com/cassidylaidlaw/effective-horizon.", "keywords": "reinforcement learning;effective horizon;RL theory;theory of reinforcement learning;instance-dependent bounds;empirical validation of theory", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Cassidy Laidlaw;Banghua Zhu;Stuart Russell;Anca Dragan", "authorids": "~Cassidy_Laidlaw1;~Banghua_Zhu1;~Stuart_Russell1;~Anca_Dragan1", "gender": "M;M;M;F", "homepage": "https://cassidylaidlaw.com;https://people.eecs.berkeley.edu/~banghua/;https://people.eecs.berkeley.edu/~russell/;http://www.ancadragan.com/", "dblp": "241/5375;204/5394;;", "google_scholar": "DzeJ67UAAAAJ;https://scholar.google.com/citations?hl=en;https://scholar.google.com.tw/citations?user=KJGrjCAAAAAJ;", "orcid": ";;;", "linkedin": ";;;", "or_profile": "~Cassidy_Laidlaw1;~Banghua_Zhu1;~Stuart_Russell1;~Anca_Dragan1", "aff": "University of California, Berkeley;University of California, Berkeley;University of California, Berkeley;University of California, Berkeley", "aff_domain": "berkeley.edu;berkeley.edu;berkeley.edu;berkeley.edu", "position": "PhD student;PhD student;Full Professor;Associate Professor", "bibtex": "@inproceedings{\nlaidlaw2024the,\ntitle={The Effective Horizon Explains Deep {RL} Performance in Stochastic Environments},\nauthor={Cassidy Laidlaw and Banghua Zhu and Stuart Russell and Anca Dragan},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=5ES5Hdlbxw}\n}", "github": "", "project": "", "reviewers": "kbuB;UBNV;1dWJ;yWoc", "pdf_size": 1650168, "rating": "5;6;6;6", "confidence": "2;4;3;3", "soundness": "3;3;3;3", "contribution": "2;3;2;2", "presentation": "3;4;3;3", "wc_summary": "42;120;219;91", "wc_strengths": "13;122;171;154", "wc_weaknesses": "35;196;508;254", "wc_questions": "67;92;4;1", "wc_review": "157;530;902;500", "wc_reply_reviewers": "0;13;225;207", "wc_reply_authors": "438;799;1126;1168", "reply_reviewers": "0;1;2;2", "reply_authors": "1;1;2;2", "rating_avg": [ 5.75, 0.4330127018922193 ], "confidence_avg": [ 3.0, 0.7071067811865476 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 118.0, 64.6335826022355 ], "wc_strengths_avg": [ 115.0, 61.461369981476984 ], "wc_weaknesses_avg": [ 248.25, 170.0799444379025 ], "wc_questions_avg": [ 41.0, 39.515819616958474 ], "wc_review_avg": [ 522.25, 263.71042357100714 ], "wc_reply_reviewers_avg": [ 111.25, 105.04374088921243 ], "wc_reply_authors_avg": [ 882.75, 293.8344559441591 ], "reply_reviewers_avg": [ 1.25, 0.82915619758885 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.816496580927726, "gs_citation": 4, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=8388709054180809828&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 9, "openreview": "https://openreview.net/forum?id=5ES5Hdlbxw", "pdf": "https://openreview.net/pdf?id=5ES5Hdlbxw", "email": "berkeley.edu;berkeley.edu;berkeley.edu;berkeley.edu", "author_num": 4, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "University of California, Berkeley", "aff_unique_dep": "", "aff_unique_url": "https://www.berkeley.edu", "aff_unique_abbr": "UC Berkeley", "aff_campus_unique_index": "0;0;0;0", "aff_campus_unique": "Berkeley", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "title": 
"Weatherproofing Retrieval for Localization with Generative AI and Geometric Consistency", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19433", "id": "5EniAcsO7f", "author_site": "Yannis Kalantidis, Mert Bulent SARIYILDIZ, Rafael Rezende, Philippe Weinzaepfel, Diane Larlus, Gabriela Csurka", "tldr": "", "abstract": "State-of-the-art visual localization approaches generally rely on a first image retrieval step whose role is crucial. Yet, retrieval often struggles when facing varying conditions, due to e.g. weather or time of day, with dramatic consequences on the visual localization accuracy. In this paper, we improve this retrieval step and tailor it to the final localization task. Among the several changes we advocate for, we propose to synthesize variants of the training set images, obtained from generative text-to-image models, in order to automatically expand the training set towards a number of nameable variations that particularly hurt visual localization. After expanding the training set, we propose a training approach that leverages the specificities and the underlying geometry of this mix of real and synthetic images. We experimentally show that those changes translate into large improvements for the most challenging visual localization datasets.", "keywords": "visual localization;image retrieval;synthetic data;domain shift;geometric consistency;long-term visual localization;ret4loc;image alteration", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Yannis Kalantidis;Mert B\u00fclent Sar\u0131y\u0131ld\u0131z;Rafael S. Rezende;Philippe Weinzaepfel;Diane Larlus;Gabriela Csurka", "authorids": "~Yannis_Kalantidis2;~Mert_B\u00fclent_Sar\u0131y\u0131ld\u0131z1;~Rafael_S._Rezende1;~Philippe_Weinzaepfel1;~Diane_Larlus1;~Gabriela_Csurka2", "gender": "M;M;M;M;F;F", "homepage": "https://www.skamalas.com/;https://mbsariyildiz.github.io;https://europe.naverlabs.com/people_user/rafael-sampaio-de-rezende/;https://europe.naverlabs.com/people_user/Philippe-Weinzaepfel/;https://dlarlus.github.io/;https://europe.naverlabs.com/people_user/gabriela-csurka-khedari", "dblp": "33/8693;247/9362;200/8093;29/9989;48/4033;c/GabrielaCsurka", "google_scholar": "QJZQgN8AAAAJ;9vpQ9tIAAAAJ;https://scholar.google.com/citations?hl=fr;https://scholar.google.fr/citations?user=LSxIJ5cAAAAJ;https://scholar.google.fr/citations?user=nI2oJqkAAAAJ;https://scholar.google.fr/citations?user=PXm1lPAAAAAJ", "orcid": ";;;;;", "linkedin": ";;;;;gabriela-csurka-0387bb2a/", "or_profile": "~Yannis_Kalantidis2;~Mert_B\u00fclent_Sar\u0131y\u0131ld\u0131z1;~Rafael_S._Rezende1;~Philippe_Weinzaepfel1;~Diane_Larlus1;~Gabriela_Csurka2", "aff": "Naver Labs Europe;Naver Labs Europe;Naver Labs Europe;Naver Labs Europe;NAVER LABS Europe;Naver Labs Europe", "aff_domain": "naverlabs.com;naverlabs.com;naverlabs.com;naverlabs.com;naverlabs.com;naverlabs.com", "position": "Research Scientist;Researcher;Research Scientist;Research Scientist;Principal Researcher;Principal Researcher", "bibtex": "@inproceedings{\nkalantidis2024weatherproofing,\ntitle={Weatherproofing Retrieval for Localization with Generative {AI} and Geometric Consistency},\nauthor={Yannis Kalantidis and Mert B{\\\"u}lent Sar{\\i}y{\\i}ld{\\i}z and Rafael S. 
Rezende and Philippe Weinzaepfel and Diane Larlus and Gabriela Csurka},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=5EniAcsO7f}\n}", "github": "", "project": "", "reviewers": "dtiA;oYk5;Hu6J", "pdf_size": 20924613, "rating": "6;6;8", "confidence": "5;3;3", "soundness": "2;3;3", "contribution": "2;3;3", "presentation": "3;3;3", "wc_summary": "87;69;69", "wc_strengths": "242;28;80", "wc_weaknesses": "412;145;62", "wc_questions": "5;8;62", "wc_review": "746;250;273", "wc_reply_reviewers": "178;21;0", "wc_reply_authors": "1749;806;565", "reply_reviewers": "3;1;0", "reply_authors": "3;2;1", "rating_avg": [ 6.666666666666667, 0.9428090415820634 ], "confidence_avg": [ 3.6666666666666665, 0.9428090415820634 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 75.0, 8.48528137423857 ], "wc_strengths_avg": [ 116.66666666666667, 91.13116310510301 ], "wc_weaknesses_avg": [ 206.33333333333334, 149.32366040100797 ], "wc_questions_avg": [ 25.0, 26.19160170741759 ], "wc_review_avg": [ 423.0, 228.5884219873497 ], "wc_reply_reviewers_avg": [ 66.33333333333333, 79.4243175747971 ], "wc_reply_authors_avg": [ 1040.0, 510.9018170516392 ], "reply_reviewers_avg": [ 1.3333333333333333, 1.247219128924647 ], "reply_authors_avg": [ 2.0, 0.816496580927726 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.5, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:7THObuIPnnsJ:scholar.google.com/&scioq=Weatherproofing+Retrieval+for+Localization+with+Generative+AI+and+Geometric+Consistency&hl=en&as_sdt=0,44", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=5EniAcsO7f", "pdf": "https://openreview.net/pdf?id=5EniAcsO7f", "email": "naverlabs.com;naverlabs.com;naverlabs.com;naverlabs.com;naverlabs.com;naverlabs.com", "author_num": 6, "aff_unique_index": "0;0;0;0;0;0", "aff_unique_norm": "NAVER LABS", "aff_unique_dep": "", "aff_unique_url": "https://labs.naver.com", "aff_unique_abbr": "NLE", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;1;0", "aff_country_unique": "Unknown;France" }, { "id": "5EtSvYUU0v", "title": "Connecting NTK and NNGP: A Unified Theoretical Framework for Neural Network Learning Dynamics in the Kernel Regime", "track": "main", "status": "Reject", "tldr": "", "abstract": "Artificial neural networks (ANNs) have revolutionized machine learning in recent years, but a complete theoretical framework for their learning process is still lacking. Substantial theoretical advances have been achieved for infinitely wide networks. In this regime, two disparate theoretical frameworks have been used, in which the network\u2019s output is described using kernels: one framework is based on the Neural Tangent Kernel (NTK), which assumes linearized gradient descent dynamics, while the Neural Network Gaussian Process (NNGP) kernel assumes a Bayesian framework. However, the relation between these two frameworks and between their underlying sets of assumptions has remained elusive. This work unifies these two distinct theories using gradient descent learning dynamics with an additional small noise in an ensemble of randomly initialized infinitely wide deep networks. 
We derive an exact analytical expression for the network input-output function during and after learning and introduce a new time-dependent Neural Dynamical Kernel (NDK) from which both NTK and NNGP kernels can be derived. We identify two important learning phases characterized by different time scales: gradient-driven and diffusive learning. In the initial gradient-driven learning phase, the dynamics is dominated by deterministic gradient descent, and is adequately described by the NTK theory. This phase is followed by the slow diffusive learning stage, during which the network parameters sample the solution space, ultimately approaching the equilibrium posterior distribution corresponding to NNGP. Combined with numerical evaluations on synthetic and benchmark datasets, we provide novel insights into the different roles of initialization, regularization, and network depth, as well as phenomena such as early stopping and representational drift. This work closes the gap between the NTK and NNGP theories, providing a comprehensive framework for understanding the learning process of deep neural networks in the infinite width limit.", "keywords": "Learning dynamics;Neural tangent kernel;Neural network Gaussian process;Infinite width limit;Representational drift;Statistical mechanics", "primary_area": "learning theory", "supplementary_material": "/attachment/78a56dc0d1eb798f652b92220e09b57b7dd3f4c8.pdf", "author": "Yehonatan Avidan;Qianyi Li;Haim Sompolinsky", "authorids": "~Yehonatan_Avidan1;~Qianyi_Li1;~Haim_Sompolinsky1", "gender": ";F;M", "homepage": ";;", "dblp": "274/0837;280/1128;33/5545", "google_scholar": "-pnXrNwAAAAJ;LbzGoc8AAAAJ;", "orcid": ";0000-0002-1448-4566;", "linkedin": ";;", "or_profile": "~Yehonatan_Avidan1;~Qianyi_Li1;~Haim_Sompolinsky1", "aff": ";Harvard University, Harvard University;", "aff_domain": ";g.harvard.edu;", "position": ";PhD student;", "bibtex": "@misc{\navidan2024connecting,\ntitle={Connecting {NTK} and {NNGP}: A Unified Theoretical Framework for Neural Network Learning Dynamics in the Kernel Regime},\nauthor={Yehonatan Avidan and Qianyi Li and Haim Sompolinsky},\nyear={2024},\nurl={https://openreview.net/forum?id=5EtSvYUU0v}\n}", "github": "", "project": "", "reviewers": "2yMn;2CVF;Bpa7;88ey", "site": "https://openreview.net/forum?id=5EtSvYUU0v", "pdf_size": 4473456, "rating": "3;5;8;8", "confidence": "3;5;4;3", "soundness": "3;3;4;3", "contribution": "4;3;3;4", "presentation": "1;2;3;4", "wc_summary": "174;67;113;161", "wc_strengths": "105;54;42;150", "wc_weaknesses": "150;108;202;189", "wc_questions": "152;376;132;124", "wc_review": "581;605;489;624", "wc_reply_reviewers": "262;24;155;108", "wc_reply_authors": "627;717;683;407", "reply_reviewers": "1;1;1;1", "reply_authors": "2;1;2;2", "rating_avg": [ 6.0, 2.1213203435596424 ], "confidence_avg": [ 3.75, 0.82915619758885 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 3.5, 0.5 ], "presentation_avg": [ 2.5, 1.118033988749895 ], "wc_summary_avg": [ 128.75, 42.2751404492049 ], "wc_strengths_avg": [ 87.75, 43.0254285277904 ], "wc_weaknesses_avg": [ 162.25, 36.70405290972647 ], "wc_questions_avg": [ 196.0, 104.4222198576529 ], "wc_review_avg": [ 574.75, 51.799493240764434 ], "wc_reply_reviewers_avg": [ 137.25, 85.96329158425705 ], "wc_reply_authors_avg": [ 608.5, 120.69279183116114 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 1.75, 0.4330127018922193 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 11, 
"gs_cited_by_link": "https://scholar.google.com/scholar?cites=10431141825192819348&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 3, "aff_unique_index": "0", "aff_unique_norm": "Harvard University", "aff_unique_dep": "", "aff_unique_url": "https://www.harvard.edu", "aff_unique_abbr": "Harvard", "aff_country_unique_index": "0", "aff_country_unique": "United States" }, { "id": "5F0WDt9CjA", "title": "PIANO PERFORMANCE EVALUATION DATASET WITH MULTI-LEVEL PERCEPTUAL FEATURES", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "This study aims to build a comprehensive dataset that enables the automatic evaluation of piano performances. In real-world piano performance, especially within the realm of classical piano music, we encounter a vast spectrum of performance variations. The challenge lies in how to effectively evaluate these performances. We must consider three critical aspects: 1) It is essential to gauge how performers\nperceive and express, and listeners perceive the music, not just the compositional characteristics of music such as beat stability measured from a metronome. 2) Beyond fundamental elements like pitch and duration, we must also embrace higher-level features such as interpretation. 3) Such evaluation should be done by experts to discern the nuanced performances. Regrettably, there exists no dataset\nthat addresses these challenging evaluation tasks. Therefore, we introduce a pioneering dataset PercePiano, annotated by music experts, with more extensive features capable of representing these nuanced aspects effectively. It encapsulates piano performance with a wide range of perceptual features that are recognized by musicians. Our evaluation benchmark includes a novel metric designed to\naccommodate the inherent subjectivity of perception. For the baseline models, we pinpoint a significant issue in current transformer-based models. We in response introduce a new baseline that leverages hierarchical levels of performance, which shows results comparable to that of large pre-trained models. 
In conclusion, our research opens new possibilities for comprehensive piano performance evaluation.", "keywords": "dataset;music;perception;piano performance evaluation;hierarchical attention network", "primary_area": "datasets and benchmarks", "supplementary_material": "", "author": "Jisoo Park;Jongho Kim;Jeong Mi Park;Ahyeon Choi;Wen-Syan Li;Jonghwa Park;seung-won hwang", "authorids": "~Jisoo_Park2;~Jongho_Kim2;~Jeong_Mi_Park1;~Ahyeon_Choi1;~Wen-Syan_Li2;~Jonghwa_Park1;~seung-won_hwang2", "gender": "F;;F;F;M;;", "homepage": ";;https://www.researchgate.net/profile/Jeong-Mi-Park;;https://aml.gsds.snu.ac.kr/home;http/joapkcom;http://seungwonh.github.io", "dblp": ";;;;60/5978.html;;h/SeungwonHwang", "google_scholar": ";;;https://scholar.google.co.kr/citations?user=KEXGGRMAAAAJ;;;63bBmc3mYrAC", "orcid": "0009-0009-0857-8927;;;;;;", "linkedin": ";;;;;;", "or_profile": "~Jisoo_Park2;~Jongho_Kim2;~Jeong_Mi_Park1;~Ahyeon_Choi1;~Wen-Syan_Li2;~Jonghwa_Park1;~seung-won_hwang2", "aff": "Seoul National University;;Seoul National University;Seoul National University;Seoul National University;Seoul National University;Seoul National University", "aff_domain": "snu.ac.kr;;snu.ac.kr;snu.ac.kr;snu.ac.kr;snu.ac.kr;snu.ac.kr", "position": "MS student;;Lecturer;PhD student;Full Professor;Full Professor;Full Professor", "bibtex": "@misc{\npark2024piano,\ntitle={{PIANO} {PERFORMANCE} {EVALUATION} {DATASET} {WITH} {MULTI}-{LEVEL} {PERCEPTUAL} {FEATURES}},\nauthor={Jisoo Park and Jongho Kim and Jeong Mi Park and Ahyeon Choi and Wen-Syan Li and Jonghwa Park and seung-won hwang},\nyear={2024},\nurl={https://openreview.net/forum?id=5F0WDt9CjA}\n}", "github": "", "project": "", "reviewers": "iYeg;vNEe;Pd1L;zHsN;ZEzP;sviL", "site": "https://openreview.net/forum?id=5F0WDt9CjA", "pdf_size": 746270, "rating": "3;3;3;3;6;6", "confidence": "4;3;4;4;3;3", "soundness": "3;3;2;2;3;2", "contribution": "2;2;2;2;2;2", "presentation": "2;2;3;2;4;3", "wc_summary": "162;73;31;57;29;9", "wc_strengths": "125;79;34;50;22;9", "wc_weaknesses": "260;243;319;509;51;9", "wc_questions": "3;24;90;27;1;9", "wc_review": "550;419;474;643;103;36", "wc_reply_reviewers": "0;0;0;0;0;0", "wc_reply_authors": "0;0;0;0;0;0", "reply_reviewers": "0;0;0;0;0;0", "reply_authors": "0;0;0;0;0;0", "rating_avg": [ 4.0, 1.4142135623730951 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.6666666666666665, 0.7453559924999299 ], "wc_summary_avg": [ 60.166666666666664, 49.974715829329355 ], "wc_strengths_avg": [ 53.166666666666664, 39.001780586133364 ], "wc_weaknesses_avg": [ 231.83333333333334, 167.1789626584504 ], "wc_questions_avg": [ 25.666666666666668, 30.39554060859732 ], "wc_review_avg": [ 370.8333333333333, 224.7171679145934 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 6, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.7071067811865476, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:F2v9CO1z7x0J:scholar.google.com/&scioq=PIANO+PERFORMANCE+EVALUATION+DATASET+WITH+MULTI-LEVEL+PERCEPTUAL+FEATURES&hl=en&as_sdt=0,44", "gs_version_total": 6, "aff_unique_index": "0;0;0;0;0;0", "aff_unique_norm": "Seoul National University", "aff_unique_dep": "", "aff_unique_url": "https://www.snu.ac.kr", "aff_unique_abbr": "SNU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": 
"South Korea" }, { "id": "5GX6s5TpmV", "title": "The Certification Paradox: Certifications Admit Better Evasion Attacks", "track": "main", "status": "Reject", "tldr": "", "abstract": "In guaranteeing the absence of adversarial examples in bounded spaces, certification mechanisms play an important role in demonstrating neural network robustness. Within this work we ask if certifications themselves can potentially compromise the very models they help to protect? By demonstrating a new attack surface that exploits certified guarantees to construct norm minimising evasion attacks, we demonstrate the heretofore unexplored risks inherent in releasing certifications. Our new *Certification Aware Attack* produces smaller, more difficult to detect adversarial examples more than $74$% of the time than comparable attacks, while reducing the median perturbation norm by more than $10$%. That this is achievable in significantly less computational time highlights an apparent paradox---that releasing certifications can reduce security.", "keywords": "certified robustness;adversarial attacks;risk;randomised smoothing", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "Andrew Craig Cullen;Shijie Liu;Paul Montague;Sarah Monazam Erfani;Benjamin I. P. Rubinstein", "authorids": "~Andrew_Craig_Cullen1;~Shijie_Liu4;~Paul_Montague1;~Sarah_Monazam_Erfani1;~Benjamin_I._P._Rubinstein1", "gender": "M;M;M;;M", "homepage": "https://www.andrewcraigcullen.com;https://github.com/shijiel2;;https://people.eng.unimelb.edu.au/smonazam/;http://www.bipr.net/", "dblp": "238/6828;;50/805;136/0170;90/1092", "google_scholar": "BeXBviIAAAAJ;https://scholar.google.com.au/citations?user=lH5nxwMAAAAJ;;https://scholar.google.com.au/citations?user=Jq9ocx4AAAAJ;https://scholar.google.com.au/citations?user=hMG_gR4AAAAJ", "orcid": "0000-0001-8243-6470;0009-0008-2980-6266;0000-0001-9461-7471;;0000-0002-2947-6980", "linkedin": ";;;;benjaminrubinstein/", "or_profile": "~Andrew_Craig_Cullen1;~Shijie_Liu4;~Paul_Montague1;~Sarah_Monazam_Erfani1;~Benjamin_I._P._Rubinstein1", "aff": "The University of Melbourne;The University of Melbourne;Defence Science and Technology Group;The University of Melbourne;The University of Melbourne", "aff_domain": "unimelb.edu.au;unimelb.edu.au;dst.defence.gov.au;unimelb.edu.au;unimelb.edu.au", "position": "Postdoc;PhD student;Researcher;Associate Professor;Associate Professor", "bibtex": "@misc{\ncullen2024the,\ntitle={The Certification Paradox: Certifications Admit Better Evasion Attacks},\nauthor={Andrew Craig Cullen and Shijie Liu and Paul Montague and Sarah Monazam Erfani and Benjamin I. P. 
Rubinstein},\nyear={2024},\nurl={https://openreview.net/forum?id=5GX6s5TpmV}\n}", "github": "", "project": "", "reviewers": "Kwhk;xpHV;Z9pA;VDGn", "site": "https://openreview.net/forum?id=5GX6s5TpmV", "pdf_size": 1206878, "rating": "1;3;5;6", "confidence": "5;3;3;2", "soundness": "2;2;2;3", "contribution": "3;3;3;3", "presentation": "2;2;3;2", "wc_summary": "524;49;75;207", "wc_strengths": "98;20;37;58", "wc_weaknesses": "213;240;447;34", "wc_questions": "108;68;30;5", "wc_review": "943;377;589;304", "wc_reply_reviewers": "412;174;502;18", "wc_reply_authors": "1345;915;1251;231", "reply_reviewers": "2;1;2;1", "reply_authors": "4;4;3;2", "rating_avg": [ 3.75, 1.920286436967152 ], "confidence_avg": [ 3.25, 1.0897247358851685 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 213.75, 188.87479318320908 ], "wc_strengths_avg": [ 53.25, 29.13224158900238 ], "wc_weaknesses_avg": [ 233.5, 146.4965869909603 ], "wc_questions_avg": [ 52.75, 38.99599338393625 ], "wc_review_avg": [ 553.25, 248.17974836799235 ], "wc_reply_reviewers_avg": [ 276.5, 191.40206372973097 ], "wc_reply_authors_avg": [ 935.5, 437.0271730682201 ], "reply_reviewers_avg": [ 1.5, 0.5 ], "reply_authors_avg": [ 3.25, 0.82915619758885 ], "replies_avg": [ 26, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.9258889211887232, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:IaUUpoRxR7UJ:scholar.google.com/&scioq=The+Certification+Paradox:+Certifications+Admit+Better+Evasion+Attacks&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;1;0;0", "aff_unique_norm": "University of Melbourne;Defence Science and Technology Group", "aff_unique_dep": ";", "aff_unique_url": "https://www.unimelb.edu.au;https://www.dst.defence.gov.au/", "aff_unique_abbr": "UniMelb;DST Group", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "Australia" }, { "id": "5Gt68fnttu", "title": "Dynamic Electroencephalography Representation Learning for Improved Epileptic Seizure Detection", "track": "main", "status": "Reject", "tldr": "", "abstract": "Epileptic seizure is an abnormal brain activity that affects millions of people worldwide. Effectively detecting seizures from electroencephalography (EEG) signals with automated algorithms is essential for seizure diagnosis and treatment. Although much research has been proposed to learn EEG representations, most of them neglect the detection latency when it comes to real-world clinical scenarios where the inputs are streaming. Moreover, they fail to either capture the underlying dynamics of brain activities or localize seizure regions. To this end, we propose an improved seizure detection task named onset detection, which identifies both the presence and the specific timestamps of seizure events, and two new metrics to quantify the timeliness of detection methods. We further introduce the Dynamic Seizure Network, a framework for EEG representation learning, which models the evolutionary brain states and dynamic brain connectivity efficiently. Theoretical analysis and experimental results on three real-world seizure datasets demonstrate that our method outperforms baselines with low time and space complexity. 
Our method can also provide visualizations to assist clinicians in localizing abnormal brain activities for further diagnosis.", "keywords": "Electroencephalography;Epileptic;Seizure;Efficient;Neuroscience", "primary_area": "applications to neuroscience & cognitive science", "supplementary_material": "/attachment/f87e31012249c8580aceb7f4d3a9fc3e054f7790.zip", "author": "Zihang Liu;Haishuai Wang", "authorids": "~Zihang_Liu3;~Haishuai_Wang2", "gender": "M;M", "homepage": "https://github.com/lzhmarkk;https://www.linkedin.com/in/haishuai-wang-b5241775/", "dblp": "193/1470;163/0767", "google_scholar": "https://scholar.google.com.hk/citations?user=05jAWL4AAAAJ;", "orcid": "0000-0002-4114-7960;0000-0003-1617-0920", "linkedin": ";", "or_profile": "~Zihang_Liu3;~Haishuai_Wang2", "aff": "Beihang University;Zhejiang University", "aff_domain": "buaa.edu.cn;zju.edu.cn", "position": "MS student;Research Professor", "bibtex": "@misc{\nliu2024dynamic,\ntitle={Dynamic Electroencephalography Representation Learning for Improved Epileptic Seizure Detection},\nauthor={Zihang Liu and Haishuai Wang},\nyear={2024},\nurl={https://openreview.net/forum?id=5Gt68fnttu}\n}", "github": "", "project": "", "reviewers": "P4gj;Rq1a;UeqT", "site": "https://openreview.net/forum?id=5Gt68fnttu", "pdf_size": 11349966, "rating": "3;5;6", "confidence": "4;4;4", "soundness": "2;3;3", "contribution": "3;2;3", "presentation": "3;3;3", "wc_summary": "81;66;77", "wc_strengths": "26;13;92", "wc_weaknesses": "108;295;25", "wc_questions": "12;161;31", "wc_review": "227;535;225", "wc_reply_reviewers": "0;113;6", "wc_reply_authors": "905;3011;330", "reply_reviewers": "0;2;1", "reply_authors": "3;6;2", "rating_avg": [ 4.666666666666667, 1.247219128924647 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 74.66666666666667, 6.342099196813483 ], "wc_strengths_avg": [ 43.666666666666664, 34.58644564308715 ], "wc_weaknesses_avg": [ 142.66666666666666, 112.91983390392005 ], "wc_questions_avg": [ 68.0, 66.21681558838863 ], "wc_review_avg": [ 329.0, 145.66628527791414 ], "wc_reply_reviewers_avg": [ 39.666666666666664, 51.91231924012728 ], "wc_reply_authors_avg": [ 1415.3333333333333, 1152.467015676467 ], "reply_reviewers_avg": [ 1.0, 0.816496580927726 ], "reply_authors_avg": [ 3.6666666666666665, 1.699673171197595 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:fWvqcbh53SkJ:scholar.google.com/&scioq=Dynamic+Electroencephalography+Representation+Learning+for+Improved+Epileptic+Seizure+Detection&hl=en&as_sdt=0,23", "gs_version_total": 0, "aff_unique_index": "0;1", "aff_unique_norm": "Beihang University;Zhejiang University", "aff_unique_dep": ";", "aff_unique_url": "http://www.buaa.edu.cn/;https://www.zju.edu.cn", "aff_unique_abbr": "BUAA;ZJU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "China" }, { "title": "When Scaling Meets LLM Finetuning: The Effect of Data, Model and Finetuning Method", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19432", "id": "5HCnKDeTws", "author_site": "Biao Zhang, Zhongtao Liu, Colin Cherry, Orhan Firat", "tldr": "", "abstract": "While large language models (LLMs) often adopt finetuning to unlock their capabilities for downstream 
applications, our understanding on the inductive biases (especially the scaling properties) of different finetuning methods is still limited. To fill this gap, we conduct systematic experiments studying whether and how different scaling factors, including LLM model size, pretraining data size, new finetuning parameter size and finetuning data size, affect the finetuning performance. We consider two types of finetuning \u2013 full-model tuning (FMT) and parameter efficient tuning (PET, including prompt tuning and LoRA), and explore their scaling behaviors in the data-limited regime where the LLM model size substantially outweighs the finetuning data size. Based on two sets of pretrained bilingual LLMs from 1B to 16B and experiments on bilingual machine translation and multilingual summarization benchmarks, we find that 1) LLM finetuning follows a powerbased multiplicative joint scaling law between finetuning data size and each other scaling factor; 2) LLM finetuning benefits more from LLM model scaling than pretraining data scaling, and PET parameter scaling is generally ineffective; and 3) the optimal finetuning method is highly task- and finetuning data-dependent. We hope our findings could shed light on understanding, selecting and developing LLM finetuning methods.", "keywords": "LLM finetuning;Scaling Laws;Full-model finetuning;Parameter efficient tuning;Machine Translation;Multilingual Summarization", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Biao Zhang;Zhongtao Liu;Colin Cherry;Orhan Firat", "authorids": "~Biao_Zhang2;zhongtao@google.com;~Colin_Cherry1;~Orhan_Firat1", "gender": "M;;M;M", "homepage": ";;https://sites.google.com/site/colinacherry/;", "dblp": "https://dblp.uni-trier.de/pers/hd/z/Zhang_0002:Biao;;99/6601;120/2225", "google_scholar": "gqPKjaIAAAAJ;;TNr_OWMAAAAJ;https://scholar.google.com.tr/citations?user=dLaR9lgAAAAJ", "orcid": ";;;", "linkedin": ";;colincherry/;", "or_profile": "~Biao_Zhang2;zhongtao@google.com;~Colin_Cherry1;~Orhan_Firat1", "aff": "Google DeepMind;;Google;Google", "aff_domain": "google.com;;google.com;google.com", "position": "Researcher;;Researcher;Research Scientist", "bibtex": "@inproceedings{\nzhang2024when,\ntitle={When Scaling Meets {LLM} Finetuning: The Effect of Data, Model and Finetuning Method},\nauthor={Biao Zhang and Zhongtao Liu and Colin Cherry and Orhan Firat},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=5HCnKDeTws}\n}", "github": "", "project": "", "reviewers": "wU43;gFLk;oDvP;R4DF", "pdf_size": 1266512, "rating": "5;6;8;8", "confidence": "3;3;3;4", "soundness": "3;2;4;3", "contribution": "3;3;3;3", "presentation": "3;3;4;3", "wc_summary": "30;68;71;25", "wc_strengths": "60;34;115;31", "wc_weaknesses": "121;56;181;59", "wc_questions": "4;245;46;30", "wc_review": "215;403;413;145", "wc_reply_reviewers": "13;126;192;0", "wc_reply_authors": "376;849;393;197", "reply_reviewers": "1;1;1;0", "reply_authors": "1;2;1;1", "rating_avg": [ 6.75, 1.299038105676658 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 48.5, 21.10094784600919 ], "wc_strengths_avg": [ 60.0, 33.69718089098849 ], "wc_weaknesses_avg": [ 104.25, 51.34868547489799 ], "wc_questions_avg": [ 81.25, 95.72192799980577 ], "wc_review_avg": [ 294.0, 116.70903992407786 ], 
"wc_reply_reviewers_avg": [ 82.75, 79.87294598297974 ], "wc_reply_authors_avg": [ 453.75, 240.76895044834995 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.5555555555555555, "gs_citation": 135, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=8034468019146020698&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=5HCnKDeTws", "pdf": "https://openreview.net/pdf?id=5HCnKDeTws", "email": "google.com;;google.com;google.com", "author_num": 4, "aff_unique_index": "0;0;0", "aff_unique_norm": "Google", "aff_unique_dep": "Google DeepMind", "aff_unique_url": "https://deepmind.com", "aff_unique_abbr": "DeepMind", "aff_campus_unique_index": "1;1", "aff_campus_unique": ";Mountain View", "aff_country_unique_index": "0;1;1", "aff_country_unique": "United Kingdom;United States" }, { "id": "5HGPR6fg2S", "title": "Normalized Space Alignment: A Versatile Metric for Representation Space Discrepancy Minimization", "track": "main", "status": "Reject", "tldr": "", "abstract": "We introduce a manifold analysis technique for quantifying the discrepancy between two representation spaces. Normalized Space Alignment (NSA) aims to compare pairwise distance between two point clouds. Our technique provides a robust means of comparing representations across different layers and models, with a particular focus on Graph Neural Networks (GNNs) to explore their unique capabilities. We show that our technique acts as a pseudometric, satisfies the properties of a similarity metric, is continuous and differentiable. We also demonstrate that NSA can serve as an effective loss function by utilizing it in autoencoders to preserve representation structure for dimensionality reduction. Furthermore, our empirical analysis showcases that NSA consistently outperforms or matches the results of previous techniques while offering computational efficiency. 
Its versatility extends to robustness analysis and various neural network training and representation learning applications, highlighting its wide applicability and potential to enhance the performance of neural networks.", "keywords": "Deep Learning;Representation Learning;Dimensionality Reduction;Metric Learning;Autoencoders;Similarity Metric;Graph Neural Networks", "primary_area": "visualization or interpretation of learned representations", "supplementary_material": "/attachment/39c7dfd5c7dbd4d6fd9ce095b8b23dec9272d136.zip", "author": "Danish Ebadulla;Ambuj Singh", "authorids": "~Danish_Ebadulla1;~Ambuj_Singh1", "gender": "M;", "homepage": ";", "dblp": "311/5773.html;", "google_scholar": "LNzVTfcAAAAJ;", "orcid": "0000-0002-6635-6080;", "linkedin": "danish-ebadulla-7627a4156/;", "or_profile": "~Danish_Ebadulla1;~Ambuj_Singh1", "aff": "UC Santa Barbara;", "aff_domain": "ucsb.edu;", "position": "PhD student;", "bibtex": "@misc{\nebadulla2024normalized,\ntitle={Normalized Space Alignment: A Versatile Metric for Representation Space Discrepancy Minimization},\nauthor={Danish Ebadulla and Ambuj Singh},\nyear={2024},\nurl={https://openreview.net/forum?id=5HGPR6fg2S}\n}", "github": "", "project": "", "reviewers": "WXtW;wTyL;BYXr;odB3", "site": "https://openreview.net/forum?id=5HGPR6fg2S", "pdf_size": 12475731, "rating": "3;3;3;6", "confidence": "5;2;4;4", "soundness": "2;2;2;3", "contribution": "2;1;2;2", "presentation": "3;1;2;2", "wc_summary": "77;29;92;65", "wc_strengths": "90;17;61;38", "wc_weaknesses": "354;184;319;144", "wc_questions": "191;8;57;2", "wc_review": "712;238;529;249", "wc_reply_reviewers": "129;0;0;16", "wc_reply_authors": "1909;1245;968;822", "reply_reviewers": "1;0;0;1", "reply_authors": "4;2;2;2", "rating_avg": [ 3.75, 1.299038105676658 ], "confidence_avg": [ 3.75, 1.0897247358851685 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 2.0, 0.7071067811865476 ], "wc_summary_avg": [ 65.75, 23.27418097377435 ], "wc_strengths_avg": [ 51.5, 27.13392710243027 ], "wc_weaknesses_avg": [ 250.25, 88.2733680109692 ], "wc_questions_avg": [ 64.5, 76.08712111783439 ], "wc_review_avg": [ 432.0, 199.33263656511446 ], "wc_reply_reviewers_avg": [ 36.25, 53.94615370904584 ], "wc_reply_authors_avg": [ 1236.0, 417.2019894487561 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 2.5, 0.8660254037844386 ], "replies_avg": [ 24, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.13245323570650439, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:MiamZ8MNfdgJ:scholar.google.com/&scioq=Normalized+Space+Alignment:+A+Versatile+Metric+for+Representation+Space+Discrepancy+Minimization&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0", "aff_unique_norm": "University of California, Santa Barbara", "aff_unique_dep": "", "aff_unique_url": "https://www.ucsb.edu", "aff_unique_abbr": "UCSB", "aff_campus_unique_index": "0", "aff_campus_unique": "Santa Barbara", "aff_country_unique_index": "0", "aff_country_unique": "United States" }, { "id": "5HpZZbgdeK", "title": "Efficient calibration as a binary top-versus-all problem for classifiers with many classes", "track": "main", "status": "Reject", "tldr": "", "abstract": "Most classifiers based on deep neural networks associate their class prediction with a probability known as the confidence score. 
This score is often a by-product of the learning step and may not correctly estimate the classification accuracy, which impacts real-world usage. To be reliably used, the confidence score requires a post-processing calibration step. Data-driven methods have been proposed to calibrate the confidence score of already-trained classifiers. Still, many methods fail when the number of classes is high and per-class calibration data is scarce. To deal with a large number of classes, we propose to reformulate the confidence calibration of multiclass classifiers as a single binary classification problem. Our top-versus-all reformulation allows the use of the binary cross-entropy loss for scaling calibration methods. Contrary to the standard one-versus-all reformulation, it also allows the application of binary calibration methods to multiclass classifiers with efficient use of scarce per-class calibration data and without degradation of the accuracy. Additionally, we solve the problem of scaling methods overfitting the calibration set by introducing a regularization loss term during optimization. We evaluate our approach on an extensive list of deep networks and standard image classification datasets (CIFAR-10, CIFAR-100, and ImageNet). We show that it significantly improves the performance of existing calibration methods.", "keywords": "Calibration;Image Classification;Deep Learning;Neural Networks", "primary_area": "probabilistic methods (Bayesian methods, variational inference, sampling, UQ, etc.)", "supplementary_material": "", "author": "Adrien Le Coz;St\u00e9phane Herbin;Faouzi Adjed", "authorids": "~Adrien_Le_Coz1;~St\u00e9phane_Herbin1;~Faouzi_Adjed1", "gender": "M;M;M", "homepage": ";https://stepherbin.github.io/;", "dblp": "281/7439;49/247;", "google_scholar": "z-0Z-AwAAAAJ;https://scholar.google.fr/citations?user=xap7jEQAAAAJ;XikGL6wAAAAJ", "orcid": ";0000-0002-3341-3018;", "linkedin": ";;", "or_profile": "~Adrien_Le_Coz1;~St\u00e9phane_Herbin1;~Faouzi_Adjed1", "aff": "IRT SystemX;ONERA;SystemX", "aff_domain": "irt-systemx.fr;onera.fr;irt-systemx.fr", "position": "PhD student;Research Scientist;Researcher", "bibtex": "@misc{\ncoz2024efficient,\ntitle={Efficient calibration as a binary top-versus-all problem for classifiers with many classes},\nauthor={Adrien Le Coz and St{\\'e}phane Herbin and Faouzi Adjed},\nyear={2024},\nurl={https://openreview.net/forum?id=5HpZZbgdeK}\n}", "github": "", "project": "", "reviewers": "JkUP;75D8;TXd7;fZjD", "site": "https://openreview.net/forum?id=5HpZZbgdeK", "pdf_size": 312845, "rating": "3;5;6;6", "confidence": "3;4;4;3", "soundness": "3;3;3;3", "contribution": "2;2;2;3", "presentation": "2;3;3;2", "wc_summary": "75;43;71;60", "wc_strengths": "81;21;32;70", "wc_weaknesses": "140;2;145;106", "wc_questions": "812;71;325;49", "wc_review": "1108;137;573;285", "wc_reply_reviewers": "232;19;69;193", "wc_reply_authors": "1339;284;1543;596", "reply_reviewers": "1;1;1;2", "reply_authors": "2;1;2;2", "rating_avg": [ 5.0, 1.224744871391589 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 62.25, 12.397076268217438 ], "wc_strengths_avg": [ 51.0, 25.10975905897944 ], "wc_weaknesses_avg": [ 98.25, 57.56029447457683 ], "wc_questions_avg": [ 314.25, 307.1639423825655 ], "wc_review_avg": [ 525.75, 370.922751391715 ], "wc_reply_reviewers_avg": [ 128.25, 87.18192186457007 ], "wc_reply_authors_avg": [ 940.5, 517.5618320548763 ], "reply_reviewers_avg": [ 
1.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.75, 0.4330127018922193 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.40824829046386296, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:JIRXmv3-g9EJ:scholar.google.com/&scioq=Efficient+calibration+as+a+binary+top-versus-all+problem+for+classifiers+with+many+classes&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;1;2", "aff_unique_norm": "IRT SystemX;ONERA;SystemX", "aff_unique_dep": ";;", "aff_unique_url": "https://www.irt-systemx.fr;https://www.onera.fr;", "aff_unique_abbr": ";ONERA;", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "France;" }, { "id": "5IOKw3AQe4", "title": "On the Theoretical Analysis of Dense Contrastive Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "Contrastive learning has achieved outstanding performance in self-supervised learning. However, the canonical image-level matching pretext is unsuitable for multi-object dense prediction tasks like segmentation and detection. Recently, numerous studies have focused on dense contrastive learning (DCL) that adopts patch-level contrast to learning representations aware of local information. Although empirical evidence has validated its superiority, to date, there has not been any theoretical work that could formally explain and guarantee the effectiveness of DCL methods, which hinders their principled development. To bridge this gap, using the language of spectral graph theory, we establish the first theoretical framework for modeling and analyzing DCL by dissecting the corresponding patch-level positive-pair graph. Specifically, by decoupling the image-level and patch-level supervision, we theoretically characterize how different positive pair selection strategies affect the performance of DCL, and verify these insights on both synthetic and real-world datasets. 
Furthermore, drawing inspiration from the theory, we design two unsupervised metrics to guide the selection of positive pairs.", "keywords": "Contrastive Learning;Dense Contrastive Learning", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Lizhe Fang;Yifei Wang;Yisen Wang", "authorids": "~Lizhe_Fang1;~Yifei_Wang1;~Yisen_Wang1", "gender": "M;M;M", "homepage": "https://zero-lab-pku.github.io/;https://yifeiwang77.com;https://yisenwang.github.io/", "dblp": ";00/555-1;172/1346-1", "google_scholar": ";-CLy6YsAAAAJ;uMWPDboAAAAJ", "orcid": ";;", "linkedin": ";;", "or_profile": "~Lizhe_Fang1;~Yifei_Wang1;~Yisen_Wang1", "aff": "Peking University;Massachusetts Institute of Technology;Peking University", "aff_domain": "pku.edu.cn;mit.edu;pku.edu.cn", "position": "PhD student;Postdoc;Assistant Professor", "bibtex": "@misc{\nfang2024on,\ntitle={On the Theoretical Analysis of Dense Contrastive Learning},\nauthor={Lizhe Fang and Yifei Wang and Yisen Wang},\nyear={2024},\nurl={https://openreview.net/forum?id=5IOKw3AQe4}\n}", "github": "", "project": "", "reviewers": "hTKu;MfsU;vGDf", "site": "https://openreview.net/forum?id=5IOKw3AQe4", "pdf_size": 1259978, "rating": "6;6;6", "confidence": "3;4;2", "soundness": "2;2;3", "contribution": "2;2;3", "presentation": "2;1;3", "wc_summary": "60;103;142", "wc_strengths": "27;59;41", "wc_weaknesses": "71;837;51", "wc_questions": "5;105;43", "wc_review": "163;1104;277", "wc_reply_reviewers": "9;670;96", "wc_reply_authors": "216;3548;1101", "reply_reviewers": "1;3;1", "reply_authors": "1;7;4", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 3.0, 0.816496580927726 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.0, 0.816496580927726 ], "wc_summary_avg": [ 101.66666666666667, 33.48963355361709 ], "wc_strengths_avg": [ 42.333333333333336, 13.097921802925667 ], "wc_weaknesses_avg": [ 319.6666666666667, 365.90101879545995 ], "wc_questions_avg": [ 51.0, 41.21488404286329 ], "wc_review_avg": [ 514.6666666666666, 419.31240011343436 ], "wc_reply_reviewers_avg": [ 258.3333333333333, 293.2511248439164 ], "wc_reply_authors_avg": [ 1621.6666666666667, 1409.225871021234 ], "reply_reviewers_avg": [ 1.6666666666666667, 0.9428090415820634 ], "reply_authors_avg": [ 4.0, 2.449489742783178 ], "replies_avg": [ 22, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:G_pGcKMqjH4J:scholar.google.com/&scioq=On+the+Theoretical+Analysis+of+Dense+Contrastive+Learning&hl=en&as_sdt=0,47", "gs_version_total": 0, "aff_unique_index": "0;1;0", "aff_unique_norm": "Peking University;Massachusetts Institute of Technology", "aff_unique_dep": ";", "aff_unique_url": "http://www.pku.edu.cn;https://web.mit.edu", "aff_unique_abbr": "Peking U;MIT", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;0", "aff_country_unique": "China;United States" }, { "id": "5Itc7v0pnA", "title": "Quantile-Free Regression: A Flexible Alternative to Quantile Regression", "track": "main", "status": "Reject", "tldr": "", "abstract": "Constructing valid prediction intervals rather than point estimates is a well-established method for uncertainty quantification in the regression setting. 
Models equipped with this capacity output an interval of values in which the ground truth target will fall with some prespecified probability. This is an essential requirement in many real-world applications in which simple point predictions' inability to convey the magnitude and frequency of errors renders them insufficient for high-stakes decisions. Quantile regression is well-established as a leading approach for obtaining such intervals via the empirical estimation of quantiles in the (non-parametric) distribution of outputs. This method is simple, computationally inexpensive, interpretable, assumption-free, and highly effective. However, it does require that the quantiles being learned are chosen a priori. This results in either (a) intervals that are arbitrarily symmetric around the median which is sub-optimal for real-world skewed distributions or (b) learning an excessive number of intervals. In this work, we propose Quantile-Free Regression (QFR), a direct replacement for quantile regression which liberates it from this limitation whilst maintaining its strengths. We demonstrate that this added flexibility results in intervals with an improvement in desirable qualities (e.g. sharpness) whilst maintaining the essential coverage guarantees of quantile regression.", "keywords": "Quantile regression;interval regression;pinball loss;neural networks", "primary_area": "probabilistic methods (Bayesian methods, variational inference, sampling, UQ, etc.)", "supplementary_material": "/attachment/5443f7f0d63a9813f6460c3ff9fd19c362a3ffd1.zip", "author": "Thomas Pouplin;Alan Jeffares;Nabeel Seedat;Mihaela van der Schaar", "authorids": "~Thomas_Pouplin1;~Alan_Jeffares1;~Nabeel_Seedat1;~Mihaela_van_der_Schaar2", "gender": "M;;;F", "homepage": ";https://alanjeffares.com;;https://www.vanderschaar-lab.com", "dblp": "339/7726;304/1985;227/8368;", "google_scholar": "VVCoRhgAAAAJ;e65kJ08AAAAJ;https://scholar.google.com/citations?hl=en;DZ3S--MAAAAJ", "orcid": ";;;", "linkedin": ";alanjeffares;nabeel-seedat/;", "or_profile": "~Thomas_Pouplin1;~Alan_Jeffares1;~Nabeel_Seedat1;~Mihaela_van_der_Schaar2", "aff": "University of Cambridge;University of Cambridge;AstraZeneca;University of California, Los Angeles", "aff_domain": "cam.ac.uk;cam.ac.uk;astrazeneca.com;ucla.edu", "position": "PhD student;PhD student;Intern;Full Professor", "bibtex": "@misc{\npouplin2024quantilefree,\ntitle={Quantile-Free Regression: A Flexible Alternative to Quantile Regression},\nauthor={Thomas Pouplin and Alan Jeffares and Nabeel Seedat and Mihaela van der Schaar},\nyear={2024},\nurl={https://openreview.net/forum?id=5Itc7v0pnA}\n}", "github": "", "project": "", "reviewers": "eWa2;iRaW;LRPB;ccij;UxpT", "site": "https://openreview.net/forum?id=5Itc7v0pnA", "pdf_size": 685134, "rating": "3;3;5;5;5", "confidence": "4;4;3;4;5", "soundness": "2;2;3;3;2", "contribution": "2;2;3;4;2", "presentation": "3;3;3;2;3", "wc_summary": "85;96;90;53;60", "wc_strengths": "65;106;42;20;58", "wc_weaknesses": "196;182;137;25;35", "wc_questions": "2;101;169;308;508", "wc_review": "348;485;438;406;661", "wc_reply_reviewers": "0;0;69;0;0", "wc_reply_authors": "861;2270;1072;1370;1628", "reply_reviewers": "0;0;1;0;0", "reply_authors": "2;4;3;2;3", "rating_avg": [ 4.2, 0.9797958971132712 ], "confidence_avg": [ 4.0, 0.6324555320336759 ], "soundness_avg": [ 2.4, 0.4898979485566356 ], "contribution_avg": [ 2.6, 0.8 ], "presentation_avg": [ 2.8, 0.39999999999999997 ], "wc_summary_avg": [ 76.8, 17.08098357823694 ], "wc_strengths_avg": [ 58.2, 28.47033543883879 ], 
"wc_weaknesses_avg": [ 115.0, 72.15815962176418 ], "wc_questions_avg": [ 217.6, 176.03704155659966 ], "wc_review_avg": [ 467.6, 106.47178029881908 ], "wc_reply_reviewers_avg": [ 13.8, 27.6 ], "wc_reply_authors_avg": [ 1440.2, 489.8589184653067 ], "reply_reviewers_avg": [ 0.2, 0.4000000000000001 ], "reply_authors_avg": [ 2.8, 0.7483314773547882 ], "replies_avg": [ 23, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:R78nC4QmoI0J:scholar.google.com/&scioq=Quantile-Free+Regression:+A+Flexible+Alternative+to+Quantile+Regression&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;1;2", "aff_unique_norm": "University of Cambridge;AstraZeneca;University of California, Los Angeles", "aff_unique_dep": ";;", "aff_unique_url": "https://www.cam.ac.uk;https://www.astrazeneca.com;https://www.ucla.edu", "aff_unique_abbr": "Cambridge;AZ;UCLA", "aff_campus_unique_index": "0;0;2", "aff_campus_unique": "Cambridge;;Los Angeles", "aff_country_unique_index": "0;0;0;1", "aff_country_unique": "United Kingdom;United States" }, { "title": "An Intuitive Multi-Frequency Feature Representation for SO(3)-Equivariant Networks", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19431", "id": "5JWAOLBxwp", "author_site": "Dongwon Son, Jaehyung Kim, Sanghyeon Son, Beomjoon Kim", "tldr": "", "abstract": "The usage of 3D vision algorithms, such as shape reconstruction, remains limited because they require inputs to be at a fixed canonical rotation. Recently, a simple equivariant network, Vector Neuron (VN) has been proposed that can be easily used with the state-of-the-art 3D neural network (NN) architectures. However, its performance is limited because it is designed to use only three-dimensional features, which is insufficient to capture the details present in 3D data. In this paper, we introduce an equivariant feature representation for mapping a 3D point to a high-dimensional feature space. Our feature can discern multiple frequencies present in 3D data, which, as shown by Tancik et al. (2020), is the key to designing an expressive feature for 3D vision tasks. 
Our representation can be used as an input to VNs, and the results demonstrate that with our feature representation, VN captures more details, overcoming the limitation raised in its original paper.", "keywords": "Equivariant networks;SO(3) Equivariance;Fourier features", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Dongwon Son;Jaehyung Kim;Sanghyeon Son;Beomjoon Kim", "authorids": "~Dongwon_Son1;~Jaehyung_Kim2;~Sanghyeon_Son1;~Beomjoon_Kim2", "gender": "M;;;M", "homepage": "https://dongwon-son.github.io/;;;https://beomjoonkim.github.io/", "dblp": "226/6343;;;88/1505", "google_scholar": "https://scholar.google.co.kr/citations?user=oaUQsWgAAAAJ;;;https://scholar.google.ca/citations?user=dw3rEwgAAAAJ", "orcid": "0000-0003-1446-8125;;;", "linkedin": ";jaehyung-kim-a666551ba/;;", "or_profile": "~Dongwon_Son1;~Jaehyung_Kim2;~Sanghyeon_Son1;~Beomjoon_Kim2", "aff": "KAIST;KAIST;;Korea Advanced Institute of Science & Technology", "aff_domain": "kaist.ac.kr;kaist.ac.kr;;kaist.ac.kr", "position": "PhD student;MS student;;Assistant Professor", "bibtex": "@inproceedings{\nson2024an,\ntitle={An Intuitive Multi-Frequency Feature Representation for {SO}(3)-Equivariant Networks},\nauthor={Dongwon Son and Jaehyung Kim and Sanghyeon Son and Beomjoon Kim},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=5JWAOLBxwp}\n}", "github": "", "project": "", "reviewers": "Jvrz;HjVh;XaCw;79hQ;MkmG", "pdf_size": 3314025, "rating": "5;6;6;6;6", "confidence": "2;2;4;3;3", "soundness": "2;3;3;3;3", "contribution": "3;3;3;3;3", "presentation": "2;2;3;3;3", "wc_summary": "147;82;62;61;48", "wc_strengths": "135;79;76;61;81", "wc_weaknesses": "156;510;183;100;22", "wc_questions": "184;92;3;8;2", "wc_review": "622;763;324;230;153", "wc_reply_reviewers": "0;0;12;26;24", "wc_reply_authors": "1090;2404;636;437;306", "reply_reviewers": "0;0;1;1;1", "reply_authors": "2;5;1;1;1", "rating_avg": [ 5.8, 0.39999999999999997 ], "confidence_avg": [ 2.8, 0.7483314773547882 ], "soundness_avg": [ 2.8, 0.39999999999999997 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 2.6, 0.4898979485566356 ], "wc_summary_avg": [ 80.0, 35.21931288370062 ], "wc_strengths_avg": [ 86.4, 25.295058806019803 ], "wc_weaknesses_avg": [ 194.2, 167.23683804712405 ], "wc_questions_avg": [ 57.8, 71.68374990191292 ], "wc_review_avg": [ 418.4, 234.54006054403584 ], "wc_reply_reviewers_avg": [ 12.4, 11.200000000000001 ], "wc_reply_authors_avg": [ 974.6, 762.5209767606397 ], "reply_reviewers_avg": [ 0.6, 0.48989794855663565 ], "reply_authors_avg": [ 2.0, 1.5491933384829668 ], "replies_avg": [ 22, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.5345224838248488, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6998817567924967616&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 7, "openreview": "https://openreview.net/forum?id=5JWAOLBxwp", "pdf": "https://openreview.net/pdf?id=5JWAOLBxwp", "email": "kaist.ac.kr;kaist.ac.kr;;kaist.ac.kr", "author_num": 4, "aff_unique_index": "0;0;0", "aff_unique_norm": "Korea Advanced Institute of Science and Technology", "aff_unique_dep": "", "aff_unique_url": "https://www.kaist.ac.kr", "aff_unique_abbr": "KAIST", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "South Korea" }, { "id": "5KF3Q79t8B", "title": "Learning An Efficient-And-Rigorous 
Neural Multigrid Solver", "track": "main", "status": "Reject", "tldr": "", "abstract": "Partial Differential Equations (PDEs) and their efficient\nnumerical solutions are of fundamental significance to science and\nengineering involving heavy computation. To date, the historical\nreliance on legacy generic numerical solvers has circumscribed\npossible integration of big data knowledge and exhibits sub-optimal\nefficiency for certain PDE formulations. In contrast, AI-inspired\nneural methods have the potential to learn such knowledge from big data\nand endow numerical solvers with compact structures and high\nefficiency, but still with unconquered challenges including, a lack of\nsound mathematical backbone, no guarantee of correctness or\nconvergence, and low accuracy, thus unable to handle complex, unseen\nscenarios. This paper articulates a mathematically rigorous neural PDE\nsolver by integrating iterative solvers and the Multigrid Method\nwith Convolutional Neural Networks (CNNs). \nOur novel UGrid neural solver, built upon the principled integration of \nU-Net and MultiGrid, manifests\na mathematically rigorous proof of both convergence and correctness,\nand showcases high numerical accuracy and strong generalization power\nto complicated cases not observed during the training phase. In\naddition, we devise a new residual loss metric, which enables\nunsupervised training and affords more stability and a larger solution\nspace over the legacy losses. We conduct extensive experiments on\nPoisson's equations, and our comprehensive evaluations have confirmed\nall of the aforementioned theoretical and numerical advantages.\nFinally, a mathematically-sound proof affords our new method to\ngeneralize to other types of linear PDEs.", "keywords": "Partial Differential Equations;Numerical Solver;Neural Solver;Multigrid Method", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/5d473dd1db48b355b88380959e0f201c7228715f.pdf", "author": "Xi Han;Fei Hou;Hong Qin", "authorids": "~Xi_Han1;~Fei_Hou1;~Hong_Qin1", "gender": "M;M;M", "homepage": ";https://lcs.ios.ac.cn/~houf/;http://www.cs.stonybrook.edu/~qin", "dblp": ";24/3702;79/627-1", "google_scholar": "paSti1kAAAAJ;NWoYRf8AAAAJ;NOcejj8AAAAJ", "orcid": ";;", "linkedin": ";;", "or_profile": "~Xi_Han1;~Fei_Hou1;~Hong_Qin1", "aff": "State University of New York at Stony Brook;Institute of Software, Chinese Academy of Sciences;Stony Brook University (State University of New York, Stony Brook)", "aff_domain": "stonybrook.edu;ios.ac.cn;cs.stonybrook.edu", "position": "PhD student;Associate Professor;Full Professor", "bibtex": "@misc{\nhan2024learning,\ntitle={Learning An Efficient-And-Rigorous Neural Multigrid Solver},\nauthor={Xi Han and Fei Hou and Hong Qin},\nyear={2024},\nurl={https://openreview.net/forum?id=5KF3Q79t8B}\n}", "github": "", "project": "", "reviewers": "pjtp;Ejzh;BHtd;APYK", "site": "https://openreview.net/forum?id=5KF3Q79t8B", "pdf_size": 25176367, "rating": "3;3;5;6", "confidence": "3;4;4;3", "soundness": "4;3;3;3", "contribution": "2;1;3;3", "presentation": "1;3;2;3", "wc_summary": "26;202;62;106", "wc_strengths": "51;147;46;140", "wc_weaknesses": "249;121;451;136", "wc_questions": "31;23;338;165", "wc_review": "357;493;897;547", "wc_reply_reviewers": "0;0;38;0", "wc_reply_authors": "827;1695;1274;379", "reply_reviewers": "0;0;1;0", "reply_authors": "2;2;3;1", "rating_avg": [ 4.25, 1.299038105676658 ], "confidence_avg": [ 3.5, 0.5 ], 
"soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.82915619758885 ], "presentation_avg": [ 2.25, 0.82915619758885 ], "wc_summary_avg": [ 99.0, 65.87108622149782 ], "wc_strengths_avg": [ 96.0, 47.5972688292091 ], "wc_weaknesses_avg": [ 239.25, 131.88702551805466 ], "wc_questions_avg": [ 139.25, 127.8639413595561 ], "wc_review_avg": [ 573.5, 199.1902357044642 ], "wc_reply_reviewers_avg": [ 9.5, 16.454482671904334 ], "wc_reply_authors_avg": [ 1043.75, 491.43024683061583 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 2.0, 0.7071067811865476 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.19245008972987526, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:I15nbenFRvcJ:scholar.google.com/&scioq=Learning+An+Efficient-And-Rigorous+Neural+Multigrid+Solver&hl=en&as_sdt=0,14", "gs_version_total": 0, "aff_unique_index": "0;1;2", "aff_unique_norm": "State University of New York at Stony Brook;Chinese Academy of Sciences;Stony Brook University", "aff_unique_dep": ";Institute of Software;", "aff_unique_url": "https://www.stonybrook.edu;http://www.ios.ac.cn;https://www.stonybrook.edu", "aff_unique_abbr": "SUNY Stony Brook;CAS;SBU", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Stony Brook;", "aff_country_unique_index": "0;1;0", "aff_country_unique": "United States;China" }, { "title": "Implicit Neural Representation Inference for Low-Dimensional Bayesian Deep Learning", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19430", "id": "5KUiMKRebi", "author_site": "Panagiotis Dimitrakopoulos, Giorgos Sfikas, Christophoros Nikou", "tldr": "", "abstract": "Bayesian inference is the standard for providing full predictive distributions with well calibrated uncertainty estimates.\n\tHowever, scaling to a modern, overparameterized deep learning setting \n\ttypically comes at the cost of severe and restrictive approximations, sacrificing model predictive strength.\n\tWith our approach, we factor model parameters as a function of deterministic and probabilistic components;\n\tthe model is solved by combining maximum a posteriori estimation of the former,\n\twith inference over a low-dimensional, Implicit Neural Representation of the latter.\n\tThis results in a solution that combines both predictive accuracy and good calibration,\n\tas it entails inducing stochasticity over the full set of model weights while being comparatively cheap to compute.\n\tExperimentally, our approach compares favorably to the state of the art,\n\tincluding much more expensive methods as well as less expressive posterior approximations over full network parameters.", "keywords": "Bayesian Deep Learning;Implicit neural representations;Probabilistic machine learning;Hypernetworks", "primary_area": "probabilistic methods (Bayesian methods, variational inference, sampling, UQ, etc.)", "supplementary_material": "", "author": "Panagiotis Dimitrakopoulos;Giorgos Sfikas;Christophoros Nikou", "authorids": "~Panagiotis_Dimitrakopoulos2;~Giorgos_Sfikas1;~Christophoros_Nikou1", "gender": ";M;M", "homepage": ";http://www.cs.uoi.gr/~sfikas;https://www.cse.uoi.gr/~cnikou/", "dblp": ";01/747;26/429", "google_scholar": "https://scholar.google.gr/citations?user=Xz0qnGoAAAAJ;X73G9lYAAAAJ;", "orcid": ";0000-0002-7305-2886;", "linkedin": ";giorgos-sfikas-15a30484/;", "or_profile": "~Panagiotis_Dimitrakopoulos2;~Giorgos_Sfikas1;~Christophoros_Nikou1", "aff": "University of Ioannina;University 
of West Attica;University of Ioannina", "aff_domain": "uoi.gr;uniwa.gr;uoi.gr", "position": "PhD student;Assistant Professor;Full Professor", "bibtex": "@inproceedings{\ndimitrakopoulos2024implicit,\ntitle={Implicit Neural Representation Inference for Low-Dimensional Bayesian Deep Learning},\nauthor={Panagiotis Dimitrakopoulos and Giorgos Sfikas and Christophoros Nikou},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=5KUiMKRebi}\n}", "github": "", "project": "", "reviewers": "Ji8X;VEKs;tKmG;wVmX", "pdf_size": 1392743, "rating": "5;5;5;8", "confidence": "4;3;5;4", "soundness": "2;2;3;3", "contribution": "2;3;2;3", "presentation": "2;2;3;4", "wc_summary": "126;108;80;109", "wc_strengths": "43;87;118;20", "wc_weaknesses": "293;275;146;76", "wc_questions": "194;160;198;187", "wc_review": "656;630;542;392", "wc_reply_reviewers": "0;897;19;23", "wc_reply_authors": "1918;3648;2710;1530", "reply_reviewers": "0;3;1;1", "reply_authors": "8;14;9;8", "rating_avg": [ 5.75, 1.299038105676658 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.75, 0.82915619758885 ], "wc_summary_avg": [ 105.75, 16.498105951896417 ], "wc_strengths_avg": [ 67.0, 38.03288051147323 ], "wc_weaknesses_avg": [ 197.5, 90.19562073626413 ], "wc_questions_avg": [ 184.75, 14.821858857781638 ], "wc_review_avg": [ 555.0, 103.15522284402279 ], "wc_reply_reviewers_avg": [ 234.75, 382.44893449975774 ], "wc_reply_authors_avg": [ 2451.5, 811.2057383919322 ], "reply_reviewers_avg": [ 1.25, 1.0897247358851685 ], "reply_authors_avg": [ 9.75, 2.48746859276655 ], "replies_avg": [ 50, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6565143739902807954&as_sdt=40005&sciodt=0,10&hl=en", "gs_version_total": 2, "openreview": "https://openreview.net/forum?id=5KUiMKRebi", "pdf": "https://openreview.net/pdf?id=5KUiMKRebi", "email": "uoi.gr;uniwa.gr;uoi.gr", "author_num": 3, "aff_unique_index": "0;1;0", "aff_unique_norm": "University of Ioannina;University of West Attica", "aff_unique_dep": ";", "aff_unique_url": "https://www.uoi.gr;https://www.uoa.gr", "aff_unique_abbr": "UOI;", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "Greece" }, { "id": "5KcFkhEj4x", "title": "In Search of the Long-Tail: Systematic Generation of Long-Tail Knowledge via Logical Rule Induced Search", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Since large language models (LLMs) have approached human-level performance on many tasks, it has become increasingly harder for researchers to find tasks that are still challenging to the models. Failure cases usually come from the long-tail distribution -- data to which an oracle language model could assign a probability on the lower end of its distribution. Systematically finding evaluation data in the long-tail distribution is important, but current methodology such as prompt engineering or crowdsourcing are insufficient because coming up with long-tail examples is also hard for humans due to our cognitive bias. In this paper, we propose a Logic-Induced-Knowledge-Search (LINK) framework for systematically generating long-tail knowledge statements. 
Grounded by a symbolic logic rule, we search for long-tail values for each variable of the rule by first prompting a large language model, then verifying the correctness of the values with a critic, and lastly pushing for the long-tail distribution with a reranker. Using this framework we construct a dataset, Logic-Induced-Long-Tail (LINT [https://doi.org/10.5281/zenodo.8384878]), consisting of 200 symbolic rules and 40K knowledge statements spanning across four different domains. Human annotations find that 89% of the statements in LINT are factually correct. In contrast, ChatGPT and GPT4 struggle with directly generating long-tail statements under the guidance of logic rules, each only getting 61% and 79% of their statements correct. Moreover, their ``long-tail\" generations in fact fall into the higher likelihood range, and thus are not really long-tail. Our findings suggest that LINK is effective for generating data in the long-tail distribution while enforcing quality. To demonstrate how the community can utilize LINT for systematically evaluating LLMs' capabilities in the long-tail distribution, we challenge the models with a simple entailment classification task using samples from LINT. We find that ChatGPT and GPT4 performances drop by 2% and 4% when reasoning on long-tail knowledge statements compared to on head distribution statements. We hope our work can inspire future research on generating evaluation data in the long-tail distribution.", "keywords": "long-tail;evaluation;generation;large language model;symbolic rule;reasoning", "primary_area": "datasets and benchmarks", "supplementary_material": "", "author": "Huihan Li;Zeyi Liao;Yuting Ning;Siyuan Wang;Xiang Lorraine Li;Ximing Lu;Faeze Brahman;Wenting Zhao;Yejin Choi;Xiang Ren", "authorids": "~Huihan_Li1;~Zeyi_Liao1;~Yuting_Ning1;~Siyuan_Wang1;~Xiang_Lorraine_Li1;~Ximing_Lu1;~Faeze_Brahman1;~Wenting_Zhao1;~Yejin_Choi1;~Xiang_Ren1", "gender": "F;M;;F;F;F;;F;M;F", "homepage": "https://huihanlhh.github.io/;https://lzy37ld.github.io/;https://nnnyt.github.io;https://siyuanwangw.github.io;https://gloriaximinglu.github.io/;https://fabrahman.github.io;;https://yejinc.github.io/;https://shanzhenren.github.io/;https://people.cs.pitt.edu/~xianglli/", "dblp": "309/5929-1;;;12/9626;24/10879;276/6005;41/10049-2.html;89/579-1;36/360-1;40/1491-69", "google_scholar": "NxdcyroAAAAJ;vpv_bHEAAAAJ;HYmzF-QAAAAJ;t_tryJ0AAAAJ;https://scholar.google.com/citations?hl=en;viCG2ikAAAAJ;sycHskQAAAAJ;vhP-tlcAAAAJ;_moJlrIAAAAJ;SRgRwSoAAAAJ", "orcid": ";;;;;;;;;", "linkedin": ";;;;;;;;xren7;", "or_profile": "~Huihan_Li1;~Zeyi_Liao1;~Yuting_Ning1;~Siyuan_Wang1;~Ximing_Lu1;~Faeze_Brahman1;~Wenting_Zhao1;~Yejin_Choi1;~Xiang_Ren1;~Xiang_Li2", "aff": "University of Southern California;Ohio State University, Columbus;University of Science and Technology of China;University of Southern California;University of Washington;Allen Institute for AI;Cornell University;Department of Computer Science, University of Washington;University of Southern California;University of Pittsburgh", "aff_domain": "usc.edu;osu.edu;ustc.edu.cn;usc.edu;cs.washington.edu;allenai.org;cornell.edu;cs.washington.edu;usc.edu;pitt.edu", "position": "PhD student;PhD student;MS student;Postdoc;PhD student;Postdoc;PhD student;Full Professor;Associate Professor;Assistant Professor", "bibtex": "@misc{\nli2024in,\ntitle={In Search of the Long-Tail: Systematic Generation of Long-Tail Knowledge via Logical Rule Induced Search},\nauthor={Huihan Li and Zeyi Liao and Yuting Ning and Siyuan Wang and Xiang 
Lorraine Li and Ximing Lu and Faeze Brahman and Wenting Zhao and Yejin Choi and Xiang Ren},\nyear={2024},\nurl={https://openreview.net/forum?id=5KcFkhEj4x}\n}", "github": "", "project": "", "reviewers": "zFAF;TKVD;tVDU;pztA", "site": "https://openreview.net/forum?id=5KcFkhEj4x", "pdf_size": 4201363, "rating": "3;3;5;8", "confidence": "3;4;4;4", "soundness": "2;2;2;3", "contribution": "2;2;2;4", "presentation": "3;2;3;4", "wc_summary": "146;74;323;171", "wc_strengths": "32;8;7;81", "wc_weaknesses": "211;240;12;49", "wc_questions": "1;2;5;114", "wc_review": "390;324;347;415", "wc_reply_reviewers": "0;0;0;77", "wc_reply_authors": "1161;1047;956;987", "reply_reviewers": "0;0;0;1", "reply_authors": "4;4;4;3", "rating_avg": [ 4.75, 2.0463381929681126 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.8660254037844386 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 178.5, 90.70970179644513 ], "wc_strengths_avg": [ 32.0, 30.008332176247315 ], "wc_weaknesses_avg": [ 128.0, 98.90652152411387 ], "wc_questions_avg": [ 30.5, 48.23121395942673 ], "wc_review_avg": [ 369.0, 35.58791929854849 ], "wc_reply_reviewers_avg": [ 19.25, 33.34197804570089 ], "wc_reply_authors_avg": [ 1037.75, 78.31786194732335 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 3.75, 0.4330127018922193 ], "replies_avg": [ 22, 0 ], "authors#_avg": [ 10, 0 ], "corr_rating_confidence": 0.49374193110101877, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:x3qfXfiSQ_sJ:scholar.google.com/&scioq=In+Search+of+the+Long-Tail:+Systematic+Generation+of+Long-Tail+Knowledge+via+Logical+Rule+Induced+Search&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;1;2;0;3;4;5;3;0;6", "aff_unique_norm": "University of Southern California;Ohio State University;University of Science and Technology of China;University of Washington;Allen Institute for AI;Cornell University;University of Pittsburgh", "aff_unique_dep": ";;;;;;", "aff_unique_url": "https://www.usc.edu;https://www.osu.edu;http://www.ustc.edu.cn;https://www.washington.edu;https://allenai.org;https://www.cornell.edu;https://www.pitt.edu", "aff_unique_abbr": "USC;OSU;USTC;UW;AI2;Cornell;Pitt", "aff_campus_unique_index": "0;1;0;3;0", "aff_campus_unique": "Los Angeles;Columbus;;Seattle", "aff_country_unique_index": "0;0;1;0;0;0;0;0;0;0", "aff_country_unique": "United States;China" }, { "id": "5KckEwghKo", "title": "From Cluster Assumption to Graph Convolution: Graph-based Semi-Supervised Learning Revisited", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Graph-based semi-supervised learning (GSSL) has long been a research focus. Traditional methods are generally shallow learners, based on the cluster assumption. Recently, graph convolutional networks (GCNs) have become the predominant techniques for their promising performance. In this paper, we theoretically discuss the relationship between these two types of methods in a unified optimization framework. One of the most intriguing findings is that, unlike traditional ones, typical GCNs may not effectively incorporate both graph structure and label information at each layer. Motivated by this, we propose three simple but powerful graph convolution methods. The first is a supervised method OGC which guides the graph convolution process with labels. 
The others are two \u201cno-learning\u201d unsupervised methods: GGC and its multi-scale version GGCM, both aiming to preserve the graph structure information during the convolution process. Finally, we conduct extensive experiments to show the effectiveness of our methods.", "keywords": "Graph Convolution Networks;Graph Embedding;Semi-Supervised Learning", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/3fbea7a973a7eefb4404071301d5f3e8ebdb258d.zip", "author": "Zheng Wang;Hongming Ding;Li Pan;Jianhua Li;Zhiguo Gong;Philip S. Yu", "authorids": "~Zheng_Wang24;~Hongming_Ding1;~Li_Pan1;~Jianhua_Li3;~Zhiguo_Gong1;~Philip_S._Yu1", "gender": "M;M;M;M;M;M", "homepage": "https://zhengwang100.github.io/;https://www.nowcoder.com/profile/292263636;https://icst.sjtu.edu.cn/DirectoryDetail.aspx?id=12;https://infosec.sjtu.edu.cn/TeamDetail.aspx?id=9;https://www.fst.um.edu.mo/people/fstzgg/;https://cs.uic.edu/profiles/philip-yu/", "dblp": "181/2834-45;;26/4737;93/3389-1.html;95/6295;y/PhilipSYu", "google_scholar": "Znbe2RgAAAAJ;;;;i75MaGYAAAAJ;D0lL1r0AAAAJ", "orcid": ";;0000-0002-0424-9845;;;0000-0002-3491-5968", "linkedin": ";;;;;", "or_profile": "~Zheng_Wang24;~Hongming_Ding1;~Li_Pan1;~Jianhua_Li3;~Zhiguo_Gong1;~Philip_S._Yu1", "aff": "Shanghai Jiaotong University;NIO;Shanghai Jiaotong University;Shanghai Jiaotong University;University of Macau;University of Illinois Chicago", "aff_domain": "sjtu.edu.cn;nio.com;sjtu.edu.cn;sjtu.edu.cn;um.edu.mo;uic.edu", "position": "Associate Professor;Researcher;Full Professor;Full Professor;Full Professor;Full Professor", "bibtex": "@misc{\nwang2024from,\ntitle={From Cluster Assumption to Graph Convolution: Graph-based Semi-Supervised Learning Revisited},\nauthor={Zheng Wang and Hongming Ding and Li Pan and Jianhua Li and Zhiguo Gong and Philip S. 
Yu},\nyear={2024},\nurl={https://openreview.net/forum?id=5KckEwghKo}\n}", "github": "", "project": "", "reviewers": "9Ae7;2zfL;seo4;WdoQ", "site": "https://openreview.net/forum?id=5KckEwghKo", "pdf_size": 898400, "rating": "3;3;5;5", "confidence": "4;4;3;4", "soundness": "2;2;2;2", "contribution": "1;1;2;2", "presentation": "2;1;2;3", "wc_summary": "46;63;84;91", "wc_strengths": "18;11;42;68", "wc_weaknesses": "162;166;345;90", "wc_questions": "34;3;67;2", "wc_review": "260;243;538;251", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 1.5, 0.5 ], "presentation_avg": [ 2.0, 0.7071067811865476 ], "wc_summary_avg": [ 71.0, 17.7341478509682 ], "wc_strengths_avg": [ 34.75, 22.37604746151563 ], "wc_weaknesses_avg": [ 190.75, 94.05151513931075 ], "wc_questions_avg": [ 26.5, 26.688012290165037 ], "wc_review_avg": [ 323.0, 124.27590273258932 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 14, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=8502318163900352528&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 6, "aff_unique_index": "0;1;0;0;2;3", "aff_unique_norm": "Shanghai Jiao Tong University;NIO;University of Macau;University of Illinois at Chicago", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.sjtu.edu.cn;;https://www.um.edu.mo;https://www.uic.edu", "aff_unique_abbr": "SJTU;;UM;UIC", "aff_campus_unique_index": "1;2", "aff_campus_unique": ";Macau SAR;Chicago", "aff_country_unique_index": "0;0;0;0;2", "aff_country_unique": "China;;United States" }, { "title": "MMICL: Empowering Vision-language Model with Multi-Modal In-Context Learning", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19429", "id": "5KojubHBr8", "author_site": "Haozhe Zhao, Zefan Cai, Shuzheng Si, Xiaojian Ma, Kaikai An, Liang Chen, Zixuan Liu, Sheng Wang, Wenjuan Han, Baobao Chang", "tldr": "", "abstract": "Since the resurgence of deep learning, vision-language models (VLMs) enhanced by large language models (LLMs) have grown exponentially in popularity. \nHowever, while LLMs can utilize extensive background knowledge and task information with in-context learning, most VLMs still struggle with understanding complex multi-modal prompts with multiple images, making VLMs less effective in downstream vision-language tasks.\nIn this paper, we address the limitation above by 1) introducing vision-language Model with **M**ulti-**M**odal **I**n-**C**ontext **L**earning(MMICL), a new approach to allow the VLM to deal with multi-modal inputs efficiently; 2) proposing a novel context scheme to augment the in-context learning ability of the VLM; 3) constructing the Multi-modal In-Context Learning (MIC) dataset, designed to enhance the VLM's ability to understand complex multi-modal prompts.\nOur experiments confirm that MMICL achieves new state-of-the-art zero-shot performance on a wide range of general vision-language tasks, especially for complex benchmarks, including MME and MMBench. Our analysis demonstrates that MMICL effectively tackles the challenge of complex multi-modal prompt understanding and emerges the impressive ICL ability. 
Furthermore, we observe that MMICL successfully alleviates language bias in VLMs, a common issue for VLMs that often leads to hallucination when faced with extensive textual context.\nOur code, dataset, dataset tool, and model are available at https://github.com/PKUnlp-icler/MIC.", "keywords": "multi-modal in-context learning; multi-modal instruction tuning; vision-language model", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Haozhe Zhao;Zefan Cai;Shuzheng Si;Xiaojian Ma;Kaikai An;Liang Chen;Zixuan Liu;Sheng Wang;Wenjuan Han;Baobao Chang", "authorids": "~Haozhe_Zhao1;~Zefan_Cai1;~Shuzheng_Si1;~Xiaojian_Ma1;~Kaikai_An1;~Liang_Chen10;~Zixuan_Liu1;~Sheng_Wang7;~Wenjuan_Han1;~Baobao_Chang1", "gender": "M;;M;;M;M;M;;F;M", "homepage": ";;;;https://github.com/kkk-an;https://chenllliang.github.io;;http://homes.cs.washington.edu/~swang;https://scholar.google.com/citations?user=rfVLLfAAAAAJ;http://eecs.pku.edu.cn/EN/People/Faculty/Detail/?ID=6027", "dblp": "299/7199;;324/3680;;;01/5394-24;;;188/9071;91/6051", "google_scholar": "skIXywUAAAAJ;;https://scholar.google.com.hk/citations?user=zO2XyZUAAAAJ;;6TrBRiEAAAAJ;lMKPaTYAAAAJ;yjKOHbEAAAAJ;;rfVLLfAAAAAJ;LaKNyhQAAAAJ", "orcid": "0000-0003-0502-4426;;;;;;;;0000-0002-2327-0842;0000-0003-2824-6750", "linkedin": ";;;;;;;;;", "or_profile": "~Haozhe_Zhao1;~Zefan_Cai1;~Shuzheng_Si1;~Xiaojian_Ma1;~Kaikai_An1;~Liang_Chen10;~Zixuan_Liu1;~Sheng_Wang7;~Wenjuan_Han1;~Baobao_Chang1", "aff": "Peking University;;Peking University;;Peking University;Peking University;University of Washington;University of Washington, Seattle;Beijing Jiaotong University;Peking University", "aff_domain": "pku.edu.cn;;pku.edu.cn;;pku.edu.cn;pku.edu.cn;uw.edu;uw.edu;bjtu.edu.cn;pku.edu.cn", "position": "MS student;;MS student;;MS student;PhD student;PhD student;Assistant Professor;Associate Professor;Associate Professor", "bibtex": "@inproceedings{\nzhao2024mmicl,\ntitle={{MMICL}: Empowering Vision-language Model with Multi-Modal In-Context Learning},\nauthor={Haozhe Zhao and Zefan Cai and Shuzheng Si and Xiaojian Ma and Kaikai An and Liang Chen and Zixuan Liu and Sheng Wang and Wenjuan Han and Baobao Chang},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=5KojubHBr8}\n}", "github": "", "project": "", "reviewers": "eWon;7yvn;d1dY;iVLP;QUmJ", "pdf_size": 8910437, "rating": "3;5;6;6;8", "confidence": "4;5;5;4;4", "soundness": "2;3;3;4;3", "contribution": "2;3;2;3;3", "presentation": "1;3;2;2;3", "wc_summary": "106;155;49;117;48", "wc_strengths": "34;109;35;97;20", "wc_weaknesses": "474;404;81;91;77", "wc_questions": "53;83;2;146;4", "wc_review": "667;751;167;451;149", "wc_reply_reviewers": "501;292;0;187;0", "wc_reply_authors": "6009;2965;1415;3120;707", "reply_reviewers": "1;2;0;1;0", "reply_authors": "10;8;4;6;2", "rating_avg": [ 5.6, 1.624807680927192 ], "confidence_avg": [ 4.4, 0.48989794855663565 ], "soundness_avg": [ 3.0, 0.6324555320336759 ], "contribution_avg": [ 2.6, 0.4898979485566356 ], "presentation_avg": [ 2.2, 0.7483314773547882 ], "wc_summary_avg": [ 95.0, 41.30375285612676 ], "wc_strengths_avg": [ 59.0, 36.51301137950689 ], "wc_weaknesses_avg": [ 225.4, 175.8619913454866 ], "wc_questions_avg": [ 57.6, 53.7497906972669 ], "wc_review_avg": [ 437.0, 248.00645152898744 ], "wc_reply_reviewers_avg": [ 196.0, 189.2902533148498 ], "wc_reply_authors_avg": [ 2843.2, 1828.4883811498503 ], 
"reply_reviewers_avg": [ 0.8, 0.7483314773547883 ], "reply_authors_avg": [ 6.0, 2.8284271247461903 ], "replies_avg": [ 42, 0 ], "authors#_avg": [ 10, 0 ], "corr_rating_confidence": -0.05025189076296061, "gs_citation": 56, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=18220756047687730171&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=5KojubHBr8", "pdf": "https://openreview.net/pdf?id=5KojubHBr8", "email": "pku.edu.cn;;pku.edu.cn;;pku.edu.cn;pku.edu.cn;uw.edu;uw.edu;bjtu.edu.cn;pku.edu.cn", "author_num": 10, "aff_unique_index": "0;0;0;0;1;1;2;0", "aff_unique_norm": "Peking University;University of Washington;Beijing Jiao Tong University", "aff_unique_dep": ";;", "aff_unique_url": "http://www.pku.edu.cn;https://www.washington.edu;http://www.njtu.edu.cn/en", "aff_unique_abbr": "Peking U;UW;BJTU", "aff_campus_unique_index": "1", "aff_campus_unique": ";Seattle", "aff_country_unique_index": "0;0;0;0;1;1;0;0", "aff_country_unique": "China;United States" }, { "id": "5LhYYajlqV", "title": "In-Context Unlearning: Language Models as Few Shot Unlearners", "track": "main", "status": "Reject", "tldr": "", "abstract": "Machine unlearning has garnered increased attention within regulatory contexts, driven by the need to comply with the \"Right to be Forgotten''. However, achieving precise unlearning is computationally infeasible for large models, particularly when dealing with large language models (LLMs). To this end, several algorithms which approximate the removal of training data without retraining the model have been proposed which rely on gradient ascent based model updates. In this work, we propose a new class of unlearning methods called \"In-Context Unlearning'' suitable for LLMs by providing inputs in context and without having to update model parameters. To unlearn a particular training instance, we provide the instance alongside a different label and additional correctly labelled instances as inputs to the LLM at inference time. 
Our experimental results across various text classification tasks demonstrate that these contexts effectively remove specific information from the training set while maintaining performance levels that are competitive with state-of-the-art unlearning methods that require access to the LLM parameters.", "keywords": "Machine unlearning;In-context unlearning;Right to be forgotten;Approximate data deletion", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/02cc08f0314c30511359ffc5f1219cd39d017f78.zip", "author": "Martin Pawelczyk;Seth Neel;Himabindu Lakkaraju", "authorids": "~Martin_Pawelczyk1;~Seth_Neel2;~Himabindu_Lakkaraju1", "gender": "M;F;M", "homepage": "https://sites.google.com/view/martinpawelczyk/;http://web.stanford.edu/~himalv;https://sethneel.com", "dblp": "251/3229;68/9376;188/6406", "google_scholar": "oYAf_hgAAAAJ;;", "orcid": ";;", "linkedin": ";;", "or_profile": "~Martin_Pawelczyk1;~Hima_Lakkaraju1;~Seth_Neel1", "aff": "Harvard University;Harvard University;Harvard University", "aff_domain": "harvard.edu;harvard.edu;harvard.edu", "position": "Postdoc;Assistant Professor;Assistant Professor", "bibtex": "@misc{\npawelczyk2024incontext,\ntitle={In-Context Unlearning: Language Models as Few Shot Unlearners},\nauthor={Martin Pawelczyk and Seth Neel and Himabindu Lakkaraju},\nyear={2024},\nurl={https://openreview.net/forum?id=5LhYYajlqV}\n}", "github": "", "project": "", "reviewers": "fKNk;Awru;poKX", "site": "https://openreview.net/forum?id=5LhYYajlqV", "pdf_size": 15565023, "rating": "5;5;6", "confidence": "4;3;2", "soundness": "3;3;3", "contribution": "3;2;3", "presentation": "2;3;3", "wc_summary": "240;54;61", "wc_strengths": "90;81;24", "wc_weaknesses": "600;216;32", "wc_questions": "311;13;89", "wc_review": "1241;364;206", "wc_reply_reviewers": "130;0;0", "wc_reply_authors": "2149;1608;659", "reply_reviewers": "1;0;0", "reply_authors": "4;3;1", "rating_avg": [ 5.333333333333333, 0.4714045207910317 ], "confidence_avg": [ 3.0, 0.816496580927726 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 118.33333333333333, 86.07877529075071 ], "wc_strengths_avg": [ 65.0, 29.223278392404914 ], "wc_weaknesses_avg": [ 282.6666666666667, 236.62816588244286 ], "wc_questions_avg": [ 137.66666666666666, 126.43136038534463 ], "wc_review_avg": [ 603.6666666666666, 455.2554838280979 ], "wc_reply_reviewers_avg": [ 43.333333333333336, 61.282587702834114 ], "wc_reply_authors_avg": [ 1472.0, 615.844677387624 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 2.6666666666666665, 1.247219128924647 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.8660254037844385, "gs_citation": 113, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5161391496565915695&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 7, "aff_unique_index": "0;0;0", "aff_unique_norm": "Harvard University", "aff_unique_dep": "", "aff_unique_url": "https://www.harvard.edu", "aff_unique_abbr": "Harvard", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "title": "Multiscale Positive-Unlabeled Detection of AI-Generated Texts", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19428", "id": "5Lp6qU9hzV", "author_site": "Yuchuan Tian, 
Hanting Chen, Xutao Wang, Zheyuan Bai, QINGHUA ZHANG, Ruifeng Li, Chao Xu, Yunhe Wang", "tldr": "", "abstract": "Recent releases of Large Language Models (LLMs), e.g. ChatGPT, are astonishing at generating human-like texts, but they may impact the authenticity of texts. Previous works proposed methods to detect these AI-generated texts, including simple ML classifiers, pretrained-model-based zero-shot methods, and finetuned language classification models. However, mainstream detectors always fail on short texts, like SMSes, Tweets, and reviews. In this paper, a Multiscale Positive-Unlabeled (MPU) training framework is proposed to address the difficulty of short-text detection without sacrificing long-texts. Firstly, we acknowledge the human-resemblance property of short machine texts, and rephrase AI text detection as a partial Positive-Unlabeled (PU) problem by regarding these short machine texts as partially \"unlabeled\". Then in this PU context, we propose the length-sensitive Multiscale PU Loss, where a recurrent model in abstraction is used to estimate positive priors of scale-variant corpora. Additionally, we introduce a Text Multiscaling module to enrich training corpora. Experiments show that our MPU method augments detection performance on long AI-generated texts, and significantly improves short-text detection of language model detectors. Language Models trained with MPU could outcompete existing detectors on various short-text and long-text detection benchmarks. The codes are available at https://github.com/mindspore-lab/mindone/tree/master/examples/detect_chatgpt and https://github.com/YuchuanTian/AIGC_text_detector.", "keywords": "Large Language Models;AI-Generated Texts;Positive-Unlabeled Learning", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/c5966f7285ade08785ad31f1ed8f09767d83fc05.pdf", "author": "Yuchuan Tian;Hanting Chen;Xutao Wang;Zheyuan Bai;QINGHUA ZHANG;Ruifeng Li;Chao Xu;Yunhe Wang", "authorids": "~Yuchuan_Tian1;~Hanting_Chen1;~Xutao_Wang1;~Zheyuan_Bai2;~QINGHUA_ZHANG1;~Ruifeng_Li3;~Chao_Xu1;~Yunhe_Wang1", "gender": "M;M;M;M;F;M;M;M", "homepage": ";;;;https://www.facebook.com/qinghua.zhang.395;https://www.zhihu.com/people/risenberg;http://www.cis.pku.edu.cn/faculty/vision/xuchao/xuchao01.htm;https://www.wangyunhe.site/", "dblp": "193/6675;232/2060;;;;;;63/8217-1", "google_scholar": ";https://scholar.google.com/citations?hl=zh-CN;https://scholar.google.com/citations?hl=en;;;;https://scholar.google.co.uk/citations?hl=zh-CN;https://scholar.google.com.sg/citations?user=isizOkYAAAAJ", "orcid": ";;;;;;;0000-0002-0142-509X", "linkedin": ";;;zheyuanbai/;;;;", "or_profile": "~Yuchuan_Tian1;~Hanting_Chen1;~Xutao_Wang1;~Zheyuan_Bai2;~QINGHUA_ZHANG1;~Ruifeng_Li3;~Chao_Xu1;~Yunhe_Wang1", "aff": "Peking University;Huawei Technologies Ltd.;;Huawei Technologies Ltd.;;;Peking University;Huawei Noah's Ark Lab", "aff_domain": "pku.edu.cn;huawei.com;;huawei.com;;;pku.edu;huawei.com", "position": "PhD student;Researcher;;Researcher;;;Full Professor;Principal Researcher", "bibtex": "@inproceedings{\ntian2024multiscale,\ntitle={Multiscale Positive-Unlabeled Detection of {AI}-Generated Texts},\nauthor={Yuchuan Tian and Hanting Chen and Xutao Wang and Zheyuan Bai and QINGHUA ZHANG and Ruifeng Li and Chao Xu and Yunhe Wang},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=5Lp6qU9hzV}\n}", "github": "", 
"project": "", "reviewers": "vhmU;PQsn;scbq;o5iQ", "pdf_size": 351998, "rating": "6;6;6;8", "confidence": "4;5;4;2", "soundness": "3;3;3;3", "contribution": "4;3;3;3", "presentation": "3;2;4;3", "wc_summary": "84;157;100;83", "wc_strengths": "94;66;88;97", "wc_weaknesses": "139;169;81;120", "wc_questions": "4;18;108;99", "wc_review": "321;410;377;399", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "130;733;614;383", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 6.5, 0.8660254037844386 ], "confidence_avg": [ 3.75, 1.0897247358851685 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 3.25, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 106.0, 30.20761493398643 ], "wc_strengths_avg": [ 86.25, 12.132085558550928 ], "wc_weaknesses_avg": [ 127.25, 31.90905044027478 ], "wc_questions_avg": [ 57.25, 46.622821664931436 ], "wc_review_avg": [ 376.75, 34.310166131920724 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 465.0, 230.74553083429373 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": -0.9271726499455306, "gs_citation": 42, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11859119720528962574&as_sdt=80000005&sciodt=0,23&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=5Lp6qU9hzV", "pdf": "https://openreview.net/pdf?id=5Lp6qU9hzV", "email": "pku.edu.cn;huawei.com;;huawei.com;;;pku.edu;huawei.com", "author_num": 8, "aff_unique_index": "0;1;1;0;1", "aff_unique_norm": "Peking University;Huawei", "aff_unique_dep": ";Huawei Technologies", "aff_unique_url": "http://www.pku.edu.cn;https://www.huawei.com", "aff_unique_abbr": "Peking U;Huawei", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "China" }, { "id": "5Lt6sBoemN", "title": "When and Why Momentum Accelerates SGD: An Empirical Study", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Momentum has become a crucial component in deep learning optimizers, necessitating a comprehensive understanding of when and why it accelerates stochastic gradient descent (SGD). To address the question of ''when'', we establish a meaningful comparison framework that examines the performance of SGD with Momentum (SGDM) under the \\emph{effective learning rates} $\\eta_{ef}$, and offers a holistic view of the momentum acceleration effect. In the comparison of SGDM and SGD with the same effective learning rate and the same batch size, we observe a consistent pattern: when $\\eta_{ef}$ is small, SGDM and SGD experience almost the same empirical training losses; when $\\eta_{ef}$ surpasses a certain threshold, SGDM begins to perform better than SGD. Furthermore, we observe that the advantage of SGDM over SGD becomes more pronounced with a larger batch size. For the question of ``why'', we find that the momentum acceleration is closely related to \\emph{edge of stability} (EoS), a recently discovered phenomenon describing that the sharpness (largest eigenvalue of the Hessian) of the training trajectory often oscillates around the stability threshold. Specifically, the misalignment between SGD and SGDM happens at the same moment that SGD enters the EoS regime and converges slower. Momentum improves the performance of SGDM by preventing or deferring the occurrence of EoS. 
Together, this study unveils the interplay between momentum, learning rates, and batch sizes, thus improving our understanding of momentum acceleration.", "keywords": "Momentum;Optimization", "primary_area": "optimization", "supplementary_material": "", "author": "Jingwen Fu;Bohan Wang;Huishuai Zhang;Zhizheng Zhang;Zhi-Ming Ma;Wei Chen;Nanning Zheng", "authorids": "~Jingwen_Fu1;~Bohan_Wang1;~Huishuai_Zhang3;~Zhizheng_Zhang1;~Zhi-Ming_Ma1;~Wei_Chen1;~Nanning_Zheng1", "gender": "M;M;M;;F;M;M", "homepage": "https://www.jw-fu.cn/;https://bhwangfy.github.io/;;http://homepage.amss.ac.cn/research/homePage/8eb59241e2e74d828fb84eec0efadba5/myHomePage.html;https://weichen-cas.github.io/;;https://huishuai-git.github.io", "dblp": "247/5290;202/1184;67/4758;;;07/256-1;144/7537", "google_scholar": ";LfkHCEUAAAAJ;X7M0I8kAAAAJ;;https://scholar.google.com/citations?hl=en;https://scholar.google.com/citations?hl=zh-CN;w1srHyIAAAAJ", "orcid": ";;;;;;", "linkedin": ";;;;;;", "or_profile": "~Jingwen_Fu1;~Bohan_Wang1;~Zhizheng_Zhang1;~Zhi-Ming_Ma1;~Wei_Chen1;~Nanning_Zheng1;~Huishuai_Zhang2", "aff": "Microsoft;Microsoft Research Asia, University of Science and Technology of China;Beijing Galbot Co., Ltd;Academy of Mathematics and Systems Science, Chinese Academy of Sciences, Chinese Academy of Sciences; Chinese Academy of Sciences;Xi'an Jiaotong University;Peking University", "aff_domain": "microsoft.com;ustc.edu.cn;galbot.com;amss.ac.cn;ict.ac.cn;xjtu.edu.cn;pku.edu.cn", "position": "Intern;PhD student;Principal Researcher;Full Professor;Full Professor;Full Professor;Assistant Professor", "bibtex": "@misc{\nfu2024when,\ntitle={When and Why Momentum Accelerates {SGD}: An Empirical Study},\nauthor={Jingwen Fu and Bohan Wang and Huishuai Zhang and Zhizheng Zhang and Zhi-Ming Ma and Wei Chen and Nanning Zheng},\nyear={2024},\nurl={https://openreview.net/forum?id=5Lt6sBoemN}\n}", "github": "", "project": "", "reviewers": "GteF;PhKt;Dpus;euxD", "site": "https://openreview.net/forum?id=5Lt6sBoemN", "pdf_size": 1628764, "rating": "3;3;3;6", "confidence": "4;3;4;3", "soundness": "2;2;1;3", "contribution": "2;2;2;3", "presentation": "1;2;3;3", "wc_summary": "81;10;82;112", "wc_strengths": "42;44;21;61", "wc_weaknesses": "767;230;248;145", "wc_questions": "86;73;5;39", "wc_review": "976;357;356;357", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 3.75, 1.299038105676658 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.0, 0.7071067811865476 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.25, 0.82915619758885 ], "wc_summary_avg": [ 71.25, 37.49249924984996 ], "wc_strengths_avg": [ 42.0, 14.19506956657839 ], "wc_weaknesses_avg": [ 347.5, 245.30236444029643 ], "wc_questions_avg": [ 50.75, 31.499007920885383 ], "wc_review_avg": [ 511.5, 268.179510775898 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 12, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=7255542862177271988&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "aff_unique_index": "0;0;1;2;2;3;4", "aff_unique_norm": "Microsoft;Galbot;Chinese Academy of Sciences;Xi'an Jiao Tong University;Peking University", "aff_unique_dep": "Microsoft Corporation;;Academy of Mathematics and Systems Science;;", "aff_unique_url": 
"https://www.microsoft.com;;http://www.cas.cn;https://www.xjtu.edu.cn;http://www.pku.edu.cn", "aff_unique_abbr": "Microsoft;;CAS;XJTU;Peking U", "aff_campus_unique_index": "1", "aff_campus_unique": ";Asia", "aff_country_unique_index": "0;1;1;1;1;1;1", "aff_country_unique": "United States;China" }, { "id": "5M2MjyNR2w", "title": "Adaptive Expansion for Hypergraph Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "Hypergraph, with its powerful ability to capture higher-order complex relationships, has attracted substantial attention recently. Consequently, an increasing number of hypergraph neural networks (HyGNNs) have emerged to model the high-order relationships among nodes and hyperedges. In general, most HyGNNs leverage typical expansion methods, such as clique expansion (CE), to convert hypergraphs into graphs for representation learning. However, they still face the following limitations in hypergraph expansion: (i) Some expansion methods expand hypergraphs in a straightforward manner, resulting in information loss and redundancy; (ii) Most expansion methods often employ fixed edge weights while ignoring the fact that nodes having similar attribute features within the same hyperedge are more likely to be connected compared with nodes with dissimilar features. In light of these challenges, we design a novel CE-based \\textbf{Ad}aptive \\textbf{E}xpansion method called \\textbf{AdE} to expand hypergraphs into weighted graphs that preserve the higher-order hypergraph structure information. Specifically, we first introduce a Global Simulation Network to pick two representative nodes for symbolizing each hyperedge in an adaptive manner. We then connect the rest of the nodes within the same hyperedge to the corresponding selected nodes. Instead of leveraging the fixed edge weights, we further design a distance-aware kernel function to dynamically adjust the edge weights to make sure that node pairs having similar attribute features within the corresponding hyperedge are more likely to be connected with large weights. After obtaining the adaptive weighted graphs, we employ graph neural networks to model the rich relationships among nodes for downstream tasks. 
Extensive theoretical justifications and empirical experiments over five benchmark hypergraph datasets demonstrate that AdE has excellent rationality, generalization, and effectiveness compared to classic expansion models.", "keywords": "Hypergraph;Hypergraph Expansion.", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/1533602913af5d7fadac0d73ba5241d98959bb5d.zip", "author": "Yiyue Qian;Tianyi Ma;Chuxu Zhang;Yanfang Ye", "authorids": "~Yiyue_Qian2;~Tianyi_Ma3;~Chuxu_Zhang2;~Yanfang_Ye1", "gender": ";M;;", "homepage": "https://yiyueqian.github.io/;https://tianyi-billy-ma.github.io/;;http://yes-lab.org/", "dblp": "261/9059;;;", "google_scholar": "c6c81_kAAAAJ;https://scholar.google.com/citations?hl=en;;egjr888AAAAJ", "orcid": "0000-0001-7924-5438;0009-0003-3790-8469;;", "linkedin": "yiyue-qian-224655212/;Tianyi-Ma-03BILLY;;", "or_profile": "~Yiyue_Qian2;~Tianyi_Ma3;~Chuxu_Zhang2;~Yanfang_Ye1", "aff": "University of Notre Dame;University of Notre Dame;;University of Notre Dame", "aff_domain": "nd.edu;nd.edu;;nd.edu", "position": "PhD student;PhD student;;Associate Professor", "bibtex": "@misc{\nqian2024adaptive,\ntitle={Adaptive Expansion for Hypergraph Learning},\nauthor={Yiyue Qian and Tianyi Ma and Chuxu Zhang and Yanfang Ye},\nyear={2024},\nurl={https://openreview.net/forum?id=5M2MjyNR2w}\n}", "github": "", "project": "", "reviewers": "qSDB;7Lez;1ZMR;UEpe", "site": "https://openreview.net/forum?id=5M2MjyNR2w", "pdf_size": 3900555, "rating": "3;5;6;8", "confidence": "5;3;3;5", "soundness": "2;3;2;3", "contribution": "2;2;2;3", "presentation": "2;3;2;3", "wc_summary": "44;184;55;104", "wc_strengths": "70;54;47;112", "wc_weaknesses": "223;229;132;175", "wc_questions": "2;2;113;73", "wc_review": "339;469;347;464", "wc_reply_reviewers": "669;359;34;23", "wc_reply_authors": "4815;3715;3357;1729", "reply_reviewers": "2;2;1;1", "reply_authors": "12;8;6;4", "rating_avg": [ 5.5, 1.8027756377319946 ], "confidence_avg": [ 4.0, 1.0 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 96.75, 55.20586472468301 ], "wc_strengths_avg": [ 70.75, 25.232667318379164 ], "wc_weaknesses_avg": [ 189.75, 39.36607041603213 ], "wc_questions_avg": [ 47.5, 47.64714052280577 ], "wc_review_avg": [ 404.75, 61.84001536222319 ], "wc_reply_reviewers_avg": [ 271.25, 266.37414945898934 ], "wc_reply_authors_avg": [ 3404.0, 1106.2861293535232 ], "reply_reviewers_avg": [ 1.5, 0.5 ], "reply_authors_avg": [ 7.5, 2.958039891549808 ], "replies_avg": [ 43, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11623038287928215160&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 2, "aff_unique_index": "0;0;0", "aff_unique_norm": "University of Notre Dame", "aff_unique_dep": "", "aff_unique_url": "https://www.nd.edu", "aff_unique_abbr": "Notre Dame", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "5MlPrLO52d", "title": "Neural Tangent Kernels for Axis-Aligned Tree Ensembles", "track": "main", "status": "Reject", "tldr": "", "abstract": "While axis-aligned rules are known to induce an important inductive bias in machine learning models such as typical hard decision tree ensembles, theoretical understanding of the learning behavior is largely unrevealed due to the discrete 
nature of rules. To address this issue, we impose the axis-aligned constraint on soft trees, which relax the splitting process of decision trees and are trained using a gradient method, and present their Neural Tangent Kernel (NTK) that enables us to analytically describe the training behavior. We study two cases: imposing the axis-aligned constraint throughout the entire training process, or only at the initial state. Moreover, we extend the NTK framework to handle various tree architectures simultaneously, and prove that any axis-aligned non-oblivious tree ensemble can be transformed into an axis-aligned oblivious tree ensemble with the same NTK. \nOne can search for suitable tree architecture via Multiple Kernel Learning (MKL), and our numerical experiments show a variety of suitable features depending on the type of constraints, which supports not only the theoretical but also the practical impact of the axis-aligned constraint in tree ensemble learning.", "keywords": "Neural Tangent Kernel;Tree Ensemble;Soft Tree", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/f53cb91411a9db9a0dce7d9535b183654b58b6be.zip", "author": "Ryuichi Kanoh;Mahito Sugiyama", "authorids": "~Ryuichi_Kanoh1;~Mahito_Sugiyama1", "gender": "M;M", "homepage": ";https://mahito.nii.ac.jp/", "dblp": "287/4416;05/8421", "google_scholar": ";qLlRvTkAAAAJ", "orcid": ";0000-0001-5907-9831", "linkedin": "ryuichi-kanoh-43ab4316b/;", "or_profile": "~Ryuichi_Kanoh1;~Mahito_Sugiyama1", "aff": "NII, the Graduate University for Advanced Studies;National Institute of Informatics", "aff_domain": "nii.ac.jp;nii.ac.jp", "position": "PhD student;Associate Professor", "bibtex": "@misc{\nkanoh2024neural,\ntitle={Neural Tangent Kernels for Axis-Aligned Tree Ensembles},\nauthor={Ryuichi Kanoh and Mahito Sugiyama},\nyear={2024},\nurl={https://openreview.net/forum?id=5MlPrLO52d}\n}", "github": "", "project": "", "reviewers": "QWBa;PQpi;Nxzp;w3rN", "site": "https://openreview.net/forum?id=5MlPrLO52d", "pdf_size": 2158884, "rating": "5;5;6;6", "confidence": "4;3;3;2", "soundness": "3;4;3;3", "contribution": "2;3;3;3", "presentation": "3;2;4;3", "wc_summary": "23;40;133;116", "wc_strengths": "18;61;76;77", "wc_weaknesses": "97;450;103;7", "wc_questions": "59;146;65;29", "wc_review": "197;697;377;229", "wc_reply_reviewers": "421;449;0;0", "wc_reply_authors": "1655;2032;631;93", "reply_reviewers": "2;2;0;0", "reply_authors": "3;3;1;1", "rating_avg": [ 5.5, 0.5 ], "confidence_avg": [ 3.0, 0.7071067811865476 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 78.0, 47.270498199193966 ], "wc_strengths_avg": [ 58.0, 23.947860029656095 ], "wc_weaknesses_avg": [ 164.25, 169.3035365844435 ], "wc_questions_avg": [ 74.75, 43.338060639581 ], "wc_review_avg": [ 375.0, 197.9191754226962 ], "wc_reply_reviewers_avg": [ 217.5, 217.72517080025452 ], "wc_reply_authors_avg": [ 1102.75, 776.3099815795234 ], "reply_reviewers_avg": [ 1.0, 1.0 ], "reply_authors_avg": [ 2.0, 1.0 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.7071067811865475, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:a8X-VfUeUuEJ:scholar.google.com/&scioq=Neural+Tangent+Kernels+for+Axis-Aligned+Tree+Ensembles&hl=en&as_sdt=0,5", "gs_version_total": 4, "aff_unique_index": "0;0", "aff_unique_norm": "National Institute of Informatics", "aff_unique_dep": 
"", "aff_unique_url": "https://www.nii.ac.jp", "aff_unique_abbr": "NII", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "Japan" }, { "id": "5NJzNAXAmx", "title": "Informed POMDP: Leveraging Additional Information in Model-Based RL", "track": "main", "status": "Reject", "tldr": "", "abstract": "In this work, we generalize the problem of learning through interaction in a POMDP by accounting for eventual additional information available at training time. First, we introduce the informed POMDP, a new learning paradigm offering a clear distinction between the training information and the execution observation. Next, we propose an objective that leverages this information for learning a sufficient statistic of the history for the optimal control. We then adapt this informed objective to learn a world model able to sample latent trajectories. Finally, we empirically show a significant learning speed improvement in most environments using this informed world model in the Dreamer algorithm. These results and the simplicity of the proposed adaptation advocate for a systematic consideration of eventual additional information when learning in a POMDP using model-based RL.", "keywords": "POMDP;RNN;Sufficient Statistic;Model-Based;Privileged Information;Asymmetric Learning", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Gaspard Lambrechts;Adrien Bolland;Damien Ernst", "authorids": "~Gaspard_Lambrechts1;~Adrien_Bolland1;~Damien_Ernst1", "gender": "M;;M", "homepage": "https://gsprd.be;;http://www.damien-ernst.be", "dblp": ";;", "google_scholar": "LRcgg2wAAAAJ;8m9bl5oAAAAJ;https://scholar.google.be/citations?user=91ZxYSsAAAAJ", "orcid": ";;", "linkedin": ";adrien-bolland-48497218a/;", "or_profile": "~Gaspard_Lambrechts1;~Adrien_Bolland1;~Damien_Ernst1", "aff": "Universit\u00e9 de Li\u00e8ge;University of Liege;University of Li\u00e8ge", "aff_domain": "ulg.ac.be;ulg.ac.be;uliege.be", "position": "PhD student;PhD student;Full Professor", "bibtex": "@misc{\nlambrechts2024informed,\ntitle={Informed {POMDP}: Leveraging Additional Information in Model-Based {RL}},\nauthor={Gaspard Lambrechts and Adrien Bolland and Damien Ernst},\nyear={2024},\nurl={https://openreview.net/forum?id=5NJzNAXAmx}\n}", "github": "", "project": "", "reviewers": "EdBW;1Mpb;cAA6;SwZJ", "site": "https://openreview.net/forum?id=5NJzNAXAmx", "pdf_size": 868987, "rating": "5;6;6;6", "confidence": "3;4;3;3", "soundness": "3;3;3;3", "contribution": "2;2;3;2", "presentation": "3;2;3;3", "wc_summary": "170;227;101;90", "wc_strengths": "21;89;133;80", "wc_weaknesses": "456;206;138;213", "wc_questions": "101;1;104;97", "wc_review": "748;523;476;480", "wc_reply_reviewers": "54;33;0;17", "wc_reply_authors": "1782;678;838;1079", "reply_reviewers": "1;1;0;1", "reply_authors": "4;2;2;3", "rating_avg": [ 5.75, 0.4330127018922193 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 147.0, 55.43915583772899 ], "wc_strengths_avg": [ 80.75, 39.90222424878092 ], "wc_weaknesses_avg": [ 253.25, 120.66767379874364 ], "wc_questions_avg": [ 75.75, 43.22831826476714 ], "wc_review_avg": [ 556.75, 111.94501998749207 ], "wc_reply_reviewers_avg": [ 26.0, 19.937402037376884 ], "wc_reply_authors_avg": [ 1094.25, 421.94808626180543 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 2.75, 
0.82915619758885 ], "replies_avg": [ 22, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.3333333333333333, "gs_citation": 12, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=13697808195694192667&as_sdt=5,34&sciodt=0,34&hl=en", "gs_version_total": 7, "aff_unique_index": "0;1;1", "aff_unique_norm": "Universit\u00e9 de Li\u00e8ge;University of Li\u00e8ge", "aff_unique_dep": ";", "aff_unique_url": "https://www.ulg.ac.be;https://www.ulg.ac.be", "aff_unique_abbr": "ULi\u00e8ge;ULi\u00e8ge", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "Belgium" }, { "title": "PandaLM: An Automatic Evaluation Benchmark for LLM Instruction Tuning Optimization", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19427", "id": "5Nn2BLV7SB", "author_site": "Yidong Wang, Zhuohao Yu, Zhengran Zeng, Linyi Yang, Wenjin Yao, Cunxiang Wang, Hao Chen, Chaoya Jiang, Rui Xie, Jindong Wang, Xing Xie, Wei Ye, Shikun Zhang, Yue Zhang", "tldr": "", "abstract": "Instruction tuning large language models (LLMs) remains a challenging task, owing to the complexity of hyperparameter selection and the difficulty involved in evaluating the tuned models. To determine the optimal hyperparameters, an automatic, robust, and reliable evaluation benchmark is essential. However, establishing such a benchmark is not a trivial task due to the challenges associated with evaluation accuracy and privacy protection. In response to these challenges, we introduce a judge large language model, named PandaLM, which is trained to distinguish the superior model given several LLMs. PandaLM's focus extends beyond just the objective correctness of responses, which is the main focus of traditional evaluation datasets. It addresses vital subjective factors such as relative conciseness, clarity, adherence to instructions, comprehensiveness, and formality. To ensure the reliability of PandaLM, we collect a diverse human-annotated test dataset, where all contexts are generated by humans and labels are aligned with human preferences. Our findings reveal that PandaLM-7B offers a performance comparable to both GPT-3.5 and GPT-4. Impressively, PandaLM-70B surpasses their performance. PandaLM enables the evaluation of LLM to be fairer but with less cost, evidenced by significant improvements achieved by models tuned through PandaLM compared to their counterparts trained with default Alpaca's hyperparameters. 
In addition, PandaLM does not depend on API-based evaluations, thus avoiding potential data leakage.", "keywords": "LLM evaluation", "primary_area": "datasets and benchmarks", "supplementary_material": "/attachment/4400e4f0f67603849e18132665f6c3cb9cd1ce73.pdf", "author": "Yidong Wang;Zhuohao Yu;Wenjin Yao;Zhengran Zeng;Linyi Yang;Cunxiang Wang;Hao Chen;Chaoya Jiang;Rui Xie;Jindong Wang;Xing Xie;Wei Ye;Shikun Zhang;Yue Zhang", "authorids": "~Yidong_Wang1;~Zhuohao_Yu1;~Wenjin_Yao1;~Zhengran_Zeng2;~Linyi_Yang1;~Cunxiang_Wang1;~Hao_Chen15;~Chaoya_Jiang1;~Rui_Xie2;~Jindong_Wang1;~Xing_Xie3;~Wei_Ye2;~Shikun_Zhang2;~Yue_Zhang7", "gender": "M;;M;;;Not Specified;M;;M;;M;M;M;M", "homepage": "https://qianlanwyd.github.io/;;;;https://yanglinyi.github.io/;https://wangcunxiang.github.io/;https://hhhhhhao.github.io/;;;;http://research.microsoft.com/en-us/people/xingx/;https://se.pku.edu.cn/kcl/weiye/;;http://frcchang.github.io", "dblp": "59/6759.html;;;;218/8007;213/1862.html;;;86/2228-3.html;;08/6809-1;09/5394-4;83/3715.html;47/722-4", "google_scholar": ";;FdntfpkAAAAJ;;go3sFxcAAAAJ;https://scholar.google.com.sg/citations?hl=en;tktqkhwAAAAJ;;6PcaSxgAAAAJ;;5EQfAFIAAAAJ;RgLGFMIAAAAJ;uiklLscAAAAJ;", "orcid": ";;;;;;;;;;0000-0002-8608-8482;;;0000-0002-5214-2268", "linkedin": ";;;;;;haochen97/;;;;xingx/;;;", "or_profile": "~Yidong_Wang1;~Zhuohao_Yu1;~Wenjin_Yao1;~Zhengran_Zeng2;~Linyi_Yang1;~Cunxiang_Wang1;~Hao_Chen15;~Chaoya_Jiang1;~Rui_Xie2;~Jindong_Wang1;~Xing_Xie3;~Wei_Ye2;~Shikun_Zhang2;~Yue_Zhang7", "aff": "Peking University;;Peking University;;Westlake University;Westlake University;Carnegie Mellon University;;Peking University;;Microsoft Research Asia;Peking University;Peking University;Westlake University", "aff_domain": "pku.edu.cn;;pku.edu.cn;;westlake.edu.cn;westlake.edu.cn;andrew.cmu.edu;;pku.edu.cn;;microsoft.com;pku.edu.cn;pku.edu.cn;westlake.edu.cn", "position": "PhD student;;MS student;;Researcher;PhD student;PhD student;;Postdoc;;Senior Principal Researcher;Associate Professor;Full Professor;Full Professor", "bibtex": "@inproceedings{\nwang2024pandalm,\ntitle={Panda{LM}: An Automatic Evaluation Benchmark for {LLM} Instruction Tuning Optimization},\nauthor={Yidong Wang and Zhuohao Yu and Wenjin Yao and Zhengran Zeng and Linyi Yang and Cunxiang Wang and Hao Chen and Chaoya Jiang and Rui Xie and Jindong Wang and Xing Xie and Wei Ye and Shikun Zhang and Yue Zhang},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=5Nn2BLV7SB}\n}", "github": "", "project": "", "reviewers": "8MGB;FMz2;Vuch", "pdf_size": 3818880, "rating": "5;8;8", "confidence": "4;3;3", "soundness": "2;3;3", "contribution": "2;3;3", "presentation": "2;3;3", "wc_summary": "99;182;86", "wc_strengths": "77;186;122", "wc_weaknesses": "162;165;137", "wc_questions": "283;126;6", "wc_review": "621;659;351", "wc_reply_reviewers": "0;17;0", "wc_reply_authors": "1942;654;510", "reply_reviewers": "0;1;0", "reply_authors": "3;1;1", "rating_avg": [ 7.0, 1.4142135623730951 ], "confidence_avg": [ 3.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 122.33333333333333, 42.52319628417203 ], "wc_strengths_avg": [ 128.33333333333334, 44.723844000960185 ], "wc_weaknesses_avg": [ 154.66666666666666, 12.552113589175153 ], "wc_questions_avg": [ 138.33333333333334, 
113.42055467252055 ], "wc_review_avg": [ 543.6666666666666, 137.11633341396237 ], "wc_reply_reviewers_avg": [ 5.666666666666667, 8.013876853447538 ], "wc_reply_authors_avg": [ 1035.3333333333333, 643.7998308653259 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 1.6666666666666667, 0.9428090415820634 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 14, 0 ], "corr_rating_confidence": -1.0, "gs_citation": 227, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=13482765834651698548&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=5Nn2BLV7SB", "pdf": "https://openreview.net/pdf?id=5Nn2BLV7SB", "email": "pku.edu.cn;;pku.edu.cn;;westlake.edu.cn;westlake.edu.cn;andrew.cmu.edu;;pku.edu.cn;;microsoft.com;pku.edu.cn;pku.edu.cn;westlake.edu.cn", "author_num": 14, "aff_unique_index": "0;0;1;1;2;0;3;0;0;1", "aff_unique_norm": "Peking University;Westlake University;Carnegie Mellon University;Microsoft", "aff_unique_dep": ";;;Research", "aff_unique_url": "http://www.pku.edu.cn;https://www.westlake.edu.cn;https://www.cmu.edu;https://www.microsoft.com/en-us/research/group/asia", "aff_unique_abbr": "Peking U;WU;CMU;MSR Asia", "aff_campus_unique_index": "1", "aff_campus_unique": ";Asia", "aff_country_unique_index": "0;0;0;0;1;0;0;0;0;0", "aff_country_unique": "China;United States" }, { "id": "5Osk2F3qCn", "title": "TADIS: Steering Models for Deep-Thinking about Demonstration Examples", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Instruction tuning has been demonstrated that could significantly improve the zero-shot generalization capability to unseen tasks by an apparent margin. By incorporating additional context (e.g., task definition, examples) during the fine-tuning process, Large Language Models (LLMs) achieved much higher performance than before. However, recent work reported that delusive task examples can achieve almost the same performance as correct task examples, indicating the input-label correspondence is less important than previously thought. Intrigued by this counter-intuitive observation, we suspect models have the same illusion of competence as humans. Therefore, we propose a novel method called TADIS that steers LLMs for \"Deep-Thinking'' about demonstration examples instead of merely seeing. To alleviate the illusion of competence of models, we first ask the model to verify the correctness of shown examples. Then, using the verification results as conditions to elicit models for a better answer. Our experimental results show that TADIS consistently outperforms competitive baselines on in-domain and out-domain tasks (improving 2.79 and 4.03 average ROUGLE-L on out-domain and in-domain datasets, respectively). \nDespite the presence of generated examples (not all of the thinking labels are accurate), TADIS can notably enhance performance in zero-shot and few-shot settings. This also suggests that our approach can be adopted on a large scale to improve the instruction following capabilities of models without any manual labor. 
Moreover, we construct three types of thinking labels with different model sizes and find that small models learn from the format of TADIS but larger models can be steered for \"Deep-Thinking''.", "keywords": "Instruction Tuning;Language Model;Few-Shot", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/6c070efd803b8a4afa978472dde5fd91f3bb1ed9.zip", "author": "Tianci Xue;Ziqi Wang;Yixia Li;Yun Chen;Guanhua Chen", "authorids": "~Tianci_Xue1;~Ziqi_Wang2;~Yixia_Li1;~Yun_Chen1;~Guanhua_Chen1", "gender": "M;;M;F;M", "homepage": "https://xuetianci.github.io/;https://www.wzq016.github.io;https://liyixia.me;https://yunc.me/;https://ghchen.me", "dblp": "347/9360;38/8097-3;257/2679;10/5680-7;85/3682-1", "google_scholar": "wVFSbzkAAAAJ;xYRZiZkAAAAJ;LrYjRNYAAAAJ;vXd0JQMAAAAJ;https://scholar.google.com/citations?hl=zh-CN", "orcid": ";;0000-0002-0921-7551;0000-0002-3563-7592;0000-0002-5353-9734", "linkedin": ";;liyixia/;;", "or_profile": "~Tianci_Xue1;~Ziqi_Wang2;~Yixia_Li1;~Yun_Chen1;~Guanhua_Chen1", "aff": "Nanjing University;Meta Facebook;Southern University of Science and Technology ;Shanghai University of Finance and Economics;Southern University of Science and Technology", "aff_domain": "nju.edu.cn;meta.com;sustech.edu;sufe.edu.cn;sustech.edu.cn", "position": "MS student;Intern;PhD student;Assistant Professor;Assistant Professor", "bibtex": "@misc{\nxue2024tadis,\ntitle={{TADIS}: Steering Models for Deep-Thinking about Demonstration Examples},\nauthor={Tianci Xue and Ziqi Wang and Yixia Li and Yun Chen and Guanhua Chen},\nyear={2024},\nurl={https://openreview.net/forum?id=5Osk2F3qCn}\n}", "github": "", "project": "", "reviewers": "B4dK;Fers;B5Pw;8SUE", "site": "https://openreview.net/forum?id=5Osk2F3qCn", "pdf_size": 525928, "rating": "3;3;3;6", "confidence": "2;4;2;3", "soundness": "2;2;2;3", "contribution": "2;2;2;3", "presentation": "3;2;1;2", "wc_summary": "116;93;66;91", "wc_strengths": "60;152;104;42", "wc_weaknesses": "755;267;242;144", "wc_questions": "169;81;112;136", "wc_review": "1100;593;524;413", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 3.75, 1.299038105676658 ], "confidence_avg": [ 2.75, 0.82915619758885 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.0, 0.7071067811865476 ], "wc_summary_avg": [ 91.5, 17.698870020427858 ], "wc_strengths_avg": [ 89.5, 42.55290824373817 ], "wc_weaknesses_avg": [ 352.0, 237.16977041773262 ], "wc_questions_avg": [ 124.5, 32.25290684574028 ], "wc_review_avg": [ 657.5, 263.42408773686583 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.17407765595569782, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=2471280889710494543&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 2, "aff_unique_index": "0;1;2;3;2", "aff_unique_norm": "Nanjing University;Meta;Southern University of Science and Technology;Shanghai University of Finance and Economics", "aff_unique_dep": ";Meta Platforms, Inc.;;", "aff_unique_url": "https://www.nju.edu.cn;https://meta.com;https://www.sustech.edu.cn;http://www.sufe.edu.cn", "aff_unique_abbr": "Nanjing U;Meta;SUSTech;SUFE", "aff_campus_unique_index": "", "aff_campus_unique": "", 
"aff_country_unique_index": "0;1;0;0;0", "aff_country_unique": "China;United States" }, { "id": "5PkgaUwiY0", "title": "VideoDirectorGPT: Consistent Multi-Scene Video Generation via LLM-Guided Planning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Although recent text-to-video (T2V) generation methods have seen significant advancements, the majority of these works focus on producing short video clips of a single event with a single background (i.e., single-scene videos). Meanwhile, recent large language models (LLMs) have demonstrated their capability in generating layouts and programs to control downstream visual modules such as image generation models. This prompts an important question: can we leverage the knowledge embedded in these LLMs for temporally consistent long video generation? In this paper, we propose VideoDirectorGPT, a novel framework for consistent multi-scene video generation that uses the knowledge of LLMs for video content planning and grounded video generation. Specifically, given a single text prompt, we first ask our video planner LLM (GPT-4) to expand it into a \u2018video plan\u2019, which involves generating the scene descriptions, the entities with their respective layouts, the background for each scene, and consistency groupings of the entities and backgrounds. Next, guided by this output from the video planner, our video generator, named Layout2Vid, has explicit control over spatial layouts and can maintain temporal consistency of entities/backgrounds across multiple scenes, while being trained only with image-level annotations. Our experiments demonstrate that our proposed VideoDirectorGPT framework substantially improves layout and movement control in both single- and multi-scene video generation and can generate multi-scene videos with visual consistency across scenes, while achieving competitive performance with SOTAs in open-domain single-scene text-to-video generation. We also demonstrate that our framework can dynamically control the strength for layout guidance and can also generate videos with user-provided images. 
We hope our framework can inspire future work on integrating the planning ability of LLMs into consistent long video generation.", "keywords": "Text-to-Video Generation;Large Language Models;Layout-Guided Video Generation;Temporal Consistency;Multi-Scene Video Generation;Layout Control", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/2436f0253ad2ca33bd87987c580d9851b9cb317b.zip", "author": "Han Lin;Abhay Zala;Jaemin Cho;Mohit Bansal", "authorids": "~Han_Lin1;~Abhay_Zala1;~Jaemin_Cho1;~Mohit_Bansal2", "gender": "M;;M;M", "homepage": "https://hl-hanlin.github.io/;;https://j-min.io;https://www.cs.unc.edu/~mbansal/", "dblp": ";278/2061.html;130/8348-1;32/5243.html", "google_scholar": "https://scholar.google.com/citations?view_op=list_works;8mfWxD8AAAAJ;IbQZoHQAAAAJ;DN8QtscAAAAJ", "orcid": ";;0000-0002-1558-6169;", "linkedin": "han-lin-9336981a3/;;;", "or_profile": "~Han_Lin1;~Abhay_Zala1;~Jaemin_Cho1;~Mohit_Bansal2", "aff": "Department of Computer Science, University of North Carolina at Chapel Hill;Department of Computer Science, University of North Carolina at Chapel Hill;University of North Carolina, Chapel Hill;University of North Carolina at Chapel Hill", "aff_domain": "cs.unc.edu;cs.unc.edu;unc.edu;unc.edu", "position": "PhD student;MS student;PhD student;Full Professor", "bibtex": "@misc{\nlin2024videodirectorgpt,\ntitle={VideoDirector{GPT}: Consistent Multi-Scene Video Generation via {LLM}-Guided Planning},\nauthor={Han Lin and Abhay Zala and Jaemin Cho and Mohit Bansal},\nyear={2024},\nurl={https://openreview.net/forum?id=5PkgaUwiY0}\n}", "github": "", "project": "", "reviewers": "tZEz;pdWu;dMSD;GLr8", "site": "https://openreview.net/forum?id=5PkgaUwiY0", "pdf_size": 18166678, "rating": "3;3;5;5", "confidence": "4;4;4;5", "soundness": "3;2;3;3", "contribution": "2;3;2;2", "presentation": "3;2;3;2", "wc_summary": "57;64;123;118", "wc_strengths": "21;78;137;48", "wc_weaknesses": "120;260;287;176", "wc_questions": "3;79;4;91", "wc_review": "201;481;551;433", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "350;710;0;744", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;0;1", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 90.5, 30.153772566629204 ], "wc_strengths_avg": [ 71.0, 43.110323589599744 ], "wc_weaknesses_avg": [ 210.75, 66.48825084178407 ], "wc_questions_avg": [ 44.25, 40.97178907492325 ], "wc_review_avg": [ 416.5, 131.30403649545585 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 451.0, 302.7094316337038 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0.75, 0.4330127018922193 ], "replies_avg": [ 8, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.5773502691896257, "gs_citation": 73, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11199615266521370931&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 5, "aff_unique_index": "0;0;1;1", "aff_unique_norm": "University of North Carolina at Chapel Hill;University of North Carolina", "aff_unique_dep": "Department of Computer Science;", "aff_unique_url": "https://www.unc.edu;https://www.unc.edu", "aff_unique_abbr": "UNC Chapel Hill;UNC", "aff_campus_unique_index": "0;0;0;0", "aff_campus_unique": "Chapel Hill", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "title": "TEDDY: 
Trimming Edges with Degree-based Discrimination Strategy", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19426", "id": "5RUf9nEdyC", "author_site": "Hyunjin Seo, Jihun Yun, Eunho Yang", "tldr": "", "abstract": "Since the pioneering work on the lottery ticket hypothesis for graph neural networks (GNNs) was proposed in Chen et al. (2021), the study on finding graph lottery tickets (GLT) has become one of the pivotal focus in the GNN community, inspiring researchers to discover sparser GLT while achieving comparable performance to original dense networks. In parallel, the graph structure has gained substantial attention as a crucial factor in GNN training dynamics, also elucidated by several recent studies. Despite this, contemporary studies on GLT, in general, have not fully exploited inherent pathways in the graph structure and identified tickets in an iterative manner, which is time-consuming and inefficient. To address these limitations, we introduce **TEDDY**, a one-shot edge sparsification framework that leverages structural information by incorporating *edge-degree* statistics. Following the edge sparsification, we encourage the parameter sparsity during training via simple projected gradient descent on the $\\ell_0$ ball. Given the target sparsity levels for both the graph structure and the model parameters, our TEDDY facilitates efficient and rapid realization of GLT within a *single* training. Remarkably, our experimental results demonstrate that TEDDY significantly surpasses conventional iterative approaches in generalization, even when conducting one-shot sparsification that solely utilizes graph structures, without taking feature information into account.", "keywords": "Graph Lottery Tickets; Graph Compression; Graph Sparsification; Graph Neural Networks", "primary_area": "learning on graphs and other geometries & topologies", "supplementary_material": "/attachment/6b610ba0b8bced99d28ff3e7067ba884245d75c8.zip", "author": "Hyunjin Seo;Jihun Yun;Eunho Yang", "authorids": "~Hyunjin_Seo2;~Jihun_Yun2;~Eunho_Yang1", "gender": "F;M;M", "homepage": "https://github.com/hyunjin72;https://github.com/abcdxyzpqrst;https://sites.google.com/site/hleehome2/", "dblp": ";241/9676;96/2621", "google_scholar": "MFDOhRUAAAAJ;ELv5qfEAAAAJ;", "orcid": ";;", "linkedin": "hyunjin-seo-97525629a/?originalSubdomain=kr;;", "or_profile": "~Hyunjin_Seo2;~Jihun_Yun2;~Eunho_Yang1", "aff": "Korea Advanced Institute of Science & Technology;Korea Advanced Institute of Science & Technology;Korea Advanced Institute of Science & Technology", "aff_domain": "kaist.ac.kr;kaist.ac.kr;kaist.ac.kr", "position": "MS student;PhD student;Associate Professor", "bibtex": "@inproceedings{\nseo2024teddy,\ntitle={{TEDDY}: Trimming Edges with Degree-based Discrimination Strategy},\nauthor={Hyunjin Seo and Jihun Yun and Eunho Yang},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=5RUf9nEdyC}\n}", "github": "", "project": "", "reviewers": "QTmY;k6Ge;mYP6;vxbf;SQ4D", "pdf_size": 9177078, "rating": "5;5;6;6;8", "confidence": "5;4;3;3;2", "soundness": "3;2;3;2;3", "contribution": "2;2;3;3;3", "presentation": "2;2;3;3;4", "wc_summary": "34;86;78;55;35", "wc_strengths": "42;25;90;18;31", "wc_weaknesses": "291;157;179;296;19", "wc_questions": "53;510;118;83;19", "wc_review": "420;778;465;452;104", "wc_reply_reviewers": "0;402;0;79;0", "wc_reply_authors": "1131;4190;937;1090;1190", "reply_reviewers": "0;3;0;1;0", 
"reply_authors": "4;13;2;3;3", "rating_avg": [ 6.0, 1.0954451150103321 ], "confidence_avg": [ 3.4, 1.019803902718557 ], "soundness_avg": [ 2.6, 0.4898979485566356 ], "contribution_avg": [ 2.6, 0.4898979485566356 ], "presentation_avg": [ 2.8, 0.7483314773547882 ], "wc_summary_avg": [ 57.6, 21.434551546510132 ], "wc_strengths_avg": [ 41.2, 25.639032743065794 ], "wc_weaknesses_avg": [ 188.4, 101.85794028940502 ], "wc_questions_avg": [ 156.6, 179.70264327493905 ], "wc_review_avg": [ 443.8, 213.6524280227117 ], "wc_reply_reviewers_avg": [ 96.2, 155.93126690949447 ], "wc_reply_authors_avg": [ 1707.6, 1244.0209966073724 ], "reply_reviewers_avg": [ 0.8, 1.1661903789690602 ], "reply_authors_avg": [ 5.0, 4.049691346263317 ], "replies_avg": [ 39, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.8951435925492911, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14447942716248132355&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=5RUf9nEdyC", "pdf": "https://openreview.net/pdf?id=5RUf9nEdyC", "email": "kaist.ac.kr;kaist.ac.kr;kaist.ac.kr", "author_num": 3, "aff_unique_index": "0;0;0", "aff_unique_norm": "Korea Advanced Institute of Science and Technology", "aff_unique_dep": "", "aff_unique_url": "https://www.kaist.ac.kr", "aff_unique_abbr": "KAIST", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "South Korea" }, { "title": "Learning Adaptive Multiresolution Transforms via Meta-Framelet-based Graph Convolutional Network", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19425", "id": "5RielfrDkP", "author_site": "Tianze Luo, Zhanfeng Mo, Sinno Pan", "tldr": "", "abstract": "Graph Neural Networks are popular tools in graph representation learning that capture the graph structural properties. However, most GNNs employ single-resolution graph feature extraction, thereby failing to capture micro-level local patterns (high resolution) and macro-level graph cluster and community patterns (low resolution) simultaneously. Many multiresolution methods have been developed to capture graph patterns at multiple scales, but most of them depend on predefined and handcrafted multiresolution transforms that remain fixed throughout the training process once formulated. Due to variations in graph instances and distributions, fixed handcrafted transforms can not effectively tailor multiresolution representations to each graph instance. To acquire multiresolution representation suited to different graph instances and distributions, we introduce the Multiresolution Meta-Framelet-based Graph Convolutional Network (MM-FGCN), facilitating comprehensive and adaptive multiresolution analysis across diverse graphs. 
Extensive experiments demonstrate that our MM-FGCN achieves SOTA performance on various graph learning tasks.", "keywords": "Graph neural networks;graph multiresolution analysis", "primary_area": "learning on graphs and other geometries & topologies", "supplementary_material": "/attachment/69b2419b7e2027cca1feb8016c59f2e8caabceec.zip", "author": "Tianze Luo;Zhanfeng Mo;Sinno Jialin Pan", "authorids": "~Tianze_Luo1;~Zhanfeng_Mo1;~Sinno_Jialin_Pan1", "gender": "Not Specified;M;M", "homepage": "https://ltz0120.github.io/;;http://www.cse.cuhk.edu.hk/~sinnopan/", "dblp": "297/4000;246/3205;80/5412", "google_scholar": "XROXNIMAAAAJ;DhN2kNoAAAAJ;https://scholar.google.com/citations?hl=en", "orcid": ";0000-0003-2254-8651;", "linkedin": ";zhanfeng-mo-5b2105198/;", "or_profile": "~Tianze_Luo1;~Zhanfeng_Mo1;~Sinno_Pan1", "aff": "Nanyang Technological University;Nanyang Technological University;Nanyang Technological University", "aff_domain": "ntu.edu.sg;ntu.edu.sg;ntu.edu.sg", "position": "PhD student;PhD student;Full Professor", "bibtex": "@inproceedings{\nluo2024learning,\ntitle={Learning Adaptive Multiresolution Transforms via Meta-Framelet-based Graph Convolutional Network},\nauthor={Tianze Luo and Zhanfeng Mo and Sinno Jialin Pan},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=5RielfrDkP}\n}", "github": "", "project": "", "reviewers": "PtSQ;nDyN;sJoC;oTNL", "pdf_size": 3633327, "rating": "6;6;8;8", "confidence": "3;4;3;4", "soundness": "3;3;3;3", "contribution": "3;2;3;3", "presentation": "3;3;3;3", "wc_summary": "32;21;92;151", "wc_strengths": "29;29;72;40", "wc_weaknesses": "164;77;161;29", "wc_questions": "8;74;29;37", "wc_review": "233;201;354;257", "wc_reply_reviewers": "0;17;118;103", "wc_reply_authors": "2217;3329;1404;1129", "reply_reviewers": "0;1;1;1", "reply_authors": "4;7;4;5", "rating_avg": [ 7.0, 1.0 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 74.0, 52.02403290787826 ], "wc_strengths_avg": [ 42.5, 17.613914953808536 ], "wc_weaknesses_avg": [ 107.75, 57.32963893135906 ], "wc_questions_avg": [ 37.0, 23.843238035132728 ], "wc_review_avg": [ 261.25, 57.115562677785114 ], "wc_reply_reviewers_avg": [ 59.5, 51.62605931116571 ], "wc_reply_authors_avg": [ 2019.75, 855.2231799360914 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 5.0, 1.224744871391589 ], "replies_avg": [ 29, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=4837618134532439165&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=5RielfrDkP", "pdf": "https://openreview.net/pdf?id=5RielfrDkP", "email": "ntu.edu.sg;ntu.edu.sg;ntu.edu.sg", "author_num": 3, "aff_unique_index": "0;0;0", "aff_unique_norm": "Nanyang Technological University", "aff_unique_dep": "", "aff_unique_url": "https://www.ntu.edu.sg", "aff_unique_abbr": "NTU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "Singapore" }, { "id": "5T46w5X3Go", "title": "Theoretical Analysis on the Generalization Power of Overfitted Transfer Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "Transfer learning is a useful technique for achieving improved performance and reducing training costs by leveraging the 
knowledge gained from source tasks and applying it to target tasks. Assessing the effectiveness of transfer learning relies on understanding the similarity between the ground truth of the source and target tasks. In real-world applications, tasks often exhibit partial similarity, where certain aspects are similar while others are different or irrelevant. To investigate the impact of partial similarity on transfer learning performance, we focus on a linear regression model with two distinct sets of features: a common part shared across tasks and a task-specific part. Our study explores various types of transfer learning, encompassing two options for parameter transfer. By establishing a theoretical characterization on the error of the learned model, we compare these transfer learning options, particularly examining how generalization performance changes with the number of features/parameters in both underparameterized and overparameterized regimes. Furthermore, we provide practical guidelines for determining the number of features in the common and task-specific parts for improved generalization performance. For example, when the total number of features in the source task's learning model is fixed, we show that it is more advantageous to allocate a greater number of redundant features to the task-specific part rather than the common part. Moreover, in specific scenarios, particularly those characterized by high noise levels and small true parameters, sacrificing certain true features in the common part in favor of employing more redundant features in the task-specific part can yield notable benefits.", "keywords": "transfer learning;generalization performance;overfitting;overparameterization;double descent", "primary_area": "learning theory", "supplementary_material": "", "author": "Peizhong Ju;Sen Lin;Mark S. Squillante;Yingbin Liang;Ness Shroff", "authorids": "~Peizhong_Ju1;~Sen_Lin1;~Mark_S._Squillante1;~Yingbin_Liang1;~Ness_Shroff1", "gender": "M;;M;F;M", "homepage": ";https://slin70.github.io/;https://researcher.watson.ibm.com/researcher/view.php?person=us-mss;https://sites.google.com/view/yingbinliang/home;http://newslab.ece.ohio-state.edu/", "dblp": "167/9021;70/9499-1.html;67/3865;51/332;67/1991", "google_scholar": "VDzpfOYAAAAJ;94-TbUsAAAAJ;;lGgLAiIAAAAJ;https://scholar.google.com.tw/citations?user=5kL-ZrAAAAAJ", "orcid": "0000-0002-4569-3539;;;;0000-0002-4606-6879", "linkedin": ";;;;nessshroff/", "or_profile": "~Peizhong_Ju1;~Sen_Lin1;~Mark_S._Squillante1;~Yingbin_Liang1;~Ness_Shroff1", "aff": "Ohio State University, Columbus;University of Houston;IBM Research;The Ohio State University;Ohio State University, Columbus", "aff_domain": "osu.edu;uh.edu;us.ibm.com;osu.edu;osu.edu", "position": "Postdoc;Assistant Professor;Distinguished Research Staff Member;Professor;Full Professor", "bibtex": "@misc{\nju2024theoretical,\ntitle={Theoretical Analysis on the Generalization Power of Overfitted Transfer Learning},\nauthor={Peizhong Ju and Sen Lin and Mark S. 
Squillante and Yingbin Liang and Ness Shroff},\nyear={2024},\nurl={https://openreview.net/forum?id=5T46w5X3Go}\n}", "github": "", "project": "", "reviewers": "hznS;kvri;onS3;6fkR", "site": "https://openreview.net/forum?id=5T46w5X3Go", "pdf_size": 486498, "rating": "3;3;5;8", "confidence": "4;4;3;3", "soundness": "2;3;3;4", "contribution": "1;2;2;4", "presentation": "1;2;2;4", "wc_summary": "137;115;105;107", "wc_strengths": "39;68;73;72", "wc_weaknesses": "66;261;372;59", "wc_questions": "86;77;17;64", "wc_review": "328;521;567;302", "wc_reply_reviewers": "0;0;21;0", "wc_reply_authors": "813;652;916;312", "reply_reviewers": "0;0;1;0", "reply_authors": "2;1;2;1", "rating_avg": [ 4.75, 2.0463381929681126 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 2.25, 1.0897247358851685 ], "presentation_avg": [ 2.25, 1.0897247358851685 ], "wc_summary_avg": [ 116.0, 12.68857754044952 ], "wc_strengths_avg": [ 63.0, 13.982131454109563 ], "wc_weaknesses_avg": [ 189.5, 132.9482982215267 ], "wc_questions_avg": [ 61.0, 26.580067720004024 ], "wc_review_avg": [ 429.5, 116.01400777492346 ], "wc_reply_reviewers_avg": [ 5.25, 9.093266739736606 ], "wc_reply_authors_avg": [ 673.25, 228.80709669938125 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.8551861104941366, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:omXfKyZcMRAJ:scholar.google.com/&scioq=Theoretical+Analysis+on+the+Generalization+Power+of+Overfitted+Transfer+Learning&hl=en&as_sdt=0,10", "gs_version_total": 0, "aff_unique_index": "0;1;2;0;0", "aff_unique_norm": "Ohio State University;University of Houston;IBM", "aff_unique_dep": ";;IBM Research", "aff_unique_url": "https://www.osu.edu;https://www.uh.edu;https://www.ibm.com/research", "aff_unique_abbr": "OSU;UH;IBM", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Columbus;", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "5TlHjMVrNG", "title": "Evaluating Robustness to Unforeseen Adversarial Attacks", "track": "main", "status": "Reject", "tldr": "", "abstract": "When considering real-world adversarial settings, defenders are unlikely to have access to the full range of deployment-time adversaries during training, and adversaries are likely to use realistic adversarial distortions that will not be limited to small $L_p$-constrained perturbations. To narrow in on this discrepancy between research and reality we introduce eighteen novel adversarial attacks, which we use to create ImageNet-UA, a new benchmark for evaluating model robustness against a wide range of unforeseen adversaries. We make use of our benchmark to identify a range of defense strategies which can help overcome this generalization gap, finding a rich space of techniques which can improve unforeseen robustness. 
We hope the greater variety and realism of ImageNetUA will make it a useful tool for those working on real-world worst-case robustness, enabling development of more robust defenses which can generalize beyond attacks seen during training.", "keywords": "ML safety;adversarial robustness;distribution shift;unforeseen adversaries", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/c91af6fcdaedf9a37c1218d1d8f5a8de3396e91c.zip", "author": "Maximilian Kaufmann;Daniel Kang;Yi Sun;Xuwang Yin;Steven Basart;Mantas Mazeika;Adam Dziedzic;Akul Arora;Franziska Boenisch;Tom B Brown;Abhinav Kommula;Oliver Zhang;Jacob Steinhardt;Dan Hendrycks", "authorids": "~Maximilian_Kaufmann1;~Daniel_Kang1;~Yi_Sun3;~Xuwang_Yin2;~Steven_Basart1;~Mantas_Mazeika3;~Adam_Dziedzic1;~Akul_Arora1;~Franziska_Boenisch2;~Tom_B_Brown1;~Abhinav_Kommula1;~Oliver_Zhang1;~Jacob_Steinhardt1;~Dan_Hendrycks1", "gender": ";;;;;;;;;;;;;", "homepage": ";;;;;;;;;;;;;", "dblp": ";;;;;;;;;;;;;", "google_scholar": ";;;;;;;;;;;;;", "orcid": ";;;;;;;;;;;;;", "linkedin": ";;;;;;;;;;;;;", "or_profile": ";;;;;;;;;;;;;", "aff": ";;;;;;;;;;;;;", "aff_domain": ";;;;;;;;;;;;;", "position": ";;;;;;;;;;;;;", "bibtex": "@misc{\nkaufmann2024evaluating,\ntitle={Evaluating Robustness to Unforeseen Adversarial Attacks},\nauthor={Maximilian Kaufmann and Daniel Kang and Yi Sun and Xuwang Yin and Steven Basart and Mantas Mazeika and Adam Dziedzic and Akul Arora and Franziska Boenisch and Tom B Brown and Abhinav Kommula and Oliver Zhang and Jacob Steinhardt and Dan Hendrycks},\nyear={2024},\nurl={https://openreview.net/forum?id=5TlHjMVrNG}\n}", "github": "", "project": "", "reviewers": "PXCR;Sze7;aca9;hiUg", "site": "https://openreview.net/forum?id=5TlHjMVrNG", "pdf_size": 10796350, "rating": "3;3;6;8", "confidence": "4;4;4;4", "soundness": "3;1;3;4", "contribution": "2;1;3;3", "presentation": "3;2;2;2", "wc_summary": "75;67;109;64", "wc_strengths": "88;64;101;78", "wc_weaknesses": "567;71;121;343", "wc_questions": "381;716;58;27", "wc_review": "1111;918;389;512", "wc_reply_reviewers": "265;464;0;20", "wc_reply_authors": "1312;2877;430;385", "reply_reviewers": "1;1;0;1", "reply_authors": "2;5;1;2", "rating_avg": [ 5.0, 2.1213203435596424 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.75, 1.0897247358851685 ], "contribution_avg": [ 2.25, 0.82915619758885 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 78.75, 17.92170471802278 ], "wc_strengths_avg": [ 82.75, 13.5531361684298 ], "wc_weaknesses_avg": [ 275.5, 196.98921290263587 ], "wc_questions_avg": [ 295.5, 279.56618178885657 ], "wc_review_avg": [ 732.5, 293.37902106319734 ], "wc_reply_reviewers_avg": [ 187.25, 190.8341884988117 ], "wc_reply_authors_avg": [ 1251.0, 1008.9095598714486 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 2.5, 1.5 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 14, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:yZsZf28pFSgJ:scholar.google.com/&scioq=Evaluating+Robustness+to+Unforeseen+Adversarial+Attacks&hl=en&as_sdt=0,5", "gs_version_total": 3 }, { "id": "5VD7dS3cZX", "title": "Rethinking the Solution to Curse of Dimensionality on Randomized Smoothing", "track": "main", "status": "Reject", "tldr": "", "abstract": "Randomized Smoothing (RS) is currently a scalable certified defense method providing robustness certification against adversarial examples. 
\nAlthough significant progress has been achieved in providing defenses against $\\ell_p$ adversaries,\nearly investigations found that RS suffers from the curse of dimensionality, indicating that the robustness guarantee offered by RS decays significantly with increasing input data dimension.\nDouble Sampling Randomized Smoothing (DSRS) is the state-of-the-art method that provides a theoretical solution to the curse of dimensionality under concentration assumptions on the base classifier.\nHowever, we speculate the solution to the curse of dimensionality can be deepened from the perspective of the smoothing distribution.\nIn this work, we further address the curse of dimensionality by theoretically showing that some Exponential General Gaussian (EGG) distributions with the exponent $\\eta$ can provide $\\Omega(\\sqrt{d})$ lower bounds for the $\\ell_2$ certified radius with tighter constant factors than DSRS.\nOur theoretical analysis shows that the lower bound improves with monotonically decreasing $\\eta \\in (0,2)$. Intriguingly, we observe a contrary phenomenon that EGG provides greater certified radii at larger $\\eta$, on real-world tasks. \nFurther investigations show these discoveries are not contradictory, which are in essence dependent on whether the assumption in DSRS absolutely holds. \nOur experiments on real-world datasets demonstrate that EGG distributions bring significant improvements for point-to-point certified accuracy, up to 4\\%-6\\% on ImageNet.\nFurthermore, we also report the performance of Exponential Standard Gaussian (ESG) distributions on DSRS.", "keywords": "Exponential Gaussian distribution;randomized smoothing;certified robustness;curse of dimensionality", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "Youwei Shu;Xi Xiao;Derui Wang;Yuxin Cao;Siji Chen;Jason Xue;Linyi Li;Bo Li", "authorids": "~Youwei_Shu1;~Xi_Xiao1;~Derui_Wang1;~Yuxin_Cao1;~Siji_Chen2;~Jason_Xue1;~Linyi_Li1;~Bo_Li19", "gender": "M;M;;;M;;M;F", "homepage": "https://github.com/tdano1;https://www.sigs.tsinghua.edu.cn/xx_en/main.htm;;;https://github.com/LostDriver;;http://linyil.com;http://boli.cs.illinois.edu/", "dblp": ";;;151/7989;;;99/4340-1.html;50/3402-26", "google_scholar": ";;;https://scholar.google.com/citations?hl=en;;;-b0sk-YAAAAJ;K8vJkTcAAAAJ", "orcid": ";;;0009-0002-5766-0846;;;;", "linkedin": ";;;;;;;", "or_profile": "~Youwei_Shu1;~Xi_Xiao1;~Derui_Wang1;~Yuxin_Cao1;~Siji_Chen2;~Jason_Xue1;~Linyi_Li1;~Bo_Li19", "aff": "Tsinghua University;Shenzhen International Graduate School, Tsinghua University;;Tsinghua University;;;Simon Fraser University;University of Illinois, Urbana Champaign", "aff_domain": "tsinghua.edu.cn;tsinghua.edu.cn;;mails.tsinghua.edu.cn;;;sfu.ca;illinois.edu", "position": "MS student;Associate Professor;;MS student;;;Assistant Professor;Assistant Professor", "bibtex": "@misc{\nshu2024rethinking,\ntitle={Rethinking the Solution to Curse of Dimensionality on Randomized Smoothing},\nauthor={Youwei Shu and Xi Xiao and Derui Wang and Yuxin Cao and Siji Chen and Jason Xue and Linyi Li and Bo Li},\nyear={2024},\nurl={https://openreview.net/forum?id=5VD7dS3cZX}\n}", "github": "", "project": "", "reviewers": "FGgM;Ba1f;Dgzf;2qpb", "site": "https://openreview.net/forum?id=5VD7dS3cZX", "pdf_size": 9707100, "rating": "1;5;5;8", "confidence": "4;4;4;3", "soundness": "1;2;3;3", "contribution": "1;2;3;3", "presentation": "1;2;2;3", "wc_summary": "80;33;49;113", "wc_strengths": "1;23;63;86", "wc_weaknesses": 
"561;139;391;23", "wc_questions": "88;74;6;59", "wc_review": "730;269;509;281", "wc_reply_reviewers": "2734;28;53;0", "wc_reply_authors": "2755;781;728;111", "reply_reviewers": "4;1;1;0", "reply_authors": "4;1;1;1", "rating_avg": [ 4.75, 2.48746859276655 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.25, 0.82915619758885 ], "contribution_avg": [ 2.25, 0.82915619758885 ], "presentation_avg": [ 2.0, 0.7071067811865476 ], "wc_summary_avg": [ 68.75, 30.629846555280032 ], "wc_strengths_avg": [ 43.25, 33.214266513051285 ], "wc_weaknesses_avg": [ 278.5, 210.47743346971902 ], "wc_questions_avg": [ 56.75, 31.04331651096577 ], "wc_review_avg": [ 447.25, 189.19087583707625 ], "wc_reply_reviewers_avg": [ 703.75, 1172.3153106140003 ], "wc_reply_authors_avg": [ 1093.75, 994.6274113958452 ], "reply_reviewers_avg": [ 1.5, 1.5 ], "reply_authors_avg": [ 1.75, 1.299038105676658 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": -0.7543365091413573, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:3EAuzBPf6zkJ:scholar.google.com/&scioq=Rethinking+the+Solution+to+Curse+of+Dimensionality+on+Randomized+Smoothing&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;0;1;2", "aff_unique_norm": "Tsinghua University;Simon Fraser University;University of Illinois Urbana-Champaign", "aff_unique_dep": ";;", "aff_unique_url": "https://www.tsinghua.edu.cn;https://www.sfu.ca;https://illinois.edu", "aff_unique_abbr": "THU;SFU;UIUC", "aff_campus_unique_index": "1;2", "aff_campus_unique": ";Shenzhen;Urbana-Champaign", "aff_country_unique_index": "0;0;0;1;2", "aff_country_unique": "China;Canada;United States" }, { "id": "5Vh0XqOTGi", "title": "GAN-based Vertical Federated Learning for Label Protection", "track": "main", "status": "Reject", "tldr": "", "abstract": "Split learning (splitNN) has emerged as a popular strategy for addressing the high computational costs and low modeling efficiency in Vertical Federated Learning (VFL). However, despite its popularity, vanilla splitNN lacks encryption protection, leaving it vulnerable to privacy leakage issues, especially Label Leakage from Gradients (LLG). Motivated by the LLG issue resulting from the use of labels during training, we propose the Generative Adversarial Federated Model (GAFM), a novel method designed specifically to enhance label privacy protection by integrating splitNN with Generative Adversarial Networks (GANs). GAFM leverages GANs to indirectly utilize label information by learning the label distribution rather than relying on explicit labels, thereby mitigating LLG. GAFM also employs an additional cross-entropy loss based on the noisy labels to further improve the prediction accuracy. Our ablation experiment demonstrates that the combination of GAN and the cross-entropy loss component is necessary to enable GAFM to mitigate LLG without significantly compromising the model utility. Empirical results on various datasets show that GAFM achieves a better and more robust trade-off between model utility and privacy compared to all baselines. In addition, we provide experimental justification to substantiate GAFM's superiority over splitNN, demonstrating that it offers enhanced label protection through gradient perturbation relative to splitNN. 
Codes of GAFM are available at [https://anonymous.4open.science/r/Generative-Adversarial-Federated-Model-BFF7/](https://anonymous.4open.science/r/Generative-Adversarial-Federated-Model-BFF7/).", "keywords": "Federated learning;Split learning", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/33f7f3ca497afbaa270d8d741eb14aed957e6c1c.zip", "author": "Yujin Han;Leying Guan", "authorids": "~Yujin_Han1;~Leying_Guan1", "gender": "F;", "homepage": "https://yujinhanml.github.io/;https://campuspress.yale.edu/lguan/research/", "dblp": "317/6852;", "google_scholar": "https://scholar.google.co.kr/citations?user=SxpbS5YAAAAJ;https://scholar.google.com/citations?hl=en", "orcid": ";", "linkedin": ";", "or_profile": "~Yujin_Han1;~Leying_Guan1", "aff": "the University of Hong Kong;Yale University", "aff_domain": "cs.hku.hk;yale.edu", "position": "PhD student;Assistant Professor", "bibtex": "@misc{\nhan2024ganbased,\ntitle={{GAN}-based Vertical Federated Learning for Label Protection},\nauthor={Yujin Han and Leying Guan},\nyear={2024},\nurl={https://openreview.net/forum?id=5Vh0XqOTGi}\n}", "github": "", "project": "", "reviewers": "ph6x;KHth;wbsE;vM2y", "site": "https://openreview.net/forum?id=5Vh0XqOTGi", "pdf_size": 1816895, "rating": "3;5;6;6", "confidence": "5;4;2;4", "soundness": "2;3;3;2", "contribution": "2;2;2;2", "presentation": "2;3;3;2", "wc_summary": "141;110;66;67", "wc_strengths": "15;36;15;103", "wc_weaknesses": "775;152;109;349", "wc_questions": "77;54;34;6", "wc_review": "1008;352;224;525", "wc_reply_reviewers": "836;95;0;0", "wc_reply_authors": "1582;1078;674;958", "reply_reviewers": "2;1;0;0", "reply_authors": "5;3;2;3", "rating_avg": [ 5.0, 1.224744871391589 ], "confidence_avg": [ 3.75, 1.0897247358851685 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 96.0, 31.47220996371243 ], "wc_strengths_avg": [ 42.25, 36.10661296770994 ], "wc_weaknesses_avg": [ 346.25, 263.55964694922477 ], "wc_questions_avg": [ 42.75, 26.10914590713377 ], "wc_review_avg": [ 527.25, 297.40492178173514 ], "wc_reply_reviewers_avg": [ 232.75, 350.4392779070291 ], "wc_reply_authors_avg": [ 1073.0, 328.45547643478255 ], "reply_reviewers_avg": [ 0.75, 0.82915619758885 ], "reply_authors_avg": [ 3.25, 1.0897247358851685 ], "replies_avg": [ 23, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.7492686492653551, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:dzv9pl0OZx0J:scholar.google.com/&scioq=GAN-based+Vertical+Federated+Learning+for+Label+Protection&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;1", "aff_unique_norm": "University of Hong Kong;Yale University", "aff_unique_dep": ";", "aff_unique_url": "https://www.hku.hk;https://www.yale.edu", "aff_unique_abbr": "HKU;Yale", "aff_campus_unique_index": "0", "aff_campus_unique": "Hong Kong SAR;", "aff_country_unique_index": "0;1", "aff_country_unique": "China;United States" }, { "id": "5WDOxf519p", "title": "Bridging the Domain Gap by Clustering-based Image-Text Graph Matching", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Learning domain-invariant representations is important to train a model that can generalize well to unseen target task domains. Text descriptions inherently contain semantic structures of concepts, and such auxiliary semantic cues can be used as effective pivot embedding for domain generalization problems. 
Here, we want to use (image-text) multimodal graph representations to get domain-invariant pivot embeddings by considering the inherent semantic structure between local images and text descriptors. Specifically, we aim to learn domain invariant features by (i) representing the image and text descriptions with graphs, and by (ii) clustering and matching the graph-based image node features into textual graphs simultaneously. We experiment with large-scale public datasets, such as CUB-DG and DomainBed, and our model achieves matched or better state-of-the-art performance on these datasets. Our code will be publicly available upon publication.", "keywords": "Domain Generalization;Multimodal Learning", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/29c65570338ee3c4b7ed7cd4c7713ac190dc28f4.zip", "author": "Nokyung Park;Daewon Chae;Jeongyong Shim;Sangpil Kim;Eun-Sol Kim;Jinkyu Kim", "authorids": "~Nokyung_Park1;~Daewon_Chae2;~Jeongyong_Shim2;~Sangpil_Kim4;~Eun-Sol_Kim1;~Jinkyu_Kim1", "gender": ";M;M;M;F;M", "homepage": "https://sites.google.com/view/nokyung-park;https://github.com/daewon88;https://hanyang-mllab.notion.site/Machine-Learning-Lab-1af963d60b934aeebc17abc6ca74bc0b;https://kuaicv.com/;;https://visionai.korea.ac.kr/", "dblp": "290/8702;354/4231;;182/2231;52/10086;", "google_scholar": "kvrypn8AAAAJ;OEa4E14AAAAJ;;mzH6yYgAAAAJ;JhZBnfYAAAAJ;", "orcid": ";;;0000-0002-7349-0018;;", "linkedin": "nokyungpark/;;jeongyong-shim-30b672215;spkim921;;", "or_profile": "~Nokyung_Park1;~Daewon_Chae2;~Jeongyong_Shim2;~Sangpil_Kim4;~Eun-Sol_Kim1;~Jinkyu_Kim1", "aff": "Korea University;Korea University;Hanyang University;Korea University;Hanyang University;Korea University", "aff_domain": "korea.ac.kr;korea.ac.kr;hanyang.ac.kr;korea.ac.kr;hanyang.ac.kr;korea.ac.kr", "position": "MS student;MS student;MS student;Assistant Professor;Assistant Professor;Assistant Professor", "bibtex": "@misc{\npark2024bridging,\ntitle={Bridging the Domain Gap by Clustering-based Image-Text Graph Matching},\nauthor={Nokyung Park and Daewon Chae and Jeongyong Shim and Sangpil Kim and Eun-Sol Kim and Jinkyu Kim},\nyear={2024},\nurl={https://openreview.net/forum?id=5WDOxf519p}\n}", "github": "", "project": "", "reviewers": "kUjy;1niQ;LvEJ", "site": "https://openreview.net/forum?id=5WDOxf519p", "pdf_size": 4974450, "rating": "3;5;5", "confidence": "5;5;4", "soundness": "2;3;3", "contribution": "2;3;2", "presentation": "2;3;3", "wc_summary": "55;51;42", "wc_strengths": "33;49;7", "wc_weaknesses": "217;131;173", "wc_questions": "4;125;3", "wc_review": "309;356;225", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "1549;796;1053", "reply_reviewers": "0;0;0", "reply_authors": "3;2;2", "rating_avg": [ 4.333333333333333, 0.9428090415820634 ], "confidence_avg": [ 4.666666666666667, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 49.333333333333336, 5.436502143433364 ], "wc_strengths_avg": [ 29.666666666666668, 17.30767331432956 ], "wc_weaknesses_avg": [ 173.66666666666666, 35.11251755270318 ], "wc_questions_avg": [ 44.0, 57.27710420985567 ], "wc_review_avg": [ 296.6666666666667, 54.18691929074971 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 1132.6666666666667, 312.5298207993741 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 
2.3333333333333335, 0.4714045207910317 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.4999999999999999, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=4104583030208793062&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 2, "aff_unique_index": "0;0;1;0;1;0", "aff_unique_norm": "Korea University;Hanyang University", "aff_unique_dep": ";", "aff_unique_url": "https://www.korea.ac.kr;https://www.hanyang.ac.kr", "aff_unique_abbr": "KU;HYU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "South Korea" }, { "id": "5XUlfPcQnG", "title": "A Calibrated Simulation for Offline Training of Reinforcement Learning Agents to Optimize Energy and Emission in Office Buildings", "track": "main", "status": "Reject", "tldr": "", "abstract": "Modern commercial Heating, Ventilation, and Air Conditioning (HVAC) systems form a complex and interconnected thermodynamic system with the building and outside weather conditions, and current setpoint control policies are not fully optimized for minimizing energy use and carbon emission. Given a suitable training environment, a Reinforcement Learning (RL) model is able to improve upon these policies, but training such a model, especially in a way that scales to thousands of buildings, presents many practical challenges. To address these challenges, we propose a novel simulation based approach, where a customized simulator is used to train the agent for each building. Our simulator is lightweight and calibrated with recorded data from the building to achieve sufficient fidelity. On a two-story, 68,000 square foot building, with 127 devices, we were able to calibrate our simulator to have just over half a degree of drift from the real world over a 6 hour period. We train an RL agent on this simulator and demonstrate that our agent is able to learn an improved policy. 
This approach is an important step toward having a real-world Reinforcement Learning control system that can be scaled to many buildings, allowing for greater efficiency and resulting in reduced energy consumption and carbon emissions.", "keywords": "HVAC;Reinforcement Learning;Simulation", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Judah Goldfeder;John Sipple", "authorids": "~Judah_Goldfeder1;sipple@google.com", "gender": ";", "homepage": ";", "dblp": ";", "google_scholar": ";", "orcid": ";", "linkedin": ";", "or_profile": "~Judah_Goldfeder1;sipple@google.com", "aff": ";", "aff_domain": ";", "position": ";", "bibtex": "@misc{\ngoldfeder2024a,\ntitle={A Calibrated Simulation for Offline Training of Reinforcement Learning Agents to Optimize Energy and Emission in Office Buildings},\nauthor={Judah Goldfeder and John Sipple},\nyear={2024},\nurl={https://openreview.net/forum?id=5XUlfPcQnG}\n}", "github": "", "project": "", "reviewers": "doaN;P7Wf;BrjB;ffyP", "site": "https://openreview.net/forum?id=5XUlfPcQnG", "pdf_size": 2438504, "rating": "1;1;3;5", "confidence": "5;5;4;4", "soundness": "2;2;3;3", "contribution": "1;1;2;2", "presentation": "1;1;1;2", "wc_summary": "80;83;36;71", "wc_strengths": "39;50;40;57", "wc_weaknesses": "265;240;228;191", "wc_questions": "9;103;262;55", "wc_review": "393;476;566;374", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 2.5, 1.6583123951777 ], "confidence_avg": [ 4.5, 0.5 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 1.5, 0.5 ], "presentation_avg": [ 1.25, 0.4330127018922193 ], "wc_summary_avg": [ 67.5, 18.714967272212903 ], "wc_strengths_avg": [ 46.5, 7.433034373659253 ], "wc_weaknesses_avg": [ 231.0, 26.67395733669828 ], "wc_questions_avg": [ 107.25, 95.32674073941688 ], "wc_review_avg": [ 452.25, 76.05384605659336 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 6, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.9045340337332909, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=7083121433027660792&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 0 }, { "id": "5ZWxBU9sYG", "title": "How to Craft Backdoors with Unlabeled Data Alone?", "track": "main", "status": "Reject", "tldr": "", "abstract": "Relying only on unlabeled data, Self-supervised learning (SSL) can learn rich features in an economical and scalable way. As the drive-horse for building foundation models, SSL has received a lot of attention recently with wide applications, which also raises security concerns where backdoor attack is a major type of threat: if the released dataset is maliciously poisoned, backdoored SSL models can behave badly when triggers are injected to test samples. The goal of this work is to investigate this potential risk. We notice that existing backdoors all require a considerable amount of *labeled* data that may not be available for SSL. To circumvent this limitation, we explore a more restrictive setting called no-label backdoors, where we only have access to the unlabeled data alone, where the key challenge is how to select the proper poison set without using label information. We propose two strategies for poison selection: clustering-based selection using pseudolabels, and contrastive selection derived from the mutual information principle. 
Experiments on CIFAR-10 and ImageNet-100 show that both no-label backdoors are effective on many SSL methods and outperform random poisoning by a large margin.", "keywords": "Backdoor Attack;Self-Supervised Learning;Deep Learning;Trustworthy Machine Learning", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "Yifei Wang;Wenhan Ma;Yisen Wang", "authorids": "~Yifei_Wang1;~Wenhan_Ma1;~Yisen_Wang1", "gender": "M;M;M", "homepage": "https://yifeiwang77.com;https://github.com/CuteNPC;https://yisenwang.github.io/", "dblp": "00/555-1;375/2887.html;172/1346-1", "google_scholar": "-CLy6YsAAAAJ;;uMWPDboAAAAJ", "orcid": ";0009-0003-3829-4008;", "linkedin": ";;", "or_profile": "~Yifei_Wang1;~Wenhan_Ma1;~Yisen_Wang1", "aff": "Massachusetts Institute of Technology;Peking University;Peking University", "aff_domain": "mit.edu;pku.edu.cn;pku.edu.cn", "position": "Postdoc;Undergrad student;Assistant Professor", "bibtex": "@misc{\nwang2024how,\ntitle={How to Craft Backdoors with Unlabeled Data Alone?},\nauthor={Yifei Wang and Wenhan Ma and Yisen Wang},\nyear={2024},\nurl={https://openreview.net/forum?id=5ZWxBU9sYG}\n}", "github": "", "project": "", "reviewers": "Dh81;gGhQ;yPHh;w1uC", "site": "https://openreview.net/forum?id=5ZWxBU9sYG", "pdf_size": 10906885, "rating": "3;3;5;6", "confidence": "4;4;4;4", "soundness": "2;2;2;3", "contribution": "2;2;2;2", "presentation": "3;2;3;2", "wc_summary": "112;82;104;184", "wc_strengths": "34;64;32;117", "wc_weaknesses": "104;299;308;256", "wc_questions": "38;352;4;291", "wc_review": "288;797;448;848", "wc_reply_reviewers": "93;0;0;39", "wc_reply_authors": "417;2552;1098;1798", "reply_reviewers": "1;0;0;1", "reply_authors": "1;4;2;3", "rating_avg": [ 4.25, 1.299038105676658 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 120.5, 38.27205246651922 ], "wc_strengths_avg": [ 61.75, 34.3247359785913 ], "wc_weaknesses_avg": [ 241.75, 81.92183774794118 ], "wc_questions_avg": [ 171.25, 152.2651880765922 ], "wc_review_avg": [ 595.25, 234.8780268564942 ], "wc_reply_reviewers_avg": [ 33.0, 38.1247950814165 ], "wc_reply_authors_avg": [ 1466.25, 794.5823981815857 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 2.5, 1.118033988749895 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=17304679836458820384&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 4, "aff_unique_index": "0;1;1", "aff_unique_norm": "Massachusetts Institute of Technology;Peking University", "aff_unique_dep": ";", "aff_unique_url": "https://web.mit.edu;http://www.pku.edu.cn", "aff_unique_abbr": "MIT;Peking U", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;1", "aff_country_unique": "United States;China" }, { "title": "ControlVideo: Training-free Controllable Text-to-video Generation", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19424", "id": "5a79AqFr0c", "author_site": "Yabo Zhang, Yuxiang Wei, Dongsheng jiang, XIAOPENG ZHANG, Wangmeng Zuo, Qi Tian", "tldr": "", "abstract": "Text-driven diffusion models have unlocked unprecedented abilities in image generation, whereas their video counterpart lags behind due to the excessive training cost.\nTo avert the training burden, we propose a training-free ControlVideo to produce 
high-quality videos based on the provided text prompts and motion sequences.\nSpecifically, ControlVideo adapts a pre-trained text-to-image model (i.e., ControlNet) for controllable text-to-video generation.\nTo generate continuous videos without the flicker effect, we propose an interleaved-frame smoother to smooth the intermediate frames.\nIn particular, the interleaved-frame smoother splits the whole video into successive three-frame clips, and stabilizes each clip by updating the middle frame with the interpolation of the other two frames in latent space.\nFurthermore, a fully cross-frame interaction mechanism has been exploited to further enhance the frame consistency, while a hierarchical sampler is employed to produce long videos efficiently.\nExtensive experiments demonstrate that our ControlVideo outperforms state-of-the-art methods both quantitatively and qualitatively. \nIt is worth noting that, thanks to these efficient designs, ControlVideo can generate both short and long videos within several minutes using one NVIDIA 2080Ti. \nCode and videos are available at [this link](https://github.com/YBYBZhang/ControlVideo).", "keywords": "Diffusion models;video generation", "primary_area": "generative models", "supplementary_material": "/attachment/b49b1e56aa6c7862445818bae866c218d23b9566.zip", "author": "Yabo Zhang;Yuxiang Wei;Dongsheng Jiang;XIAOPENG ZHANG;Wangmeng Zuo;Qi Tian", "authorids": "~Yabo_Zhang1;~Yuxiang_Wei1;~Dongsheng_Jiang2;~XIAOPENG_ZHANG7;~Wangmeng_Zuo3;~Qi_Tian3", "gender": "M;M;M;M;M;M", "homepage": "https://ybybzhang.github.io/;;https://sites.google.com/site/zxphistory/;;https://www.qitian1987.com/index.html;https://sites.google.com/site/dongshengjiangbme/", "dblp": "231/0624;47/8871-1;;93/2671;78/1467-1.html;85/8729", "google_scholar": "LnYDPdAAAAAJ;hORhL7YAAAAJ;Ud6aBAcAAAAJ;rUOpCEYAAAAJ;https://scholar.google.com/citations?hl=en;-eGIgsoAAAAJ", "orcid": ";0000-0002-8993-7195;;0000-0002-3330-783X;0000-0002-7252-5047;", "linkedin": ";;;;;", "or_profile": "~Yabo_Zhang1;~Yuxiang_Wei1;~XIAOPENG_ZHANG7;~Wangmeng_Zuo3;~Qi_Tian3;~Dongsheng_Jiang1", "aff": "Harbin Institute of Technology;Harbin Institute of Technology;Huawei Technologies Ltd.;Harbin Institute of Technology;Huawei Technologies Ltd.;Huawei Technologies Ltd.", "aff_domain": "hit.edu.cn;hit.edu.cn;huawei.com;hit.edu.cn;huawei.com;huawei.com", "position": "PhD student;PhD student;Principal Researcher;Full Professor;Principal Researcher;Principal Researcher", "bibtex": "@inproceedings{\nzhang2024controlvideo,\ntitle={ControlVideo: Training-free Controllable Text-to-video Generation},\nauthor={Yabo Zhang and Yuxiang Wei and Dongsheng Jiang and XIAOPENG ZHANG and Wangmeng Zuo and Qi Tian},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=5a79AqFr0c}\n}", "github": "", "project": "", "reviewers": "aLwG;XMqd;EvXG;HJ3a", "pdf_size": 27009780, "rating": "5;5;6;6", "confidence": "5;5;4;4", "soundness": "3;2;3;3", "contribution": "2;2;3;2", "presentation": "2;2;3;3", "wc_summary": "32;42;50;120", "wc_strengths": "36;48;30;66", "wc_weaknesses": "74;83;140;174", "wc_questions": "71;48;35;91", "wc_review": "213;221;255;451", "wc_reply_reviewers": "0;0;23;0", "wc_reply_authors": "431;647;552;928", "reply_reviewers": "0;0;1;0", "reply_authors": "3;3;3;4", "rating_avg": [ 5.5, 0.5 ], "confidence_avg": [ 4.5, 0.5 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.5, 0.5 ],
"wc_summary_avg": [ 61.0, 34.655446902326915 ], "wc_strengths_avg": [ 45.0, 13.74772708486752 ], "wc_weaknesses_avg": [ 117.75, 41.172654760168186 ], "wc_questions_avg": [ 61.25, 21.47527648250425 ], "wc_review_avg": [ 285.0, 97.12878049270464 ], "wc_reply_reviewers_avg": [ 5.75, 9.959292143521045 ], "wc_reply_authors_avg": [ 639.5, 183.31462025708697 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 3.25, 0.4330127018922193 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -1.0, "gs_citation": 271, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=2569088021339755098&as_sdt=5,47&sciodt=0,47&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=5a79AqFr0c", "pdf": "https://openreview.net/pdf?id=5a79AqFr0c", "email": "hit.edu.cn;hit.edu.cn;huawei.com;hit.edu.cn;huawei.com;huawei.com", "author_num": 6, "aff_unique_index": "0;0;1;0;1;1", "aff_unique_norm": "Harbin Institute of Technology;Huawei", "aff_unique_dep": ";Huawei Technologies", "aff_unique_url": "http://www.hit.edu.cn/;https://www.huawei.com", "aff_unique_abbr": "HIT;Huawei", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Harbin;", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "China" }, { "id": "5aHmaMFJns", "title": "Reason for Future, Act for Now: A Principled Architecture for Autonomous LLM Agents", "track": "main", "status": "Reject", "tldr": "", "abstract": "Large language models (LLMs) demonstrate impressive reasoning abilities, but translating reasoning into actions in the real world remains challenging. In particular, it remains unclear how to complete a given task provably within a minimum number of interactions with the external environment, e.g., through an internal mechanism of reasoning. To this end, we propose a principled framework with provable regret guarantees to orchestrate reasoning and acting, which we call \"reason for future, act for now\" ($\\texttt{RAFA}$). Specifically, we design a prompt template for reasoning that learns from the memory buffer and plans a future trajectory over a long horizon (\"reason for future\"). At each step, the LLM agent takes the initial action of the planned trajectory (\"act for now\"), stores the collected feedback in the memory buffer, and reinvokes the reasoning routine to replan the future trajectory from the new state. \n\nThe key idea is to cast reasoning in LLMs as learning and planning in Bayesian adaptive Markov decision processes (MDPs). Correspondingly, we prompt LLMs to form an updated posterior of the unknown environment from the memory buffer (learning) and generate an optimal trajectory for multiple future steps that maximizes a value function (planning). The learning and planning subroutines are performed in an \"in-context\" manner to emulate the actor-critic update for MDPs. Our theoretical analysis proves that the novel combination of long-term reasoning and short-term acting achieves a $\\sqrt{T}$ regret. In particular, the regret bound highlights an intriguing interplay between the prior knowledge obtained through pretraining and the uncertainty reduction achieved by reasoning and acting. Our empirical validation shows that it outperforms various existing frameworks and achieves nearly perfect scores on a few benchmarks. 
By incorporating \"classical\" MDP techniques, $\\texttt{RAFA}$ introduces the first autonomous LLM agent with provable regret guarantees.", "keywords": "Large language model", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/47b3fac881bf8fa45cb49687db5547bac199cd58.zip", "author": "Zhihan Liu;Hao Hu;Shenao Zhang;Hongyi Guo;Shuqi Ke;Boyi Liu;Zhaoran Wang", "authorids": "~Zhihan_Liu1;~Hao_Hu3;~Shenao_Zhang1;~Hongyi_Guo1;~Shuqi_Ke1;~Boyi_Liu1;~Zhaoran_Wang1", "gender": "M;M;M;M;;M;Not Specified", "homepage": ";https://mousehu.github.io;https://shenao-zhang.github.io/;https://gohsyi.github.io/;;;https://zhaoranwang.github.io/", "dblp": ";67/6924-6;253/4543.html;;;;117/2756", "google_scholar": "0VVg_R4AAAAJ;https://scholar.google.com/citations?hl=en;8NamuusAAAAJ;https://scholar.google.com/citations?hl=en;;1G8RH_YAAAAJ;https://scholar.google.com.tw/citations?user=HSx0BgQAAAAJ", "orcid": ";;;;;;", "linkedin": ";hao-hu-tsinghua;shenao-zhang-055a53178/;;;;", "or_profile": "~Zhihan_Liu1;~Hao_Hu3;~Shenao_Zhang1;~Hongyi_Guo1;~Shuqi_Ke1;~Boyi_Liu1;~Zhaoran_Wang1", "aff": "Northwestern University;Tsinghua University;Georgia Institute of Technology;Northwestern University, Northwestern University;;ByteDance Inc.;Northwestern University", "aff_domain": "northwestern.edu;tsinghua.edu.cn;gatech.edu;u.northwestern.edu;;bytedance.com;northwestern.edu", "position": "PhD student;PhD student;MS student;PhD student;;Researcher;Associate Professor", "bibtex": "@misc{\nliu2024reason,\ntitle={Reason for Future, Act for Now: A Principled Architecture for Autonomous {LLM} Agents},\nauthor={Zhihan Liu and Hao Hu and Shenao Zhang and Hongyi Guo and Shuqi Ke and Boyi Liu and Zhaoran Wang},\nyear={2024},\nurl={https://openreview.net/forum?id=5aHmaMFJns}\n}", "github": "", "project": "", "reviewers": "Aro2;3FoC;P2KV;n4NZ", "site": "https://openreview.net/forum?id=5aHmaMFJns", "pdf_size": 2856024, "rating": "3;5;5;6", "confidence": "4;4;3;3", "soundness": "2;3;2;3", "contribution": "1;2;2;2", "presentation": "3;4;3;1", "wc_summary": "66;76;58;289", "wc_strengths": "33;57;49;68", "wc_weaknesses": "156;444;251;657", "wc_questions": "22;119;66;177", "wc_review": "277;696;424;1191", "wc_reply_reviewers": "203;0;0;438", "wc_reply_authors": "1000;1354;1557;2028", "reply_reviewers": "1;0;0;2", "reply_authors": "2;4;3;6", "rating_avg": [ 4.75, 1.0897247358851685 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 2.75, 1.0897247358851685 ], "wc_summary_avg": [ 122.25, 96.48413081952907 ], "wc_strengths_avg": [ 51.75, 12.754901018824098 ], "wc_weaknesses_avg": [ 377.0, 192.0976314273552 ], "wc_questions_avg": [ 96.0, 58.02154772151464 ], "wc_review_avg": [ 647.0, 348.19750142699183 ], "wc_reply_reviewers_avg": [ 160.25, 180.50813693570714 ], "wc_reply_authors_avg": [ 1484.75, 371.6243903459513 ], "reply_reviewers_avg": [ 0.75, 0.82915619758885 ], "reply_authors_avg": [ 3.75, 1.479019945774904 ], "replies_avg": [ 26, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.6882472016116854, "gs_citation": 6, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=4081571305387143859&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 7, "aff_unique_index": "0;1;2;0;3;0", "aff_unique_norm": "Northwestern University;Tsinghua University;Georgia Institute of Technology;ByteDance", "aff_unique_dep": ";;;", "aff_unique_url": 
"https://www.northwestern.edu;https://www.tsinghua.edu.cn;https://www.gatech.edu;https://www.bytedance.com", "aff_unique_abbr": "NU;THU;Georgia Tech;ByteDance", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;0;0;1;0", "aff_country_unique": "United States;China" }, { "id": "5aayQBRGM1", "title": "Unsupervised Representation Learning to Aid Semi-Supervised Meta Learning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Few-shot learning or meta-learning leverages the data scarcity problem in machine learning. Traditionally, training data requires a multitude of samples and labeling for supervised learning. To address this issue, we propose a one-shot unsupervised meta-learning to learn the latent representation of the training samples. We use augmented samples as the query set during the training phase of the unsupervised meta-learning. A temperature-scaled cross-entropy loss is used in the inner loop of meta-learning to prevent overfitting during unsupervised learning. The learned parameters from this step are applied to the targeted supervised meta-learning in a transfer-learning fashion for initialization and fast adaptation with improved accuracy. The proposed method is model agnostic and can aid any meta-learning model to improve accuracy. We use model agnostic meta-learning (MAML) and relation network (RN) on Omniglot and mini-Imagenet datasets to demonstrate the performance of the proposed method. Furthermore, a meta-learning model with the proposed initialization can achieve satisfactory accuracy with significantly fewer training samples.", "keywords": "few-shot classification;meta-learning;machine learning;semi-supervised learning;unsupervised learning.", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "", "author": "Atik Faysal;Mohammad Rostami;huaxia wang;Avimanyu Sahoo;Ryan Antle", "authorids": "~Atik_Faysal1;~Mohammad_Rostami2;~huaxia_wang1;~Avimanyu_Sahoo1;~Ryan_Antle1", "gender": "M;M;M;M;", "homepage": "https://github.com/atik666;https://sites.google.com/view/woreom;https://sites.google.com/view/huaxia-wang;https://sites.google.com/uah.edu/accl;https://www.bakerhughes.com", "dblp": "299/1517;;40/10246;150/4130;", "google_scholar": "tHtILuYAAAAJ;Md81vrUAAAAJ;fna2KGYAAAAJ;0h-0qjIAAAAJ;", "orcid": "0000-0001-6569-4371;;;0000-0001-6113-3278;", "linkedin": "atik-faysal-64b809132/;woreom/;;avimanyu-sahoo-26a55731/;", "or_profile": "~Atik_Faysal1;~Mohammad_Rostami2;~huaxia_wang1;~Avimanyu_Sahoo1;~Ryan_Antle1", "aff": "Rowan University;Rowan College;Rowan University;University of Alabama at Huntsville;", "aff_domain": "rowan.edu;rowan.edu;rowan.edu;uah.edu;", "position": "PhD student;PhD student;Assistant Professor;Assistant Professor;", "bibtex": "@misc{\nfaysal2024unsupervised,\ntitle={Unsupervised Representation Learning to Aid Semi-Supervised Meta Learning},\nauthor={Atik Faysal and Mohammad Rostami and huaxia wang and Avimanyu Sahoo and Ryan Antle},\nyear={2024},\nurl={https://openreview.net/forum?id=5aayQBRGM1}\n}", "github": "", "project": "", "reviewers": "8qJe;vJfx;SMhQ;fvcV", "site": "https://openreview.net/forum?id=5aayQBRGM1", "pdf_size": 1180038, "rating": "1;3;3;3", "confidence": "4;4;3;4", "soundness": "1;1;1;1", "contribution": "1;1;1;1", "presentation": "1;1;1;2", "wc_summary": "44;48;42;85", "wc_strengths": "9;6;6;16", "wc_weaknesses": "181;101;47;117", "wc_questions": "26;447;2;24", "wc_review": "260;602;97;242", "wc_reply_reviewers": "0;0;0;0", 
"wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 2.5, 0.8660254037844386 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 1.0, 0.0 ], "contribution_avg": [ 1.0, 0.0 ], "presentation_avg": [ 1.25, 0.4330127018922193 ], "wc_summary_avg": [ 54.75, 17.597940220378067 ], "wc_strengths_avg": [ 9.25, 4.085033659592048 ], "wc_weaknesses_avg": [ 111.5, 47.778133073614335 ], "wc_questions_avg": [ 124.75, 186.28925760762482 ], "wc_review_avg": [ 300.25, 185.32184841512887 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.3333333333333333, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:_Fyw0kU6WYQJ:scholar.google.com/&scioq=Unsupervised+Representation+Learning+to+Aid+Semi-Supervised+Meta+Learning&hl=en&as_sdt=0,5", "gs_version_total": 3, "aff_unique_index": "0;1;0;2", "aff_unique_norm": "Rowan University;Rowan College;University of Alabama in Huntsville", "aff_unique_dep": ";;", "aff_unique_url": "https://www.rowan.edu;https://www.rowan.edu;https://www.uah.edu", "aff_unique_abbr": "Rowan;;UAH", "aff_campus_unique_index": "1", "aff_campus_unique": ";Huntsville", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "id": "5abK7RDbuW", "title": "Text to Image for Multi-Label Image Recognition with Joint Prompt-Adapter Learning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Benefited from image-text contrastive learning, pre-trained vision-language models, e.g., CLIP, allow to directly leverage texts as images (TaI) for parameter-efficient fine-tuning (PEFT). While CLIP is capable of making image feature to be similar with the corresponding text features, modality gap remains a nontrivial issue and limits the MLR performance of TaI. Using multi-label image recognition (MLR) as an example, we present a novel method, called T2I-PAL to tackle the modality gap issue when using only text captions for PEFT. The core design of T2I-PAL is to leverage pretrained text-to-image generation models to generate photo-realistic and diverse images from text captions, thereby being beneficial for reducing modality gap. For better PEFT, we further combine both prompt tuning and adapter learning for enhancing classification performance. Extensive experiments on multiple benchmarks, including MS-COCO, VOC2007, and NUS- WIDE, show that our T2I-PAL can boost recognition performance by 3.47% in average above the top-ranked state-of-the-art methods. 
Our code and models will be made publicly available.", "keywords": "Multi-Label Image Recognition;Text to Image;Parameter-Efficient Fine-Tuning", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/d34dc0106659b2614543b24d35056e07a3899838.pdf", "author": "Chun-Mei Feng;Kai Yu;Xinxing Xu;Yong Liu;Salman Khan;Wangmeng Zuo;Rick Siow Mong Goh", "authorids": "~Chun-Mei_Feng1;~Kai_Yu7;~Xinxing_Xu1;~Yong_Liu10;~Salman_Khan4;~Wangmeng_Zuo3;~Rick_Siow_Mong_Goh1", "gender": "F;M;M;M;M;M;", "homepage": "https://scholar.google.com.hk/citations?user=g2nqHBcAAAAJ&hl=zh-CN;;https://sites.google.com/site/xinxingxu666/;;https://salman-h-khan.github.io/;;https://sites.google.com/view/rickgoh/home", "dblp": "182/8416-1;197/1322-9;15/10654;29/4867-26;32/11535-1;93/2671;https://dblp.uni-trier.de/pers/g/Goh:Rick_Siow_Mong", "google_scholar": "https://scholar.google.com.hk/citations?user=g2nqHBcAAAAJ;https://scholar.google.com.hk/citations?user=gVyOSpEAAAAJ;https://scholar.google.com.sg/citations?user=neFbpuEAAAAJ;QujHYk0AAAAJ;https://scholar.google.es/citations?user=M59O9lkAAAAJ;rUOpCEYAAAAJ;https://scholar.google.com.sg/citations?user=fBsBJjoAAAAJ", "orcid": "0000-0002-3044-9779;;0000-0003-1449-3072;;0000-0002-9502-1749;0000-0002-3330-783X;0000-0001-9116-1595", "linkedin": "https://linkedin.com/in/chunmei-feng-719a72229;;;liuyongsg;;;rickgoh/", "or_profile": "~Chun-Mei_Feng1;~Kai_Yu7;~Xinxing_Xu1;~Yong_Liu10;~Salman_Khan4;~Wangmeng_Zuo3;~Rick_Siow_Mong_Goh1", "aff": "IHPC;;Institute of High Performance Computing;Institute of High Performance Computing, Singapore, A*STAR;Australian National University;Harbin Institute of Technology;Institute of High Performance Computing, Singapore, A*STAR", "aff_domain": "astar.edu.sg;;ihpc.a-star.edu.sg;ihpc.a-star.edu.sg;anu.edu.au;hit.edu.cn;ihpc.a-star.edu.sg", "position": "Researcher;;Scientist;Senior Scientist, Adjunct Assistant Professor;Lecturer;Full Professor;Director", "bibtex": "@misc{\nfeng2024text,\ntitle={Text to Image for Multi-Label Image Recognition with Joint Prompt-Adapter Learning},\nauthor={Chun-Mei Feng and Kai Yu and Xinxing Xu and Yong Liu and Salman Khan and Wangmeng Zuo and Rick Siow Mong Goh},\nyear={2024},\nurl={https://openreview.net/forum?id=5abK7RDbuW}\n}", "github": "", "project": "", "reviewers": "GRDf;oaxK;M37Z;U89w", "site": "https://openreview.net/forum?id=5abK7RDbuW", "pdf_size": 1818597, "rating": "3;5;6;6", "confidence": "4;3;2;4", "soundness": "2;3;3;3", "contribution": "2;2;3;2", "presentation": "2;1;3;3", "wc_summary": "53;119;53;67", "wc_strengths": "9;95;74;43", "wc_weaknesses": "55;539;54;39", "wc_questions": "15;65;27;67", "wc_review": "132;818;208;216", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 5.0, 1.224744871391589 ], "confidence_avg": [ 3.25, 0.82915619758885 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.25, 0.82915619758885 ], "wc_summary_avg": [ 73.0, 27.16615541441225 ], "wc_strengths_avg": [ 55.25, 32.48364973336586 ], "wc_weaknesses_avg": [ 171.75, 212.12658367116555 ], "wc_questions_avg": [ 43.5, 22.907422377910613 ], "wc_review_avg": [ 343.5, 275.90714017582076 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 7, 0 ], 
"corr_rating_confidence": -0.4923659639173309, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=15791932118392428322&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 0, "aff_unique_index": "0;0;0;1;2;0", "aff_unique_norm": "Institute of High Performance Computing;Australian National University;Harbin Institute of Technology", "aff_unique_dep": ";;", "aff_unique_url": "https://www.ihpc.a-star.edu.sg;https://www.anu.edu.au;http://www.hit.edu.cn/", "aff_unique_abbr": "IHPC;ANU;HIT", "aff_campus_unique_index": "1", "aff_campus_unique": ";Harbin", "aff_country_unique_index": "0;0;0;1;2;0", "aff_country_unique": "Singapore;Australia;China" }, { "title": "Certified Adversarial Robustness for Rate Encoded Spiking Neural Networks", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19423", "id": "5bNYf0CqxY", "author_site": "Bhaskar Mukhoty, Hilal AlQuabeh, Giulia De Masi, Huan Xiong, Bin Gu", "tldr": "", "abstract": "The spiking neural networks are inspired by the biological neurons that employ binary spikes to propagate information in the neural network. It has garnered considerable attention as the next-generation neural network, as the spiking activity simplifies the computation burden of the network to a large extent and is known for its low energy deployment enabled by specialized neuromorphic hardware. One popular technique to feed a static image to such a network is rate encoding, where each pixel is encoded into random binary spikes, following a Bernoulli distribution that uses the pixel intensity as bias. By establishing a novel connection between rate-encoding and randomized smoothing, we give the first provable robustness guarantee for spiking neural networks against adversarial perturbation of inputs bounded under $l_1$-norm. We introduce novel adversarial training algorithms for rate-encoded models that significantly improve the state-of-the-art empirical robust accuracy result. Experimental validation of the method is performed across various static image datasets, including CIFAR-10, CIFAR-100 and ImageNet-100. 
The code is available at \\url{https://github.com/BhaskarMukhoty/CertifiedSNN}.", "keywords": "Spiking Neural Networks;Randomized Smoothing;Adversarial Learning;Certified Robustness", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Bhaskar Mukhoty;Hilal AlQuabeh;Giulia De Masi;Huan Xiong;Bin Gu", "authorids": "~Bhaskar_Mukhoty1;~Hilal_AlQuabeh1;~Giulia_De_Masi1;~Huan_Xiong1;~Bin_Gu1", "gender": "M;M;;M;M", "homepage": ";;;https://scholar.google.com/citations?user=l4hm14MAAAAJ&hl=en;https://mbzuai.ac.ae/study/faculty/bin-gu/", "dblp": "166/1438;299/8316;147/8719;;29/1758-1", "google_scholar": "https://scholar.google.co.in/citations?user=lJglnOQAAAAJ;_vbkrqMAAAAJ;G1K5hX0AAAAJ;l4hm14MAAAAJ;Vo8OgCgAAAAJ", "orcid": "0000-0002-8594-980X;;0000-0003-3284-880X;;0000-0001-6049-1815", "linkedin": ";hilal-alquabeh-388a8a134/;;;", "or_profile": "~Bhaskar_Mukhoty1;~Hilal_AlQuabeh1;~Giulia_De_Masi1;~Huan_Xiong1;~Bin_Gu1", "aff": "Mohamed bin Zayed University of Artificial Intelligence;Mohamed bin Zayed University of Artificial Intelligence;Technology Innovation Institute;Harbin Institute of Technology;Mohamed bin Zayed University of Artificial Intelligence", "aff_domain": "mbzuai.ac.ae;mbzuai.ac.ae;tii.ae;hit.edu.cn;mbzuai.ac.ae", "position": "Postdoc;PhD student;Principal Researcher;Full Professor;Assistant Professor", "bibtex": "@inproceedings{\nmukhoty2024certified,\ntitle={Certified Adversarial Robustness for Rate Encoded Spiking Neural Networks},\nauthor={Bhaskar Mukhoty and Hilal AlQuabeh and Giulia De Masi and Huan Xiong and Bin Gu},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=5bNYf0CqxY}\n}", "github": "", "project": "", "reviewers": "NxbL;wpSa;FaRA;77u8", "pdf_size": 437892, "rating": "5;6;8;8", "confidence": "4;3;3;3", "soundness": "3;2;2;3", "contribution": "2;2;2;3", "presentation": "3;2;2;2", "wc_summary": "41;30;25;84", "wc_strengths": "42;11;25;128", "wc_weaknesses": "150;97;149;484", "wc_questions": "118;4;3;166", "wc_review": "351;142;202;862", "wc_reply_reviewers": "0;44;27;144", "wc_reply_authors": "783;467;572;901", "reply_reviewers": "0;1;1;1", "reply_authors": "2;2;2;3", "rating_avg": [ 6.75, 1.299038105676658 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 45.0, 23.24865587512534 ], "wc_strengths_avg": [ 51.5, 45.510987684294435 ], "wc_weaknesses_avg": [ 220.0, 153.92043399107214 ], "wc_questions_avg": [ 72.75, 71.29998246844104 ], "wc_review_avg": [ 389.25, 283.35082053878017 ], "wc_reply_reviewers_avg": [ 53.75, 54.41679428264771 ], "wc_reply_authors_avg": [ 680.75, 170.64638144420175 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 2.25, 0.4330127018922193 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.7777777777777777, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=9706469649419747137&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 2, "openreview": "https://openreview.net/forum?id=5bNYf0CqxY", "pdf": "https://openreview.net/pdf?id=5bNYf0CqxY", "email": "mbzuai.ac.ae;mbzuai.ac.ae;tii.ae;hit.edu.cn;mbzuai.ac.ae", "author_num": 5, "aff_unique_index": "0;0;1;2;0", "aff_unique_norm": "Mohamed bin Zayed University of Artificial 
Intelligence;Technology Innovation Institute;Harbin Institute of Technology", "aff_unique_dep": ";;", "aff_unique_url": "https://mbzuai.ac.ae;;http://www.hit.edu.cn/", "aff_unique_abbr": "MBZUAI;;HIT", "aff_campus_unique_index": "1", "aff_campus_unique": ";Harbin", "aff_country_unique_index": "0;0;2;0", "aff_country_unique": "United Arab Emirates;;China" }, { "title": "Structured Video-Language Modeling with Temporal Grouping and Spatial Grounding", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19422", "id": "5dlfiJIXoh", "author_site": "Yuanhao Xiong, Long Zhao, Boqing Gong, Ming-Hsuan Yang, Florian Schroff, Ting Liu, Cho-Jui Hsieh, Liangzhe Yuan", "tldr": "", "abstract": "Existing video-language pre-training methods primarily focus on instance-level alignment between video clips and captions via global contrastive learning but neglect rich fine-grained local information in both videos and text, which is of importance to downstream tasks requiring temporal localization and semantic reasoning. A powerful model is expected to be capable of capturing region-object correspondences and recognizing scene changes in a video clip, reflecting spatial and temporal granularity, respectively. To strengthen model's understanding into such fine-grained details, we propose a simple yet effective video-language modeling framework, S-ViLM, by exploiting the intrinsic structures of these two modalities. It includes two novel designs, inter-clip spatial grounding and intra-clip temporal grouping, to promote learning region-object alignment and temporal-aware features, simultaneously. Comprehensive evaluations demonstrate that S-ViLM performs favorably against existing approaches in learning more expressive representations. Specifically, S-ViLM surpasses the state-of-the-art methods substantially on four representative downstream tasks, covering text-video retrieval, video question answering, video action recognition, and temporal action localization.", "keywords": "multi-modal learning;video and language", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Yuanhao Xiong;Long Zhao;Boqing Gong;Ming-Hsuan Yang;Florian Schroff;Ting Liu;Cho-Jui Hsieh;Liangzhe Yuan", "authorids": "~Yuanhao_Xiong1;~Long_Zhao2;~Boqing_Gong1;~Ming-Hsuan_Yang1;~Florian_Schroff1;~Ting_Liu4;~Cho-Jui_Hsieh1;~Liangzhe_Yuan2", "gender": "M;M;M;M;M;;M;M", "homepage": "https://xyh97.github.io/;http://garyzhao.github.io/;http://boqinggong.info;https://faculty.ucmerced.edu/mhyang/;;http://tliu.org;http://web.cs.ucla.edu/~chohsieh/index.html;https://yuanliangzhe.github.io", "dblp": "232/1248;31/5383-3;29/7457;79/3711.html;52/5594;52/5150-5;14/2770;215/4356", "google_scholar": "DVKxiMkAAAAJ;YTyBTmgAAAAJ;lv9ZeVUAAAAJ;p9-ohHsAAAAJ;eWbZJlMAAAAJ;4wSfAIQAAAAJ;Wy89g4IAAAAJ;1H9CkZgAAAAJ", "orcid": ";0000-0001-8921-8564;;0000-0003-4848-2304;;;;", "linkedin": ";garyzhao9012/;boqing-gong-46aa5821/;minghsuanyang/;florianschroff;;;", "or_profile": "~Yuanhao_Xiong1;~Long_Zhao2;~Boqing_Gong1;~Ming-Hsuan_Yang1;~Florian_Schroff1;~Ting_Liu4;~Cho-Jui_Hsieh1;~Liangzhe_Yuan2", "aff": "University of California, Los Angeles;Google DeepMind;Google;University of California at Merced;Google;Google DeepMind;University of California, Los Angeles;Google DeepMind", "aff_domain": "cs.ucla.edu;google.com;google.com;umcerced.edu;google.com;google.com;ucla.edu;google.com", "position": "PhD student;Research scientist;Research 
Scientist;Professor;SWE;Researcher;Associate Professor;Researcher", "bibtex": "@inproceedings{\nxiong2024structured,\ntitle={Structured Video-Language Modeling with Temporal Grouping and Spatial Grounding},\nauthor={Yuanhao Xiong and Long Zhao and Boqing Gong and Ming-Hsuan Yang and Florian Schroff and Ting Liu and Cho-Jui Hsieh and Liangzhe Yuan},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=5dlfiJIXoh}\n}", "github": "", "project": "", "reviewers": "7b3w;Dxbj;tkWv;adH9", "pdf_size": 7466392, "rating": "6;6;6;8", "confidence": "5;4;5;4", "soundness": "3;3;2;3", "contribution": "2;2;3;3", "presentation": "3;3;3;2", "wc_summary": "130;56;136;158", "wc_strengths": "50;48;119;145", "wc_weaknesses": "54;7;165;217", "wc_questions": "106;5;86;12", "wc_review": "340;116;506;532", "wc_reply_reviewers": "275;0;57;25", "wc_reply_authors": "1921;320;931;646", "reply_reviewers": "2;0;1;1", "reply_authors": "5;2;3;2", "rating_avg": [ 6.5, 0.8660254037844386 ], "confidence_avg": [ 4.5, 0.5 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 120.0, 38.39270764090493 ], "wc_strengths_avg": [ 90.5, 42.51176307799995 ], "wc_weaknesses_avg": [ 110.75, 83.98921061660242 ], "wc_questions_avg": [ 52.25, 44.38679420728647 ], "wc_review_avg": [ 373.5, 165.91187419832252 ], "wc_reply_reviewers_avg": [ 89.25, 109.12922385868966 ], "wc_reply_authors_avg": [ 954.5, 598.4223007208204 ], "reply_reviewers_avg": [ 1.0, 0.7071067811865476 ], "reply_authors_avg": [ 3.0, 1.224744871391589 ], "replies_avg": [ 23, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:t6X5vmToUokJ:scholar.google.com/&scioq=Structured+Video-Language+Modeling+with+Temporal+Grouping+and+Spatial+Grounding&hl=en&as_sdt=0,5", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=5dlfiJIXoh", "pdf": "https://openreview.net/pdf?id=5dlfiJIXoh", "email": "cs.ucla.edu;google.com;google.com;umcerced.edu;google.com;google.com;ucla.edu;google.com", "author_num": 8, "aff_unique_index": "0;1;1;2;1;1;0;1", "aff_unique_norm": "University of California, Los Angeles;Google;University of California, Merced", "aff_unique_dep": ";Google DeepMind;", "aff_unique_url": "https://www.ucla.edu;https://deepmind.com;https://www.ucmerced.edu", "aff_unique_abbr": "UCLA;DeepMind;UC Merced", "aff_campus_unique_index": "0;2;3;2;0", "aff_campus_unique": "Los Angeles;;Mountain View;Merced", "aff_country_unique_index": "0;1;0;0;0;1;0;1", "aff_country_unique": "United States;United Kingdom" }, { "id": "5e0yWSNGIc", "title": "Exposing the Silent Hidden Impact of Certified Training in Reinforcement Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "Deep reinforcement learning research has enabled reaching significant performance levels for sequential decision making in MDPs with highly complex observations and state dynamics with the aid of deep neural networks. However, this aid came with a cost that is inherent to deep neural networks which have increased volatilities towards indistinguishable peculiarly crafted non-robust directions. To alleviate these volatilities several studies suggested techniques to cope with this problem via explicitly regulating the temporal difference loss for the worst-case sensitivity. 
In our study, we show that these certified training techniques come with a cost that intriguingly causes inconsistencies and overestimations in the value functions. Furthermore, our results essentially demonstrate that vanilla trained deep reinforcement learning policies have more accurate and consistent estimates for the state-action values. We believe our results reveal foundational intrinsic properties of the certified Lipschitz training techniques and demonstrate the need to rethink the approach to resilience in deep reinforcement learning.", "keywords": "Decision Boundary Stability;Volatility;Rigorous Analysis;Reinforcement Learning", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/f80ad8557c8521b7d47f7992edef9e68eab7dfb4.zip", "author": "Ezgi Korkmaz", "authorids": "~Ezgi_Korkmaz2", "gender": "", "homepage": "https://ezgikorkmaz.github.io/", "dblp": "300/7830.html", "google_scholar": "", "orcid": "", "linkedin": "", "or_profile": "~Ezgi_Korkmaz2", "aff": "University College London, University of London", "aff_domain": "ucl.ac.uk", "position": "PhD student", "bibtex": "@misc{\nkorkmaz2024exposing,\ntitle={Exposing the Silent Hidden Impact of Certified Training in Reinforcement Learning},\nauthor={Ezgi Korkmaz},\nyear={2024},\nurl={https://openreview.net/forum?id=5e0yWSNGIc}\n}", "github": "", "project": "", "reviewers": "JDGz;KcnX;yyyH", "site": "https://openreview.net/forum?id=5e0yWSNGIc", "pdf_size": 1988271, "rating": "5;5;6", "confidence": "3;3;3", "soundness": "3;3;3", "contribution": "2;2;3", "presentation": "3;3;3", "wc_summary": "80;46;41", "wc_strengths": "106;66;187", "wc_weaknesses": "458;163;294", "wc_questions": "184;54;50", "wc_review": "828;329;572", "wc_reply_reviewers": "567;62;207", "wc_reply_authors": "851;722;1042", "reply_reviewers": "1;1;1", "reply_authors": "3;2;2", "rating_avg": [ 5.333333333333333, 0.4714045207910317 ], "confidence_avg": [ 3.0, 0.0 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 55.666666666666664, 17.326921891156037 ], "wc_strengths_avg": [ 119.66666666666667, 50.33443707399096 ], "wc_weaknesses_avg": [ 305.0, 120.68416079447488 ], "wc_questions_avg": [ 96.0, 62.24682053459973 ], "wc_review_avg": [ 576.3333333333334, 203.7389397134371 ], "wc_reply_reviewers_avg": [ 278.6666666666667, 212.3021955190813 ], "wc_reply_authors_avg": [ 871.6666666666666, 131.45425904938273 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 2.3333333333333335, 0.4714045207910317 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 1, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:YhN2TYHRaK0J:scholar.google.com/&scioq=Exposing+the+Silent+Hidden+Impact+of+Certified+Training+in+Reinforcement+Learning&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0", "aff_unique_norm": "University College London", "aff_unique_dep": "", "aff_unique_url": "https://www.ucl.ac.uk", "aff_unique_abbr": "UCL", "aff_country_unique_index": "0", "aff_country_unique": "United Kingdom" }, { "id": "5eLgTLusaR", "title": "Loco3D: Indoor Multiuser Locomotion 3D Dataset", "track": "main", "status": "Reject", "tldr": "", "abstract": "In the context of human-AI interaction, modeling human actions is a critical and challenging endeavor, with locomotion being a particularly fundamental behavior for AI agents to understand. 
Modeling human trajectories in complex indoor scenes, such as the home environment, requires an understanding of how humans interact with their surroundings and other humans. These interactions are influenced by a range of factors, including the geometry and semantics of the scene, the socio-cultural context, and the task each human needs to perform. Previous research has shared datasets containing human motion and scene structure in indoor scenes, but these datasets are limited in scale due to the difficulty and time required to collect data at different locations. To solve the scale problem, we propose to use a virtual reality (VR) system to build a human motion dataset. Specifically, we present Loco3D, a dataset of multi-person interactions in over 100 different indoor VR scenes, including 3D body pose data and highly accurate spatial information. The dataset can be used for building AI agents that operate in indoor environments, such as home robots, or to create virtual avatars for games or animations that mimic human movement and posture. With an initial evaluation, we demonstrate that models trained with our dataset have improved multi-person trajectory synthesis performance on real-world data.", "keywords": "Human trajectory synthesis;Indoor;Dataset;Multi-user;3D;Virtual reality", "primary_area": "datasets and benchmarks", "supplementary_material": "/attachment/463ae5689dcf0be65b0ca8c5e0a2a085a7b507fa.zip", "author": "Kojiro Takeyama;Yimeng Liu;Misha Sra", "authorids": "~Kojiro_Takeyama1;~Yimeng_Liu1;~Misha_Sra1", "gender": "M;;F", "homepage": ";;https://sites.cs.ucsb.edu/~sra", "dblp": ";;119/4545", "google_scholar": "TRtprtgAAAAJ;hROpwCcAAAAJ;yDkV9BsAAAAJ", "orcid": ";0000-0002-6742-2908;0000-0001-8154-8518", "linkedin": ";yimeng-liu-1a857a172/;mishasra", "or_profile": "~Kojiro_Takeyama1;~Yimeng_Liu1;~Misha_Sra1", "aff": "Toyota Motor North America;University of California, Santa Barbara;University of California, Santa Barbara", "aff_domain": "toyota.com;ucsb.edu;ucsb.edu", "position": "Researcher;PhD student;Assistant Professor", "bibtex": "@misc{\ntakeyama2024locod,\ntitle={Loco3D: Indoor Multiuser Locomotion 3D Dataset},\nauthor={Kojiro Takeyama and Yimeng Liu and Misha Sra},\nyear={2024},\nurl={https://openreview.net/forum?id=5eLgTLusaR}\n}", "github": "", "project": "", "reviewers": "v7u4;EhxJ;Zavr;Yanw", "site": "https://openreview.net/forum?id=5eLgTLusaR", "pdf_size": 19739885, "rating": "3;5;5;5", "confidence": "3;5;3;2", "soundness": "3;2;2;3", "contribution": "2;2;3;3", "presentation": "3;3;3;2", "wc_summary": "140;36;56;40", "wc_strengths": "78;52;115;26", "wc_weaknesses": "211;193;210;147", "wc_questions": "116;86;148;95", "wc_review": "545;367;529;308", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "1333;1001;1402;952", "reply_reviewers": "0;0;0;0", "reply_authors": "2;2;2;2", "rating_avg": [ 4.5, 0.8660254037844386 ], "confidence_avg": [ 3.25, 1.0897247358851685 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 68.0, 42.23742416388575 ], "wc_strengths_avg": [ 67.75, 32.89661836724255 ], "wc_weaknesses_avg": [ 190.25, 25.974747351995553 ], "wc_questions_avg": [ 111.25, 23.84716964337697 ], "wc_review_avg": [ 437.25, 102.06462413588756 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 1172.0, 197.77638888401214 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 2.0, 0.0 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 
0.13245323570650439, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:oO1oLZ5fgQMJ:scholar.google.com/&scioq=Loco3D:+Indoor+Multiuser+Locomotion+3D+Dataset&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1;1", "aff_unique_norm": "Toyota Motor Corporation;University of California, Santa Barbara", "aff_unique_dep": ";", "aff_unique_url": "https://www.toyota.com;https://www.ucsb.edu", "aff_unique_abbr": "Toyota;UCSB", "aff_campus_unique_index": "1;1", "aff_campus_unique": ";Santa Barbara", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "5elND8cf8r", "title": "Contrastive Implicit Representation Learning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Implicit Neural Representations have emerged as an interesting alternative to traditional array representations. The challenge of performing downstream tasks directly on implicit representations has been addressed by several methods. Overcoming this challenge would open the door to the application of implicit representations to a wide range of fields. Then again, self-supervised representation learning methods, such as the several contrastive learning frameworks which have been proven powerful representation learning methods. So far, the use of self-supervised learning for implicit representations has remained unexplored, mostly because of the difficulty of producing valid augmented views of implicit representations to be used for learning contrasts. In this work, we adapt the popular SimCLR algorithm to implicit representations that consist of multiplicative filters networks and SIRENs. While methods to obtain augmentations in SIREN have been studied in the literature, we provide methods for augmenting MFNs effectively. We show how MFNs lend themselves well to geometric augmentations. To the best of our knowledge, our work is the first to demonstrate that self-supervised learning on implicit representations of images is feasible and results in good downstream task performances.", "keywords": "Implicit neural representations;self-supervised-learning;contrastive learning;neural fields;multiplicative filter networks;SimCLR", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Riccardo Valperga;Samuele Papa;David W. 
Romero;Miltiadis Kofinas;Jan-jakob Sonke;Efstratios Gavves", "authorids": "~Riccardo_Valperga1;~Samuele_Papa1;~David_W._Romero1;~Miltiadis_Kofinas2;~Jan-jakob_Sonke1;~Efstratios_Gavves1", "gender": "M;M;M;M;;M", "homepage": ";https://samuelepapa.github.io/;https://davidwromero.xyz/;https://mkofinas.github.io;;https://www.egavves.com", "dblp": ";296/3702;254/1396;305/0160;20/4093;03/8693", "google_scholar": "IK64D1wAAAAJ;;7tdzmVoAAAAJ;Ur5BV8MAAAAJ;https://scholar.google.com/citations?hl=nl;https://scholar.google.nl/citations?user=QqfCvsgAAAAJ", "orcid": ";;;0000-0002-3392-4037;0000-0001-5155-5274;", "linkedin": ";samuelepapa/;david-w-romero-05893567/;miltiadiskofinas/;;", "or_profile": "~Riccardo_Valperga1;~Samuele_Papa1;~David_W._Romero1;~Miltiadis_Kofinas2;~Jan-jakob_Sonke1;~Efstratios_Gavves1", "aff": "University of Amsterdam;NXAI;NVIDIA;University of Amsterdam;University of Amsterdam;University of Amsterdam", "aff_domain": "uva.nl;nx-ai.com;nvidia.com;uva.nl;uva.nl;uva.nl", "position": "PhD student;Intern;Researcher;PhD student;Full Professor;Associate Professor", "bibtex": "@misc{\nvalperga2024contrastive,\ntitle={Contrastive Implicit Representation Learning},\nauthor={Riccardo Valperga and Samuele Papa and David W. Romero and Miltiadis Kofinas and Jan-jakob Sonke and Efstratios Gavves},\nyear={2024},\nurl={https://openreview.net/forum?id=5elND8cf8r}\n}", "github": "", "project": "", "reviewers": "QeAy;mwVc;1Uny", "site": "https://openreview.net/forum?id=5elND8cf8r", "pdf_size": 4941530, "rating": "1;3;3", "confidence": "3;3;3", "soundness": "2;3;2", "contribution": "1;1;2", "presentation": "2;3;3", "wc_summary": "43;157;54", "wc_strengths": "36;70;58", "wc_weaknesses": "688;393;160", "wc_questions": "24;191;17", "wc_review": "791;811;289", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 2.3333333333333335, 0.9428090415820634 ], "confidence_avg": [ 3.0, 0.0 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 1.3333333333333333, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 84.66666666666667, 51.344154703551425 ], "wc_strengths_avg": [ 54.666666666666664, 14.079141387961917 ], "wc_weaknesses_avg": [ 413.6666666666667, 216.04989135742593 ], "wc_questions_avg": [ 77.33333333333333, 80.42525860836396 ], "wc_review_avg": [ 630.3333333333334, 241.4971819481314 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:Ic-fr-MAHnMJ:scholar.google.com/&scioq=Contrastive+Implicit+Representation+Learning&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;1;2;0;0;0", "aff_unique_norm": "University of Amsterdam;NXAI;NVIDIA", "aff_unique_dep": ";;NVIDIA Corporation", "aff_unique_url": "https://www.uva.nl;;https://www.nvidia.com", "aff_unique_abbr": "UvA;;NVIDIA", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;2;0;0;0", "aff_country_unique": "Netherlands;;United States" }, { "title": "Contextual Bandits with Online Neural Regression", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19421", "id": "5ep85sakT3", "author_site": "Rohan Deb, Yikun Ban, Shiliang Zuo, Jingrui He, Arindam Banerjee", "tldr": 
"", "abstract": "Recent works have shown a reduction from contextual bandits to online regression under a realizability assumption (Foster and Rakhlin, 2020; Foster and Krishnamurthy, 2021). In this work, we investigate the use of neural networks for such online regression and associated Neural Contextual Bandits (NeuCBs). Using existing results for wide networks, one can readily show a ${\\mathcal{O}}(\\sqrt{T})$ regret for online regression with square loss, which via the reduction implies a ${\\mathcal{O}}(\\sqrt{K} T^{3/4})$ regret for NeuCBs. Departing from this standard approach, we first show a $\\mathcal{O}(\\log T)$ regret for online regression with almost convex losses that satisfy QG (Quadratic Growth) condition, a generalization of the PL (Polyak-\\L ojasiewicz) condition, and that have a unique minima. Although not directly applicable to wide networks since they do not have unique minima, we show that adding a suitable small random perturbation to the network predictions surprisingly makes the loss satisfy QG with unique minima. Based on such a perturbed prediction, we show a ${\\mathcal{O}}(\\log T)$ regret for online regression with both squared loss and KL loss, and subsequently convert these respectively to $\\tilde{\\mathcal{O}}(\\sqrt{KT})$ and $\\tilde{\\mathcal{O}}(\\sqrt{KL^*} + K)$ regret for NeuCB, where $L^*$ is the loss of the best policy. Separately, we also show that existing regret bounds for NeuCBs are $\\Omega(T)$ or assume i.i.d. contexts, unlike this work. Finally, our experimental results on various datasets demonstrate that our algorithms, especially the one based on KL loss, persistently outperform existing algorithms.", "keywords": "Neural Bandits;Contextual Bandits;Regret Bounds;Deep Learning;Online Regression", "primary_area": "optimization", "supplementary_material": "/attachment/367a6ec5730f985923a8518d673013750decf8f0.zip", "author": "Rohan Deb;Yikun Ban;Shiliang Zuo;Jingrui He;Arindam Banerjee", "authorids": "~Rohan_Deb1;~Yikun_Ban1;~Shiliang_Zuo1;~Jingrui_He1;~Arindam_Banerjee4", "gender": "M;;M;F;", "homepage": "https://rohandeb24.github.io/;;;https://www.hejingrui.org;https://arindam.cs.illinois.edu/", "dblp": "305/0597.html;;195/4141;34/2685;82/4807.html", "google_scholar": "DiCbL00AAAAJ;;zkP0Vs0AAAAJ;hXpZynkAAAAJ;RY7cuPAAAAAJ", "orcid": ";;;0000-0002-6429-6272;", "linkedin": "rohan-deb-273986126;;;;", "or_profile": "~Rohan_Deb1;~Yikun_Ban1;~Shiliang_Zuo1;~Jingrui_He1;~Arindam_Banerjee4", "aff": "University of Illinois, Urbana Champaign;;Department of Computer Science, University of Illinois at Urbana-Champaign;University of Illinois, Urbana Champaign;University of Illinois, Urbana Champaign", "aff_domain": "cs.illinois.edu;;cs.illinois.edu;illinois.edu;illinois.edu", "position": "PhD student;;PhD student;Full Professor;Professor", "bibtex": "@inproceedings{\ndeb2024contextual,\ntitle={Contextual Bandits with Online Neural Regression},\nauthor={Rohan Deb and Yikun Ban and Shiliang Zuo and Jingrui He and Arindam Banerjee},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=5ep85sakT3}\n}", "github": "", "project": "", "reviewers": "EQUF;eHnV;uhN1;PXpv;Gbgm", "pdf_size": 8456479, "rating": "5;5;6;6;8", "confidence": "3;3;4;4;4", "soundness": "2;3;3;3;3", "contribution": "3;2;3;3;3", "presentation": "2;2;3;3;4", "wc_summary": "77;77;62;71;164", "wc_strengths": "23;45;28;44;101", "wc_weaknesses": "137;87;9;272;14", "wc_questions": "41;3;64;2;27", "wc_review": 
"278;212;163;389;306", "wc_reply_reviewers": "0;170;0;0;17", "wc_reply_authors": "990;1693;715;1175;159", "reply_reviewers": "0;2;0;0;1", "reply_authors": "3;4;2;3;2", "rating_avg": [ 6.0, 1.0954451150103321 ], "confidence_avg": [ 3.6, 0.4898979485566356 ], "soundness_avg": [ 2.8, 0.39999999999999997 ], "contribution_avg": [ 2.8, 0.39999999999999997 ], "presentation_avg": [ 2.8, 0.7483314773547882 ], "wc_summary_avg": [ 90.2, 37.306299736103554 ], "wc_strengths_avg": [ 48.2, 27.780568748677556 ], "wc_weaknesses_avg": [ 103.8, 96.6714021828586 ], "wc_questions_avg": [ 27.4, 23.51680250374187 ], "wc_review_avg": [ 269.6, 77.88863845260103 ], "wc_reply_reviewers_avg": [ 37.4, 66.62612100370244 ], "wc_reply_authors_avg": [ 946.4, 506.9743977756668 ], "reply_reviewers_avg": [ 0.6, 0.7999999999999999 ], "reply_authors_avg": [ 2.8, 0.7483314773547882 ], "replies_avg": [ 25, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.74535599249993, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=786987570628450731&as_sdt=5,34&sciodt=0,34&hl=en", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=5ep85sakT3", "pdf": "https://openreview.net/pdf?id=5ep85sakT3", "email": "cs.illinois.edu;;cs.illinois.edu;illinois.edu;illinois.edu", "author_num": 5, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "University of Illinois Urbana-Champaign", "aff_unique_dep": "", "aff_unique_url": "https://illinois.edu", "aff_unique_abbr": "UIUC", "aff_campus_unique_index": "0;0;0;0", "aff_campus_unique": "Urbana-Champaign", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "title": "MiniLLM: Knowledge Distillation of Large Language Models", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19420", "id": "5h0qf7IBZZ", "author_site": "Yuxian Gu, Li Dong, Furu Wei, Minlie Huang", "tldr": "", "abstract": "Knowledge Distillation (KD) is a promising technique for reducing the high computational demand of large language models (LLMs). However, previous KD methods are primarily applied to white-box classification models or training small models to imitate black-box model APIs like ChatGPT. How to effectively distill the knowledge of white-box LLMs into small models is still under-explored, which becomes more important with the prosperity of open-source LLMs. In this work, we propose a KD approach that distills LLMs into smaller language models. We first replace the forward Kullback-Leibler divergence (KLD) objective in the standard KD approaches with reverse KLD, which is more suitable for KD on generative language models, to prevent the student model from overestimating the low-probability regions of the teacher distribution. Then, we derive an effective optimization approach to learn this objective. The student models are named MiniLLM. Extensive experiments in the instruction-following setting show that MiniLLM generates more precise responses with higher overall quality, lower exposure bias, better calibration, and higher long-text generation performance than the baselines. Our method is scalable for different model families\nwith 120M to 13B parameters. 
Our code, data, and model checkpoints can be found in https://github.com/microsoft/LMOps/tree/main/minillm.", "keywords": "Large Lanauge Models;Knowledge Distillation", "primary_area": "generative models", "supplementary_material": "/attachment/f056cb3654f515b1064a30e3360bbe5a89526f27.zip", "author": "Yuxian Gu;Li Dong;Furu Wei;Minlie Huang", "authorids": "~Yuxian_Gu1;~Li_Dong1;~Furu_Wei1;~Minlie_Huang1", "gender": "M;M;M;M", "homepage": "https://t1101675.github.io/;http://dong.li;https://www.microsoft.com/en-us/research/people/fuwei/;http://coai.cs.tsinghua.edu.cn/hml", "dblp": ";85/5090-4;72/5870;", "google_scholar": "zF9dr1sAAAAJ;wEfQgPgAAAAJ;G-V1VpwAAAAJ;https://scholar.google.com/citations?hl=zh-CN", "orcid": ";;;", "linkedin": ";;;", "or_profile": "~Yuxian_Gu1;~Li_Dong1;~Furu_Wei1;~Minlie_Huang1", "aff": "Tsinghua University;Microsoft Research;Microsoft Research;Tsinghua University", "aff_domain": "tsinghua.edu.cn;microsoft.com;microsoft.com;tsinghua.edu.cn", "position": "PhD student;Principal Researcher;Distinguished Scientist;Full Professor", "bibtex": "@inproceedings{\ngu2024minillm,\ntitle={Mini{LLM}: Knowledge Distillation of Large Language Models},\nauthor={Yuxian Gu and Li Dong and Furu Wei and Minlie Huang},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=5h0qf7IBZZ}\n}", "github": "", "project": "", "reviewers": "HmVQ;oknc;v2PG;BHa2", "pdf_size": 672880, "rating": "5;6;6;8", "confidence": "3;4;4;5", "soundness": "3;2;3;4", "contribution": "2;2;3;4", "presentation": "4;3;3;4", "wc_summary": "117;119;52;190", "wc_strengths": "251;129;49;97", "wc_weaknesses": "618;233;117;160", "wc_questions": "123;60;2;383", "wc_review": "1109;541;220;830", "wc_reply_reviewers": "410;347;0;200", "wc_reply_authors": "1973;541;411;1100", "reply_reviewers": "2;2;0;1", "reply_authors": "4;2;1;2", "rating_avg": [ 6.25, 1.0897247358851685 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 2.75, 0.82915619758885 ], "presentation_avg": [ 3.5, 0.5 ], "wc_summary_avg": [ 119.5, 48.81854155953453 ], "wc_strengths_avg": [ 131.5, 74.63745708422816 ], "wc_weaknesses_avg": [ 282.0, 198.37212505793246 ], "wc_questions_avg": [ 142.0, 145.57300573938838 ], "wc_review_avg": [ 675.0, 330.6667506720323 ], "wc_reply_reviewers_avg": [ 239.25, 157.75515047059477 ], "wc_reply_authors_avg": [ 1006.25, 615.2590409737999 ], "reply_reviewers_avg": [ 1.25, 0.82915619758885 ], "reply_authors_avg": [ 2.25, 1.0897247358851685 ], "replies_avg": [ 22, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.9733285267845754, "gs_citation": 375, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5304283176625294100&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=5h0qf7IBZZ", "pdf": "https://openreview.net/pdf?id=5h0qf7IBZZ", "email": "tsinghua.edu.cn;microsoft.com;microsoft.com;tsinghua.edu.cn", "author_num": 4, "aff_unique_index": "0;1;1;0", "aff_unique_norm": "Tsinghua University;Microsoft", "aff_unique_dep": ";Microsoft Research", "aff_unique_url": "https://www.tsinghua.edu.cn;https://www.microsoft.com/en-us/research", "aff_unique_abbr": "THU;MSR", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;1;0", "aff_country_unique": "China;United States" }, { "title": "Towards Robust Offline Reinforcement Learning under Diverse Data Corruption", "status": "Spotlight", "track": 
"main", "site": "https://iclr.cc/virtual/2024/poster/19419", "id": "5hAMmCU0bK", "author_site": "Rui Yang, Han Zhong, Jiawei Xu, Amy Zhang, Chongjie Zhang, Lei Han, Tong Zhang", "tldr": "", "abstract": "Offline reinforcement learning (RL) presents a promising approach for learning reinforced policies from offline datasets without the need for costly or unsafe interactions with the environment. However, datasets collected by humans in real-world environments are often noisy and may even be maliciously corrupted, which can significantly degrade the performance of offline RL. In this work, we first investigate the performance of current offline RL algorithms under comprehensive data corruption, including states, actions, rewards, and dynamics. Our extensive experiments reveal that implicit Q-learning (IQL) demonstrates remarkable resilience to data corruption among various offline RL algorithms. Furthermore, we conduct both empirical and theoretical analyses to understand IQL's robust performance, identifying its supervised policy learning scheme as the key factor. Despite its relative robustness, IQL still suffers from heavy-tail targets of Q functions under dynamics corruption. To tackle this challenge, we draw inspiration from robust statistics to employ the Huber loss to handle the heavy-tailedness and utilize quantile estimators to balance penalization for corrupted data and learning stability. By incorporating these simple yet effective modifications into IQL, we propose a more robust offline RL approach named Robust IQL (RIQL). Extensive experiments demonstrate that RIQL exhibits highly robust performance when subjected to diverse data corruption scenarios.", "keywords": "Offline RL;robust RL;data corruption;training-time attack", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/b59d032fee8c352db24e853035e62321928542aa.pdf", "author": "Rui Yang;Han Zhong;Jiawei Xu;Amy Zhang;Chongjie Zhang;Lei Han;Tong Zhang", "authorids": "~Rui_Yang8;~Han_Zhong1;~Jiawei_Xu1;~Amy_Zhang1;~Chongjie_Zhang1;~Lei_Han1;~Tong_Zhang2", "gender": "M;;M;;M;M;F", "homepage": "https://yangrui2015.github.io;https://hanzhong-ml.github.io/;https://github.com/jiawei415;;https://www.leihan.org;http://tongzhang-ml.org;", "dblp": "92/1942-10;137/8096.html;;29/6693;75/2307-1;07/4227-1;43/2754", "google_scholar": "QHSUy3MAAAAJ;Bk5q_pAAAAAJ;;LjxqXycAAAAJ;Tz4_zi8AAAAJ;LurWtuYAAAAJ;", "orcid": "0000-0003-3525-1726;;;;;0000-0002-5511-2558;", "linkedin": ";;;;;;", "or_profile": "~Rui_Yang8;~Han_Zhong1;~Jiawei_Xu1;~Chongjie_Zhang1;~Lei_Han1;~Tong_Zhang2;~Amy_Zhang2", "aff": "Hong Kong University of Science and Technology;Peking University;CUHK(SZ);Washington University, Saint Louis;Tencent Robotics X;UIUC;Meta Facebook", "aff_domain": "ust.hk;stu.pku.edu.cn;link.cuhk.edu.cn;wustl.edu;tencent.com;illinois.edu;facebook.com", "position": "PhD student;PhD student;PhD student;Associate Professor;Principal Researcher;Full Professor;Research Scientist", "bibtex": "@inproceedings{\nyang2024towards,\ntitle={Towards Robust Offline Reinforcement Learning under Diverse Data Corruption},\nauthor={Rui Yang and Han Zhong and Jiawei Xu and Amy Zhang and Chongjie Zhang and Lei Han and Tong Zhang},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=5hAMmCU0bK}\n}", "github": "", "project": "", "reviewers": "dDco;41NY;wKTe;t4o4", "pdf_size": 3305431, "rating": "6;6;8;8", "confidence": "4;4;5;3", "soundness": "3;3;3;3", "contribution": 
"3;2;3;3", "presentation": "4;3;3;3", "wc_summary": "98;90;84;136", "wc_strengths": "91;49;274;38", "wc_weaknesses": "322;104;185;14", "wc_questions": "69;33;36;81", "wc_review": "580;276;579;269", "wc_reply_reviewers": "309;23;0;12", "wc_reply_authors": "2517;753;750;681", "reply_reviewers": "2;1;0;1", "reply_authors": "5;1;1;1", "rating_avg": [ 7.0, 1.0 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 102.0, 20.248456731316587 ], "wc_strengths_avg": [ 113.0, 95.03420436874295 ], "wc_weaknesses_avg": [ 156.25, 113.20860170499414 ], "wc_questions_avg": [ 54.75, 20.716840975399702 ], "wc_review_avg": [ 426.0, 153.52035695633333 ], "wc_reply_reviewers_avg": [ 86.0, 129.00581382247856 ], "wc_reply_authors_avg": [ 1175.25, 775.1949351614728 ], "reply_reviewers_avg": [ 1.0, 0.7071067811865476 ], "reply_authors_avg": [ 2.0, 1.7320508075688772 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 14, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=9291883893276173496&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=5hAMmCU0bK", "pdf": "https://openreview.net/pdf?id=5hAMmCU0bK", "email": "ust.hk;stu.pku.edu.cn;link.cuhk.edu.cn;wustl.edu;tencent.com;illinois.edu;facebook.com", "author_num": 7, "aff_unique_index": "0;1;2;3;4;5;6", "aff_unique_norm": "Hong Kong University of Science and Technology;Peking University;Chinese University of Hong Kong, Shenzhen;Washington University in St. Louis;Tencent;University of Illinois Urbana-Champaign;Meta", "aff_unique_dep": ";;;;Tencent Robotics X;;Meta Platforms, Inc.", "aff_unique_url": "https://www.ust.hk;http://www.pku.edu.cn;https://www.cuhk.edu.cn/sz;https://wustl.edu;https://www.tencent.com;https://www illinois.edu;https://meta.com", "aff_unique_abbr": "HKUST;Peking U;CUHK(SZ);WUSTL;Tencent Robotics X;UIUC;Meta", "aff_campus_unique_index": "0;2;3;4", "aff_campus_unique": "Hong Kong SAR;;Shenzhen;Saint Louis;Urbana-Champaign", "aff_country_unique_index": "0;0;0;1;0;1;1", "aff_country_unique": "China;United States" }, { "title": "INViTE: INterpret and Control Vision-Language Models with Text Explanations", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19418", "id": "5iENGLEJKG", "author_site": "Haozhe Chen, Junfeng Yang, Carl Vondrick, Chengzhi Mao", "tldr": "", "abstract": "Large-scale pre-trained vision foundation models, such as CLIP, have become de facto backbones for various vision tasks. However, due to their black-box nature, understanding the underlying rules behind these models\u2019 predictions and controlling model behaviors have remained open challenges. We present INViTE: a framework for INterpreting Vision Transformer\u2019s latent tokens with Text Explanations. Given a latent token, INViTE retains its semantic information to the final layer using transformer\u2019s local operations and retrieves the closest text for explanation. INViTE enables understanding of model visual reasoning procedure without needing additional model training or data collection. Based on the obtained interpretations, INViTE allows for model editing that controls model reasoning behaviors and improves model robustness against biases and spurious correlations. 
Our code is available at https://github.com/tonychenxyz/vit-interpret.", "keywords": "Interpretation; Transformer", "primary_area": "visualization or interpretation of learned representations", "supplementary_material": "", "author": "Haozhe Chen;Junfeng Yang;Carl Vondrick;Chengzhi Mao", "authorids": "~Haozhe_Chen2;~Junfeng_Yang1;~Carl_Vondrick2;~Chengzhi_Mao2", "gender": "M;M;M;M", "homepage": ";https://www.cs.columbia.edu/~junfeng/;http://www.cs.columbia.edu/~vondrick/;http://www.cs.columbia.edu/~mcz/", "dblp": ";71/3724.html;26/8610;", "google_scholar": ";JJ9AvbAAAAAJ;3MzhkFIAAAAJ;pTTEiHUAAAAJ", "orcid": ";0009-0000-2277-6545;;", "linkedin": "haozhe-chen/;;;", "or_profile": "~Haozhe_Chen2;~Junfeng_Yang1;~Carl_Vondrick2;~Chengzhi_Mao2", "aff": "Columbia University;Columbia University;Columbia University;Mila - Quebec Artificial Intelligence Institute", "aff_domain": "columbia.edu;columbia.edu;columbia.edu;mila.quebec", "position": "Undergrad student;Associate Professor;Associate Professor;Assistant Professor", "bibtex": "@inproceedings{\nchen2024invite,\ntitle={{INV}i{TE}: {IN}terpret and Control Vision-Language Models with Text Explanations},\nauthor={Haozhe Chen and Junfeng Yang and Carl Vondrick and Chengzhi Mao},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=5iENGLEJKG}\n}", "github": "", "project": "", "reviewers": "jxBW;ZFTq;aYwS;jZ36", "pdf_size": 4058511, "rating": "3;5;5;8", "confidence": "3;4;4;4", "soundness": "2;3;3;2", "contribution": "2;2;2;3", "presentation": "3;3;2;4", "wc_summary": "68;86;102;88", "wc_strengths": "55;53;67;91", "wc_weaknesses": "220;39;221;154", "wc_questions": "23;60;2;19", "wc_review": "366;238;392;352", "wc_reply_reviewers": "0;22;0;0", "wc_reply_authors": "1081;1240;998;1328", "reply_reviewers": "0;1;0;0", "reply_authors": "3;3;3;3", "rating_avg": [ 5.25, 1.7853571071357126 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 86.0, 12.083045973594572 ], "wc_strengths_avg": [ 66.5, 15.124483462254174 ], "wc_weaknesses_avg": [ 158.5, 74.1434420565973 ], "wc_questions_avg": [ 26.0, 21.15419580130618 ], "wc_review_avg": [ 337.0, 58.93216439263028 ], "wc_reply_reviewers_avg": [ 5.5, 9.526279441628825 ], "wc_reply_authors_avg": [ 1161.75, 129.51520181044387 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 3.0, 0.0 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.7276068751089989, "gs_citation": 5, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=7823960357726140750&as_sdt=40005&sciodt=0,10&hl=en", "gs_version_total": 2, "openreview": "https://openreview.net/forum?id=5iENGLEJKG", "pdf": "https://openreview.net/pdf?id=5iENGLEJKG", "email": "columbia.edu;columbia.edu;columbia.edu;mila.quebec", "author_num": 4, "aff_unique_index": "0;0;0;1", "aff_unique_norm": "Columbia University;Quebec Artificial Intelligence Institute", "aff_unique_dep": ";Artificial Intelligence", "aff_unique_url": "https://www.columbia.edu;https://mila.quebec", "aff_unique_abbr": "Columbia;Mila", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;1", "aff_country_unique": "United States;Canada" }, { "id": "5j6wtOO6Fk", "title": "Hieros: Hierarchical Imagination on Structured State Space Sequence World Models", "track": "main", "status": 
"Reject", "tldr": "", "abstract": "One of the biggest challenges to modern deep reinforcement learning (DRL) algorithms is sample efficiency. Many approaches learn a world model in order to train an agent entirely in imagination, eliminating the need for direct environment interaction during training. However, these methods often suffer from either a lack of imagination accuracy, exploration capabilities, or runtime efficiency. We propose HIEROS, a hierarchical policy that learns time abstracted world representations and imagines trajectories at multiple time scales in latent space. HIEROS uses an S5 layer-based world model, which predicts next world states in parallel during training and iteratively during environment interaction. Due to the special properties of S5 layers, our method can train in parallel and predict next world states iteratively during imagination. This allows for more efficient training than RNN-based world models and more efficient imagination than Transformer-based world models. We show that our approach outperforms the state of the art in terms of mean and median normalized human score on the Atari 100k benchmark, and that our proposed world model is able to predict complex dynamics very accurately. We also show that HIEROS displays superior exploration capabilities compared to existing approaches.", "keywords": "Reinforcement Learning;Hierarchical Models;Deep Learning;Structured State Space Model", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/75980abe34c0f43e2c8ffcd073f836bed822aed4.zip", "author": "Paul Mattes;Rainer Schlosser;Ralf Herbrich", "authorids": "~Paul_Mattes1;~Rainer_Schlosser1;~Ralf_Herbrich1", "gender": "M;;M", "homepage": "https://github.com/Snagnar;https://hpi.de/herbrich/people/postdocs/dr-rainer-schlosser.html;https://herbrich.me", "dblp": ";129/4931;h/RalfHerbrich", "google_scholar": ";https://scholar.google.de/citations?user=A5TrKKcAAAAJ;RuvHkikAAAAJ", "orcid": ";0000-0002-6627-4026;", "linkedin": "paul-mattes-1a3455228/;;ralf-herbrich-28a8324/", "or_profile": "~Paul_Mattes1;~Rainer_Schlosser1;~Ralf_Herbrich1", "aff": ";Hasso Plattner Institute;Hasso Plattner Institute", "aff_domain": ";hpi.de;hpi.de", "position": ";Researcher;Full Professor", "bibtex": "@misc{\nmattes2024hieros,\ntitle={Hieros: Hierarchical Imagination on Structured State Space Sequence World Models},\nauthor={Paul Mattes and Rainer Schlosser and Ralf Herbrich},\nyear={2024},\nurl={https://openreview.net/forum?id=5j6wtOO6Fk}\n}", "github": "", "project": "", "reviewers": "UXtg;EjYN;5ii1", "site": "https://openreview.net/forum?id=5j6wtOO6Fk", "pdf_size": 5414859, "rating": "3;3;8", "confidence": "4;3;4", "soundness": "2;2;4", "contribution": "2;3;3", "presentation": "3;1;4", "wc_summary": "71;140;99", "wc_strengths": "29;156;102", "wc_weaknesses": "266;947;248", "wc_questions": "236;388;25", "wc_review": "602;1631;474", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "342;833;241", "reply_reviewers": "0;0;0", "reply_authors": "1;1;1", "rating_avg": [ 4.666666666666667, 2.357022603955158 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.9428090415820634 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 1.247219128924647 ], "wc_summary_avg": [ 103.33333333333333, 28.335294049804546 ], "wc_strengths_avg": [ 95.66666666666667, 52.04058245467879 ], "wc_weaknesses_avg": [ 487.0, 325.3521169440887 ], "wc_questions_avg": [ 
216.33333333333334, 148.84518429861575 ], "wc_review_avg": [ 902.3333333333334, 517.8882333305345 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 472.0, 258.5742962219305 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 8, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.5000000000000001, "gs_citation": 5, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=16594461642192045397&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 9, "aff_unique_index": "0;0", "aff_unique_norm": "Hasso Plattner Institute", "aff_unique_dep": "", "aff_unique_url": "https://www.hpi.de", "aff_unique_abbr": "HPI", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "Germany" }, { "title": "Some Fundamental Aspects about Lipschitz Continuity of Neural Networks", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19417", "id": "5jWsW08zUh", "author_site": "Grigory Khromov, Sidak Pal Singh", "tldr": "", "abstract": "Lipschitz continuity is a crucial functional property of any predictive model, that naturally governs its robustness, generalisation, as well as adversarial vulnerability. Contrary to other works that focus on obtaining tighter bounds and developing different practical strategies to enforce certain Lipschitz properties, we aim to thoroughly examine and characterise the Lipschitz behaviour of Neural Networks. Thus, we carry out an empirical investigation in a range of different settings (namely, architectures, datasets, label noise, and more) by exhausting the limits of the simplest and the most general lower and upper bounds. As a highlight of this investigation, we showcase a remarkable fidelity of the lower Lipschitz bound, identify a striking Double Descent trend in both upper and lower bounds to the Lipschitz and explain the intriguing effects of label noise on function smoothness and generalisation.", "keywords": "Lipschitz continuity;Double Descent;Label Noise;Generalization", "primary_area": "learning theory", "supplementary_material": "/attachment/6f2067e3b67cea7bfa8af7bc5a39136f8a81af0d.zip", "author": "Grigory Khromov;Sidak Pal Singh", "authorids": "~Grigory_Khromov1;~Sidak_Pal_Singh1", "gender": "M;", "homepage": ";http://sidakpal.com/", "dblp": "340/7871;189/9168", "google_scholar": "https://scholar.google.com/citations?hl=en;c59mPS4AAAAJ", "orcid": ";", "linkedin": "gkhromov/;", "or_profile": "~Grigory_Khromov1;~Sidak_Pal_Singh1", "aff": ";Max Planck Institute for Intelligent Systems", "aff_domain": ";tuebingen.mpg.de", "position": ";PhD student", "bibtex": "@inproceedings{\nkhromov2024some,\ntitle={Some Fundamental Aspects about Lipschitz Continuity of Neural Networks},\nauthor={Grigory Khromov and Sidak Pal Singh},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=5jWsW08zUh}\n}", "github": "", "project": "", "reviewers": "Sk7T;EeTb;Jyw9;F3fH", "pdf_size": 5628959, "rating": "3;6;6;8", "confidence": "4;2;3;4", "soundness": "2;3;3;4", "contribution": "1;3;3;3", "presentation": "2;3;3;3", "wc_summary": "57;177;113;89", "wc_strengths": "54;21;56;92", "wc_weaknesses": "188;8;194;196", "wc_questions": "42;29;72;316", "wc_review": "341;235;435;693", "wc_reply_reviewers": "31;5;104;33", "wc_reply_authors": "1466;489;754;1457", "reply_reviewers": "1;1;1;1", "reply_authors": "3;1;2;3", "rating_avg": [ 5.75, 1.7853571071357126 ], "confidence_avg": [ 3.25, 
0.82915619758885 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 2.5, 0.8660254037844386 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 109.0, 44.0 ], "wc_strengths_avg": [ 55.75, 25.1234452255259 ], "wc_weaknesses_avg": [ 146.5, 80.01718565408308 ], "wc_questions_avg": [ 114.75, 117.23347431514601 ], "wc_review_avg": [ 426.0, 169.61426826773743 ], "wc_reply_reviewers_avg": [ 43.25, 36.772102197182036 ], "wc_reply_authors_avg": [ 1041.5, 430.33504389022283 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 2.25, 0.82915619758885 ], "replies_avg": [ 21, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.1266600992762247, "gs_citation": 12, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=13201720659336215886&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 2, "openreview": "https://openreview.net/forum?id=5jWsW08zUh", "pdf": "https://openreview.net/pdf?id=5jWsW08zUh", "email": ";tuebingen.mpg.de", "author_num": 2, "aff_unique_index": "0", "aff_unique_norm": "Max Planck Institute for Intelligent Systems", "aff_unique_dep": "Intelligent Systems", "aff_unique_url": "https://www.mpi-is.mpg.de", "aff_unique_abbr": "MPI-IS", "aff_country_unique_index": "0", "aff_country_unique": "Germany" }, { "title": "Jointly Training Large Autoregressive Multimodal Models", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19416", "id": "5jcav5RcKw", "author_site": "Emanuele Aiello, Lili Yu, Yixin Nie, Armen Aghajanyan, Barlas Oguz", "tldr": "", "abstract": "In recent years, advances in the large-scale pretraining of language and text-to-image models have revolutionized the field of machine learning. Yet, integrating these two modalities into a single, robust model capable of generating seamless multimodal outputs remains a significant challenge. To address this gap, we present the Joint Autoregressive Mixture (JAM) framework, a modular approach that systematically fuses existing text and image generation models. We also introduce a specialized, data-efficient instruction-tuning strategy, tailored for mixed-modal generation tasks. 
Our final instruct-tuned model demonstrates unparalleled performance in generating high-quality multimodal outputs and represents the first model explicitly designed for this purpose.", "keywords": "Large Multimodal Models; Joint Training; Interleaved Image-Text Generation; Autoregressive Models", "primary_area": "generative models", "supplementary_material": "", "author": "Emanuele Aiello;LILI YU;Yixin Nie;Armen Aghajanyan;Barlas Oguz", "authorids": "~Emanuele_Aiello1;~LILI_YU1;~Yixin_Nie2;~Armen_Aghajanyan1;~Barlas_Oguz1", "gender": "M;F;M;;", "homepage": ";https://scholar.google.com/citations?hl=en&user=wY932-AAAAAJ&view_op=list_works&authuser=1&sortby=pubdate;https://easonnie.github.io;;", "dblp": ";;205/2725;;https://dblp.org/pers/hd/o/Oguz:Barlas", "google_scholar": "oZlKgH4AAAAJ;https://scholar.google.com/citations?hl=en;g5QpITUAAAAJ;;iPmTQZMAAAAJ", "orcid": "0000-0001-7133-4137;;;;", "linkedin": "emanuele-aiello-765945105/;lili-yu-6771961a/;;;barlas-o%C4%9Fuz-25465050", "or_profile": "~Emanuele_Aiello1;~LILI_YU1;~Yixin_Nie2;~Armen_Aghajanyan1;~Barlas_Oguz1", "aff": "Politecnico di Torino;Meta Facebook;Meta Platforms, Inc.;;Meta", "aff_domain": "polito.it;fb.com;meta.com;;meta.com", "position": "PhD student;Researcher;Researcher;;Research Scientist", "bibtex": "@inproceedings{\naiello2024jointly,\ntitle={Jointly Training Large Autoregressive Multimodal Models},\nauthor={Emanuele Aiello and LILI YU and Yixin Nie and Armen Aghajanyan and Barlas Oguz},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=5jcav5RcKw}\n}", "github": "", "project": "", "reviewers": "Ghzd;qfqe;eaYf;jvv1", "pdf_size": 44391665, "rating": "5;5;6;6", "confidence": "3;4;3;3", "soundness": "3;2;2;4", "contribution": "2;2;4;3", "presentation": "3;2;2;3", "wc_summary": "176;20;74;38", "wc_strengths": "73;44;39;158", "wc_weaknesses": "97;344;58;157", "wc_questions": "193;36;43;47", "wc_review": "539;444;214;400", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "1075;1148;818;962", "reply_reviewers": "0;0;0;0", "reply_authors": "3;3;2;3", "rating_avg": [ 5.5, 0.5 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.82915619758885 ], "contribution_avg": [ 2.75, 0.82915619758885 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 77.0, 60.37383539249432 ], "wc_strengths_avg": [ 78.5, 47.699580710945455 ], "wc_weaknesses_avg": [ 164.0, 109.74288131810646 ], "wc_questions_avg": [ 79.75, 65.50333960951914 ], "wc_review_avg": [ 399.25, 118.16381637371062 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 1000.75, 124.59409095137698 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 2.75, 0.4330127018922193 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 33, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5901155463886075827&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=5jcav5RcKw", "pdf": "https://openreview.net/pdf?id=5jcav5RcKw", "email": "polito.it;fb.com;meta.com;;meta.com", "author_num": 5, "aff_unique_index": "0;1;1;1", "aff_unique_norm": "Politecnico di Torino;Meta", "aff_unique_dep": ";Meta Platforms, Inc.", "aff_unique_url": "https://www.polito.it;https://meta.com", "aff_unique_abbr": "Polito;Meta", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;1;1", "aff_country_unique": "Italy;United States" }, { 
"id": "5jxtlpla15", "title": "Diffusion Models for Open-Vocabulary Segmentation", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "The variety of objects in the real world is unlimited and is thus impossible to capture using models trained on a closed, pre-defined set of categories. Recently, open-vocabulary recognition has garnered significant attention, largely facilitated by advances in large-scale vision-language modelling. In this paper, we present OVDiff, a novel method that leverages the generative properties of text-to-image diffusion models for open-vocabulary segmentation. Specifically, we propose to synthesise support image sets from arbitrary textual categories, creating for each category a set of prototypes representative of both the category itself and its surrounding context (background). Our method relies solely on pre-trained components: segmentation is obtained by simply comparing a target image to the prototypes without further fine-tuning. We show that our method can be used to ground any pre-trained self-supervised feature extractor in natural language and provide explainable predictions by mapping back to regions in the support set. Our approach shows strong performance on a range of open-vocabulary segmentation benchmarks, obtaining a lead of more than 10% over prior work on PASCAL VOC.", "keywords": "computer vision;semantic segmentation;open-vocabulary segmentation", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Laurynas Karazija;Iro Laina;Andrea Vedaldi;Christian Rupprecht", "authorids": "~Laurynas_Karazija1;~Iro_Laina1;~Andrea_Vedaldi1;~Christian_Rupprecht1", "gender": "M;M;M;", "homepage": "https://karazijal.github.io;https://www.robots.ox.ac.uk/~vedaldi/;http://chrirupp.github.io;", "dblp": "206/6117;99/2825;https://dblp.uni-trier.de/pid/76/744-1;182/2070", "google_scholar": "Kyt9trwAAAAJ;bRT7t28AAAAJ;https://scholar.google.de/citations?user=IrYlproAAAAJ;n9nXAPcAAAAJ", "orcid": ";0000-0003-1374-2858;;0000-0001-8857-7709", "linkedin": "laurynas-karazija-b9591b103/;;;", "or_profile": "~Laurynas_Karazija1;~Andrea_Vedaldi1;~Christian_Rupprecht1;~Iro_Laina2", "aff": "University of Oxford;Meta;University of Oxford;University of Oxford", "aff_domain": "ox.ac.uk;meta.com;ox.ac.uk;ox.ac.uk", "position": "PhD student;Researcher;Associate Professor;Lecturer", "bibtex": "@misc{\nkarazija2024diffusion,\ntitle={Diffusion Models for Open-Vocabulary Segmentation},\nauthor={Laurynas Karazija and Iro Laina and Andrea Vedaldi and Christian Rupprecht},\nyear={2024},\nurl={https://openreview.net/forum?id=5jxtlpla15}\n}", "github": "", "project": "", "reviewers": "PKyW;zXW9;FmYQ;kQ2p", "site": "https://openreview.net/forum?id=5jxtlpla15", "pdf_size": 3544489, "rating": "3;5;6;6", "confidence": "4;3;5;3", "soundness": "2;3;3;3", "contribution": "2;2;3;3", "presentation": "2;3;3;3", "wc_summary": "28;143;38;45", "wc_strengths": "21;48;50;41", "wc_weaknesses": "246;167;88;119", "wc_questions": "5;68;3;19", "wc_review": "300;426;179;224", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "891;804;385;951", "reply_reviewers": "0;0;0;0", "reply_authors": "2;2;1;2", "rating_avg": [ 5.0, 1.224744871391589 ], "confidence_avg": [ 3.75, 0.82915619758885 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 63.5, 46.295248136282844 ], "wc_strengths_avg": [ 40.0, 11.467344941179714 ], 
"wc_weaknesses_avg": [ 155.0, 59.602852280742404 ], "wc_questions_avg": [ 23.75, 26.280934153869037 ], "wc_review_avg": [ 282.25, 93.58518846484202 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 757.75, 221.46260971098485 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.75, 0.4330127018922193 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 8, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6050314759315356107&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 13, "aff_unique_index": "0;1;0;0", "aff_unique_norm": "University of Oxford;Meta", "aff_unique_dep": ";Meta Platforms, Inc.", "aff_unique_url": "https://www.ox.ac.uk;https://meta.com", "aff_unique_abbr": "Oxford;Meta", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;0;0", "aff_country_unique": "United Kingdom;United States" }, { "title": "Time-Efficient Reinforcement Learning with Stochastic Stateful Policies", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19415", "id": "5liV2xUdJL", "author_site": "Firas Al-Hafez, Guoping Zhao, Jan Peters, Davide Tateo", "tldr": "", "abstract": "Stateful policies play an important role in reinforcement learning, such as handling partially observable environments, enhancing robustness, or imposing an inductive bias directly into the policy structure. The conventional method for training stateful policies is Backpropagation Through Time (BPTT), which comes with significant drawbacks, such as slow training due to sequential gradient propagation and the occurrence of vanishing or exploding gradients. The gradient is often truncated to address these issues, resulting in a biased policy update. We present a novel approach for training stateful policies by decomposing the latter into a stochastic internal state kernel and a stateless policy, jointly optimized by following the stateful policy gradient. We introduce different versions of the stateful policy gradient theorem, enabling us to easily instantiate stateful variants of popular reinforcement learning and imitation learning algorithms. Furthermore, we provide a theoretical analysis of our new gradient estimator and compare it with BPTT. We evaluate our approach on complex continuous control tasks, e.g. 
humanoid locomotion, and demonstrate that our gradient estimator scales effectively with task complexity while offering a faster and simpler alternative to BPTT.", "keywords": "reinforcement learning;recurrent neural networks;stateful policies;backpropagation through time;imitation learning", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Firas Al-Hafez;Guoping Zhao;Jan Peters;Davide Tateo", "authorids": "~Firas_Al-Hafez1;~Guoping_Zhao1;~Jan_Peters3;~Davide_Tateo2", "gender": "M;M;M;M", "homepage": "https://firasalhafez.com/;;https://www.jan-peters.net;https://www.ias.informatik.tu-darmstadt.de/Team/DavideTateo", "dblp": ";;p/JanPeters1;214/0808", "google_scholar": "https://scholar.google.com/citations?hl=en;;https://scholar.google.de/citations?user=-kIVAcAAAAAJ;https://scholar.google.it/citations?user=LGnu3SEAAAAJ", "orcid": ";0000-0002-1908-5388;0000-0002-5266-8091;0000-0002-7193-923X", "linkedin": ";;janrpeters/;", "or_profile": "~Firas_Al-Hafez1;~Guoping_Zhao1;~Jan_Peters3;~Davide_Tateo2", "aff": "Technische Universit\u00e4t Darmstadt;Southeast University;TU Darmstadt;Technische Universit\u00e4t Darmstadt", "aff_domain": "tu-darmstadt.de;seu.edu.cn;tu-darmstadt.de;tu-darmstadt.de", "position": "PhD student;Associate Professor;Full Professor;Researcher", "bibtex": "@inproceedings{\nal-hafez2024timeefficient,\ntitle={Time-Efficient Reinforcement Learning with Stochastic Stateful Policies},\nauthor={Firas Al-Hafez and Guoping Zhao and Jan Peters and Davide Tateo},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=5liV2xUdJL}\n}", "github": "", "project": "", "reviewers": "gHcm;wQTz;HaqJ", "pdf_size": 8449457, "rating": "5;6;8", "confidence": "3;4;4", "soundness": "3;3;4", "contribution": "2;3;3", "presentation": "3;1;4", "wc_summary": "195;93;115", "wc_strengths": "65;348;91", "wc_weaknesses": "313;243;130", "wc_questions": "3;231;72", "wc_review": "576;915;408", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "1306;1138;685", "reply_reviewers": "0;0;0", "reply_authors": "2;2;2", "rating_avg": [ 6.333333333333333, 1.247219128924647 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 3.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 1.247219128924647 ], "wc_summary_avg": [ 134.33333333333334, 43.827946437049604 ], "wc_strengths_avg": [ 168.0, 127.72105020969201 ], "wc_weaknesses_avg": [ 228.66666666666666, 75.39378105800387 ], "wc_questions_avg": [ 102.0, 95.46727187890099 ], "wc_review_avg": [ 633.0, 210.86962796951104 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 1043.0, 262.27085236449744 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 2.0, 0.0 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.7559289460184545, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=1548611879883268075&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=5liV2xUdJL", "pdf": "https://openreview.net/pdf?id=5liV2xUdJL", "email": "tu-darmstadt.de;seu.edu.cn;tu-darmstadt.de;tu-darmstadt.de", "author_num": 4, "aff_unique_index": "0;1;0;0", "aff_unique_norm": "Technische Universit\u00e4t Darmstadt;Southeast University", "aff_unique_dep": ";", "aff_unique_url": "https://www.tu-darmstadt.de;https://www.seu.edu.cn/", "aff_unique_abbr": 
"TUD;SEU", "aff_campus_unique_index": "1", "aff_campus_unique": ";Darmstadt", "aff_country_unique_index": "0;1;0;0", "aff_country_unique": "Germany;China" }, { "id": "5mtwoRNzjm", "title": "Optimization without retraction on the random generalized Stiefel manifold for canonical correlation analysis", "track": "main", "status": "Reject", "tldr": "", "abstract": "Optimization over the set of matrices that satisfy $X^\\top B X = I_p$, referred to as the generalized Stiefel manifold, appears in many applications such as canonical correlation analysis (CCA) and the generalized eigenvalue problem. Solving these problems for large-scale datasets is computationally expensive and is typically done by either computing the closed-form solution with subsampled data or by iterative methods such as Riemannian approaches. Building on the work of Ablin \\& Peyr\u00e9 (2022), we propose an inexpensive iterative method that does not enforce the constraint in every iteration exactly, but instead it produces iterations that converge to the generalized Stiefel manifold. We also tackle the random case, where the matrix $B$ is an expectation. Our method requires only efficient matrix multiplications, and has the same sublinear convergence rate as its Riemannian counterpart. Experiments demonstrate its effectiveness in various machine learning applications involving generalized orthogonality constraints, including CCA for measuring model representation similarity.", "keywords": "Canonical correlation analysis;generalized eigenvalue problem;optimization on manifolds;streaming CCA", "primary_area": "optimization", "supplementary_material": "/attachment/7cbb0595a5fa111ba476edf6d81ebb05b4510932.pdf", "author": "Simon Vary;Pierre Ablin;Bin Gao;Pierre-Antoine Absil", "authorids": "~Simon_Vary1;~Pierre_Ablin2;gaobin@lsec.cc.ac.cn;~Pierre-Antoine_Absil1", "gender": "M;M;;", "homepage": "https://simonvary.github.io;https://pierreablin.com/;;https://sites.uclouvain.be/absil/", "dblp": "230/4630;174/0980.html;;08/1880", "google_scholar": "V6OqU-cAAAAJ;1ZsunaYAAAAJ;;", "orcid": ";;;", "linkedin": ";;;", "or_profile": "~Simon_Vary1;~Pierre_Ablin2;gaobin@lsec.cc.ac.cn;~Pierre-Antoine_Absil1", "aff": "University of Oxford;Apple;;UCLouvain", "aff_domain": "stats.ox.ac.uk;apple.com;;uclouvain.be", "position": "Postdoc;Researcher;;Full Professor", "bibtex": "@misc{\nvary2024optimization,\ntitle={Optimization without retraction on the random generalized Stiefel manifold for canonical correlation analysis},\nauthor={Simon Vary and Pierre Ablin and Bin Gao and Pierre-Antoine Absil},\nyear={2024},\nurl={https://openreview.net/forum?id=5mtwoRNzjm}\n}", "github": "", "project": "", "reviewers": "44jd;dA73;1p92;6Nz4", "site": "https://openreview.net/forum?id=5mtwoRNzjm", "pdf_size": 1440442, "rating": "5;5;6;10", "confidence": "3;3;4;4", "soundness": "2;3;3;4", "contribution": "2;3;3;4", "presentation": "3;2;3;4", "wc_summary": "94;66;142;56", "wc_strengths": "58;24;37;53", "wc_weaknesses": "227;137;62;40", "wc_questions": "36;116;144;24", "wc_review": "415;343;385;173", "wc_reply_reviewers": "0;126;35;14", "wc_reply_authors": "1533;1588;1152;75", "reply_reviewers": "0;1;1;1", "reply_authors": "3;3;2;1", "rating_avg": [ 6.5, 2.0615528128088303 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 3.0, 0.7071067811865476 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 89.5, 33.35790760824186 ], "wc_strengths_avg": [ 43.0, 13.435028842544403 ], "wc_weaknesses_avg": [ 
116.5, 73.23421331590858 ], "wc_questions_avg": [ 80.0, 51.146847410177685 ], "wc_review_avg": [ 329.0, 93.6269192059634 ], "wc_reply_reviewers_avg": [ 43.75, 49.09366048686938 ], "wc_reply_authors_avg": [ 1087.0, 607.9239261618184 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 2.25, 0.82915619758885 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.7276068751089989, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:3SLRpxMdePsJ:scholar.google.com/&scioq=Optimization+without+retraction+on+the+random+generalized+Stiefel+manifold+for+canonical+correlation+analysis&hl=en&as_sdt=0,14", "gs_version_total": 0, "aff_unique_index": "0;1;2", "aff_unique_norm": "University of Oxford;Apple;Universit\u00e9 catholique de Louvain", "aff_unique_dep": ";Apple Inc.;", "aff_unique_url": "https://www.ox.ac.uk;https://www.apple.com;https://www.uclouvain.be", "aff_unique_abbr": "Oxford;Apple;UCL", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;2", "aff_country_unique": "United Kingdom;United States;Belgium" }, { "id": "5nEmi3YIz4", "title": "ProtoNMF: Turning a Black Box into a Prototype Based Interpretable Model via Non-negative Matrix Factorization", "track": "main", "status": "Reject", "tldr": "", "abstract": "Models using parts of images as prototypes for interpretable image classification are receiving increasing attention due to their ability to provide a transparent reasoning process in a \"this looks like that\" manner. However, existing models are typically constructed by incorporating an additional prototype layer before the final classification head, which often involves complex multi-stage training procedures and intricate loss designs while under-performing their black box counterparts in terms of accuracy. In order to guarantee the recognition performance, we take the first step to explore the reverse direction and investigate how to turn a trained black box model into the form of a prototype based model. To this end, we propose to leverage the Non-negative Matrix Factorization (NMF) to discover interpretable prototypes due to its capability of yielding parts based representations. Then we use these prototypes as the basis to reconstruct the trained black box's classification head via linear convex optimization for transparent reasoning. Denoting the reconstruction difference as the residual prototype, all discovered prototypes together guarantee a precise final reconstruction. To the best of our knowledge, this is the first prototype based model that guarantees the recognition performance on par with black boxes for interpretable image classification. 
We demonstrate that our simple strategy can easily turn a trained black box into a prototype based model while discovering meaningful prototypes in various benchmark datasets and networks.", "keywords": "XAI;prototype based inherently interpretable model;non-negative matrix factorization", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Andong Tan;Hao Chen", "authorids": "~Andong_Tan1;~Hao_Chen1", "gender": "M;M", "homepage": ";https://cse.hkust.edu.hk/~jhc/", "dblp": "225/7131;86/475-11", "google_scholar": "zt49vSoAAAAJ;https://scholar.google.com.hk/citations?user=Z_t5DjwAAAAJ", "orcid": ";0000-0002-8400-3780", "linkedin": ";", "or_profile": "~Andong_Tan1;~Hao_Chen1", "aff": "Hong Kong University of Science and Technology;Hong Kong University of Science and Technology", "aff_domain": "connect.ust.hk;ust.hk", "position": "PhD student;Assistant Professor", "bibtex": "@misc{\ntan2024protonmf,\ntitle={Proto{NMF}: Turning a Black Box into a Prototype Based Interpretable Model via Non-negative Matrix Factorization},\nauthor={Andong Tan and Hao Chen},\nyear={2024},\nurl={https://openreview.net/forum?id=5nEmi3YIz4}\n}", "github": "", "project": "", "reviewers": "eeCj;XoPR;A726", "site": "https://openreview.net/forum?id=5nEmi3YIz4", "pdf_size": 5367528, "rating": "3;5;5", "confidence": "2;3;3", "soundness": "2;3;2", "contribution": "2;3;2", "presentation": "2;2;2", "wc_summary": "67;85;229", "wc_strengths": "26;96;12", "wc_weaknesses": "295;221;91", "wc_questions": "9;95;50", "wc_review": "397;497;382", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "555;324;1057", "reply_reviewers": "0;0;0", "reply_authors": "1;1;2", "rating_avg": [ 4.333333333333333, 0.9428090415820634 ], "confidence_avg": [ 2.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.0, 0.0 ], "wc_summary_avg": [ 127.0, 72.49827584156743 ], "wc_strengths_avg": [ 44.666666666666664, 36.745370078721784 ], "wc_weaknesses_avg": [ 202.33333333333334, 84.32213364367757 ], "wc_questions_avg": [ 51.333333333333336, 35.122009560324926 ], "wc_review_avg": [ 425.3333333333333, 51.044642770378516 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 645.3333333333334, 305.9872909488599 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.3333333333333333, 0.4714045207910317 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.9999999999999998, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:u3WY7AfvIQsJ:scholar.google.com/&scioq=ProtoNMF:+Turning+a+Black+Box+into+a+Prototype+Based+Interpretable+Model+via+Non-negative+Matrix+Factorization&hl=en&as_sdt=0,23", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "Hong Kong University of Science and Technology", "aff_unique_dep": "", "aff_unique_url": "https://www.ust.hk", "aff_unique_abbr": "HKUST", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Hong Kong SAR", "aff_country_unique_index": "0;0", "aff_country_unique": "China" }, { "id": "5nF9rGNpi3", "title": "From Fake to Real: Pretraining on Balanced Synthetic Images to Prevent Bias", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Visual recognition models are prone to learning spurious correlations induced by a biased training set where certain conditions $B$ (\\eg, Indoors) are 
over-represented in certain classes $Y$ (\\eg, Big Dogs). Synthetic data from generative models offers a promising direction to mitigate this issue by augmenting underrepresented conditions in the real dataset. However, this introduces another potential source of bias from generative model artifacts in the synthetic data. Indeed, as we will show, prior work uses synthetic data to resolve the model's bias toward $B$, but it doesn't correct the models' bias toward the pair $(B, G)$ where $G$ denotes whether the sample is real or synthetic. Thus, the model could simply learn signals based on the pair $(B, G)$ (\\eg, Synthetic Indoors) to make predictions about $Y$ (\\eg, Big Dogs). To address this issue, we propose a two-step training pipeline that we call From Fake to Real (FFR). The first step of FFR pre-trains a model on balanced synthetic data to learn robust representations across subgroups. In the second step, FFR fine-tunes the model on real data using ERM or common loss-based bias mitigation methods. By training on real and synthetic data separately, FFR avoids the issue of bias toward signals from the pair $(B, G)$. In other words, synthetic data in the first step provides effective unbiased representations that boosts performance in the second step. Indeed, our analysis of high bias setting (99.9\\%) shows that FFR improves performance over the state-of-the-art by 7-14\\% over three datasets (CelebA, UTK-Face, and SpuCO Animals).", "keywords": "Spurious Correlations;Bias;Fairness", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/74343866fe9638bfdebcdf61cde24d8266488f51.zip", "author": "Maan Qraitem;Kate Saenko;Bryan A. Plummer", "authorids": "~Maan_Qraitem1;~Kate_Saenko1;~Bryan_A._Plummer1", "gender": ";F;M", "homepage": "https://cs-people.bu.edu/mqraitem/;http://ai.bu.edu;http://bryanplummer.com/", "dblp": "250/5589;88/2754;163/2330", "google_scholar": "l8r237UAAAAJ;https://scholar.google.com.tw/citations?user=9xDADY4AAAAJ;https://scholar.google.com/citations?hl=en", "orcid": ";0000-0002-5704-7614;", "linkedin": ";;", "or_profile": "~Maan_Qraitem1;~Kate_Saenko1;~Bryan_Allen_Plummer1", "aff": "Boston University;Boston University, Boston University;Boston University", "aff_domain": "bu.edu;bu.edu;bu.edu", "position": "PhD student;Full Professor;Assistant Professor", "bibtex": "@misc{\nqraitem2024from,\ntitle={From Fake to Real: Pretraining on Balanced Synthetic Images to Prevent Bias},\nauthor={Maan Qraitem and Kate Saenko and Bryan A. 
Plummer},\nyear={2024},\nurl={https://openreview.net/forum?id=5nF9rGNpi3}\n}", "github": "", "project": "", "reviewers": "EAfJ;tzaP;DngP;RuLj", "site": "https://openreview.net/forum?id=5nF9rGNpi3", "pdf_size": 3686706, "rating": "3;3;5;6", "confidence": "4;5;4;3", "soundness": "2;2;2;2", "contribution": "1;2;2;2", "presentation": "1;3;3;2", "wc_summary": "63;98;189;145", "wc_strengths": "13;87;78;98", "wc_weaknesses": "131;1362;325;517", "wc_questions": "85;56;153;14", "wc_review": "292;1603;745;774", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "505;1245;1098;768", "reply_reviewers": "0;0;0;0", "reply_authors": "1;2;2;1", "rating_avg": [ 4.25, 1.299038105676658 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 2.25, 0.82915619758885 ], "wc_summary_avg": [ 123.75, 47.59923843928598 ], "wc_strengths_avg": [ 69.0, 33.09833832687073 ], "wc_weaknesses_avg": [ 583.75, 469.59097893805415 ], "wc_questions_avg": [ 77.0, 50.62114182829147 ], "wc_review_avg": [ 853.5, 473.05522933374283 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 904.0, 287.92967891483505 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 10, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.816496580927726, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12799463189263644552&as_sdt=5,48&sciodt=0,48&hl=en", "gs_version_total": 0, "aff_unique_index": "0;0;0", "aff_unique_norm": "Boston University", "aff_unique_dep": "", "aff_unique_url": "https://www.bu.edu", "aff_unique_abbr": "BU", "aff_campus_unique_index": "1", "aff_campus_unique": ";Boston", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "title": "Linear Log-Normal Attention with Unbiased Concentration", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19414", "id": "5nM2AHzqUj", "author_site": "Yury Nahshan, Joseph Kampeas, Emir Haleva", "tldr": "", "abstract": "Transformer models have achieved remarkable results in a wide range of applications. However, their scalability is hampered by the quadratic time and memory complexity of the self-attention mechanism concerning the sequence length. This limitation poses a substantial obstacle when dealing with long documents or high-resolution images. In this work, we study the self-attention mechanism by analyzing the distribution of the attention matrix and its concentration ability. Furthermore, we propose instruments to measure these quantities and introduce a novel self-attention mechanism, Linear Log-Normal Attention, designed to emulate the distribution and concentration behavior of the original self-attention. 
Our experimental results on popular natural language benchmarks reveal that our proposed Linear Log-Normal Attention outperforms other linearized attention alternatives, offering a promising avenue for enhancing the scalability of transformer models.", "keywords": "Neural Networks;Transformers;Self-Attention;Linear Attention;Scalable Transformers;Efficient Attention;Attention with Linear Complexity;Linearized Attention;Self-Attention Analysis", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/8f60cc0ad88fd2dc4567319746c7ee3b660e005d.zip", "author": "Yury Nahshan;Joseph Kampeas;Emir Haleva", "authorids": "~Yury_Nahshan1;~Joseph_Kampeas1;~Emir_Haleva1", "gender": "M;M;", "homepage": ";;", "dblp": "228/7866;61/10966;", "google_scholar": "vdRZRhIAAAAJ;kampeas;k4ZFigYAAAAJ", "orcid": ";0000-0002-3412-6854;", "linkedin": ";;", "or_profile": "~Yury_Nahshan1;~Joseph_Kampeas1;~Emir_Haleva1", "aff": "Huawei Technologies Ltd.;Huawei Technologies Ltd.;Huawei Technologies Ltd.", "aff_domain": "huawei.com;huawei.com;huawei.com", "position": "Researcher;Researcher;Researcher", "bibtex": "@inproceedings{\nnahshan2024linear,\ntitle={Linear Log-Normal Attention with Unbiased Concentration},\nauthor={Yury Nahshan and Joseph Kampeas and Emir Haleva},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=5nM2AHzqUj}\n}", "github": "", "project": "", "reviewers": "m7qC;zqGD;aZn4;xXRJ", "pdf_size": 1415613, "rating": "5;5;6;8", "confidence": "4;4;3;3", "soundness": "3;2;3;3", "contribution": "3;2;3;3", "presentation": "3;2;3;3", "wc_summary": "29;223;49;68", "wc_strengths": "26;190;19;174", "wc_weaknesses": "66;217;35;85", "wc_questions": "2;3;2;2", "wc_review": "123;633;105;329", "wc_reply_reviewers": "0;0;10;0", "wc_reply_authors": "576;1545;392;308", "reply_reviewers": "0;0;1;0", "reply_authors": "1;3;1;1", "rating_avg": [ 6.0, 1.224744871391589 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 92.25, 76.73778404410699 ], "wc_strengths_avg": [ 102.25, 79.98867107284632 ], "wc_weaknesses_avg": [ 100.75, 69.44917206129962 ], "wc_questions_avg": [ 2.25, 0.4330127018922193 ], "wc_review_avg": [ 297.5, 212.75514094846216 ], "wc_reply_reviewers_avg": [ 2.5, 4.330127018922194 ], "wc_reply_authors_avg": [ 705.25, 494.4235911644993 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.5, 0.8660254037844386 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.8164965809277259, "gs_citation": 6, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=1876833627498889789&as_sdt=5,48&sciodt=0,48&hl=en", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=5nM2AHzqUj", "pdf": "https://openreview.net/pdf?id=5nM2AHzqUj", "email": "huawei.com;huawei.com;huawei.com", "author_num": 3, "aff_unique_index": "0;0;0", "aff_unique_norm": "Huawei", "aff_unique_dep": "Huawei Technologies", "aff_unique_url": "https://www.huawei.com", "aff_unique_abbr": "Huawei", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "China" }, { "title": "Goodhart's Law in Reinforcement Learning", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19413", "id": "5o9G4XF1LI", "author_site": "Jacek 
Karwowski, Oliver Hayman, Xingjian Bai, Klaus Kiendlhofer, Charlie Griffin, Joar Skalse", "tldr": "", "abstract": "Implementing a reward function that perfectly captures a complex task in the real world is impractical. As a result, it is often appropriate to think of the reward function as a *proxy* for the true objective rather than as its definition. We study this phenomenon through the lens of *Goodhart\u2019s law*, which predicts that increasing optimisation of an imperfect proxy beyond some critical point decreases performance on the true objective. First, we propose a way to *quantify* the magnitude of this effect and *show empirically* that optimising an imperfect proxy reward often leads to the behaviour predicted by Goodhart\u2019s law for a wide range of environments and reward functions. We then provide a *geometric explanation* for why Goodhart's law occurs in Markov decision processes. We use these theoretical insights to propose an *optimal early stopping method* that provably avoids the aforementioned pitfall and derive theoretical *regret bounds* for this method. Moreover, we derive a training method that maximises worst-case reward, for the setting where there is uncertainty about the true reward function. Finally, we evaluate our early stopping method experimentally. Our results support a foundation for a theoretically-principled study of reinforcement learning under reward misspecification.", "keywords": "reinforcement learning;goodhart's law;misspecification;reward learning", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Jacek Karwowski;Oliver Hayman;Xingjian Bai;Klaus Kiendlhofer;Charlie Griffin;Joar Max Viktor Skalse", "authorids": "~Jacek_Karwowski1;~Oliver_Hayman1;~Xingjian_Bai1;~Klaus_Kiendlhofer1;~Charlie_Griffin1;~Joar_Max_Viktor_Skalse1", "gender": "M;M;M;M;;M", "homepage": ";https://www.linkedin.com/in/oliver-hayman-2b61b31b7/;https://xingjianbai.com/;;;", "dblp": "304/2081;;188/9534;;;242/8125", "google_scholar": ";;;;;GuzLUmQAAAAJ", "orcid": "0000-0002-8361-2912;;;;;", "linkedin": ";oliver-hayman-2b61b31b7/;;klaus-kiendlhofer-5a27291bb/;;", "or_profile": "~Jacek_Karwowski1;~Oliver_Hayman1;~Xingjian_Bai1;~Klaus_Kiendlhofer1;~Charlie_Griffin1;~Joar_Max_Viktor_Skalse1", "aff": "University of Oxford;University of Oxford;University of Oxford;OxAI Safety Hub;;University of Oxford", "aff_domain": "ox.ac.uk;ox.ac.uk;ox.ac.uk;aisafetyhub.org;;ox.ac.uk", "position": "PhD student;Undergrad student;Undergrad student;Researcher;;PhD student", "bibtex": "@inproceedings{\nkarwowski2024goodharts,\ntitle={Goodhart's Law in Reinforcement Learning},\nauthor={Jacek Karwowski and Oliver Hayman and Xingjian Bai and Klaus Kiendlhofer and Charlie Griffin and Joar Max Viktor Skalse},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=5o9G4XF1LI}\n}", "github": "", "project": "", "reviewers": "Y2A1;eHjA;YkV9;MUg9", "pdf_size": 2697174, "rating": "5;6;6;8", "confidence": "3;3;3;2", "soundness": "3;4;3;3", "contribution": "2;3;3;3", "presentation": "3;4;3;3", "wc_summary": "108;115;99;77", "wc_strengths": "91;101;66;157", "wc_weaknesses": "360;144;438;108", "wc_questions": "31;1;4;76", "wc_review": "590;361;607;418", "wc_reply_reviewers": "0;0;0;84", "wc_reply_authors": "1211;618;1457;1121", "reply_reviewers": "0;0;0;1", "reply_authors": "2;1;2;2", "rating_avg": [ 6.25, 1.0897247358851685 ], "confidence_avg": [ 2.75, 0.4330127018922193 ], "soundness_avg": [ 3.25, 
0.4330127018922193 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 99.75, 14.306903927824496 ], "wc_strengths_avg": [ 103.75, 33.281939546847326 ], "wc_weaknesses_avg": [ 262.5, 139.83829947478623 ], "wc_questions_avg": [ 28.0, 30.074906483645133 ], "wc_review_avg": [ 494.0, 106.59502802663921 ], "wc_reply_reviewers_avg": [ 21.0, 36.373066958946424 ], "wc_reply_authors_avg": [ 1101.75, 305.1732090141597 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.75, 0.4330127018922193 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.9271726499455306, "gs_citation": 13, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=2184078619705942762&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=5o9G4XF1LI", "pdf": "https://openreview.net/pdf?id=5o9G4XF1LI", "email": "ox.ac.uk;ox.ac.uk;ox.ac.uk;aisafetyhub.org;;ox.ac.uk", "author_num": 6, "aff_unique_index": "0;0;0;0;0", "aff_unique_norm": "University of Oxford", "aff_unique_dep": "", "aff_unique_url": "https://www.ox.ac.uk", "aff_unique_abbr": "Oxford", "aff_campus_unique_index": "1", "aff_campus_unique": ";Oxford", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "United Kingdom" }, { "id": "5oJlyJXUxK", "title": "Beyond Concept Bottleneck Models: How to Make Black Boxes Intervenable?", "track": "main", "status": "Reject", "tldr": "", "abstract": "Recently, interpretable machine learning has re-explored concept bottleneck models (CBM), comprising step-by-step prediction of the high-level concepts from the raw features and the target variable from the predicted concepts. A compelling advantage of this model class is the user's ability to intervene on the predicted concept values, consequently affecting the model's downstream output. In this work, we introduce a method to perform such concept-based interventions on already-trained neural networks, which are not interpretable by design. Furthermore, we formalise the model's *intervenability* as a measure of the effectiveness of concept-based interventions and leverage this definition to fine-tune black-box models. Empirically, we explore the intervenability of black-box classifiers on synthetic tabular and natural image benchmarks. We demonstrate that fine-tuning improves intervention effectiveness and often yields better-calibrated predictions. 
To showcase the practical utility of the proposed techniques, we apply them to deep chest X-ray classifiers and show that fine-tuned black boxes can be as intervenable and more performant than CBMs.", "keywords": "interpretability;explainability;concepts;concept bottleneck models;model interventions;healthcare", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/53e866cf86a808281bedae3a80e1e88c12ba35a8.zip", "author": "Ri\u010dards Marcinkevi\u010ds;Sonia Laguna;Moritz Vandenhirtz;Julia E Vogt", "authorids": "~Ri\u010dards_Marcinkevi\u010ds1;~Sonia_Laguna1;~Moritz_Vandenhirtz1;~Julia_E_Vogt1", "gender": "F;M;F;M", "homepage": "https://mds.inf.ethz.ch/team/detail/sonia-laguna;;http://mds.inf.ethz.ch;https://rmarcinkevics.github.io/", "dblp": "313/3156;;13/8412;234/8553", "google_scholar": "PljVnCQAAAAJ;H2cG0BwAAAAJ;UoeV-8kAAAAJ;https://scholar.google.ch/citations?user=XcxXOJsAAAAJ", "orcid": "0000-0003-3504-2051;;;0000-0001-8901-5062", "linkedin": ";moritz-simon-vandenhirtz-488b0b16b/;julia-vogt-50b53895;ri%C4%8Dards-m-668568106?lipi=urn%3Ali%3Apage%3Ad_flagship3_profile_view_base_contact_details%3Byeq5%2FsReRoWG3HN7r6A5Lw%3D%3D", "or_profile": "~Sonia_Laguna1;~Moritz_Vandenhirtz1;~Julia_E_Vogt1;~Ricards_Marcinkevics1", "aff": "Department of Computer Science, ETHZ - ETH Zurich;ETHZ - ETH Zurich;Swiss Federal Institute of Technology;Swiss Federal Institute of Technology", "aff_domain": "inf.ethz.ch;ethz.ch;ethz.ch;inf.ethz.ch", "position": "PhD student;PhD student;Assistant Professor;PhD student", "bibtex": "@misc{\nmarcinkevi{\\v{c}}s2024beyond,\ntitle={Beyond Concept Bottleneck Models: How to Make Black Boxes Intervenable?},\nauthor={Ri{\\v{c}}ards Marcinkevi{\\v{c}}s and Sonia Laguna and Moritz Vandenhirtz and Julia E Vogt},\nyear={2024},\nurl={https://openreview.net/forum?id=5oJlyJXUxK}\n}", "github": "", "project": "", "reviewers": "Emzi;JHNX;icNv;39mA", "site": "https://openreview.net/forum?id=5oJlyJXUxK", "pdf_size": 12053856, "rating": "5;5;8;8", "confidence": "3;4;4;4", "soundness": "3;3;3;3", "contribution": "2;2;3;4", "presentation": "2;3;3;3", "wc_summary": "156;80;35;341", "wc_strengths": "45;14;38;66", "wc_weaknesses": "352;202;57;168", "wc_questions": "227;28;72;123", "wc_review": "780;324;202;698", "wc_reply_reviewers": "304;191;46;35", "wc_reply_authors": "2508;1994;672;1541", "reply_reviewers": "2;1;1;1", "reply_authors": "6;5;2;4", "rating_avg": [ 6.5, 1.5 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.75, 0.82915619758885 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 153.0, 116.83963368651924 ], "wc_strengths_avg": [ 40.75, 18.565761497983324 ], "wc_weaknesses_avg": [ 194.75, 105.44044527599455 ], "wc_questions_avg": [ 112.5, 74.16367035145981 ], "wc_review_avg": [ 501.0, 243.60829214129802 ], "wc_reply_reviewers_avg": [ 144.0, 111.01126069007594 ], "wc_reply_authors_avg": [ 1678.75, 674.4551041396306 ], "reply_reviewers_avg": [ 1.25, 0.4330127018922193 ], "reply_authors_avg": [ 4.25, 1.479019945774904 ], "replies_avg": [ 29, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.5773502691896258, "gs_citation": 19, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=2536299489321927736&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 9, "aff_unique_index": "0;0;1;1", "aff_unique_norm": "ETH Zurich;Swiss Federal Institute of Technology", "aff_unique_dep": "Department of Computer Science;", 
"aff_unique_url": "https://www.ethz.ch;https://www.ethz.ch", "aff_unique_abbr": "ETHZ;ETH Zurich", "aff_campus_unique_index": "0", "aff_campus_unique": "Zurich;", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "Switzerland" }, { "id": "5pKLogzjQP", "title": "Purify Perturbative Availability Poisons via Rate-Constrained Variational Autoencoders", "track": "main", "status": "Reject", "tldr": "", "abstract": "Perturbative availability poisoning attacks seek to maximize testing error by making subtle modifications to training examples that are correctly labeled.\nDefensive strategies against these attacks can be categorized based on whether specific interventions are adopted during the training phase.\nThe first approach is training-time defense, such as adversarial training, which can effectively mitigate poisoning effects but is computationally intensive.\nThe other approach is pre-training purification, *e.g.,* image short squeezing, which consists of several simple compressions but often encounters challenges in dealing with various poison types.\nOur work provides a novel disentanglement mechanism to build an efficient pre-training purification method that achieves superior performance to all existing defenses.\nFirstly, we uncover rate-constrained variational autoencoders (VAEs), demonstrating a clear tendency to suppress poison patterns by minimizing mutual information in the latent space. We subsequently conduct a theoretical analysis to offer an explanation for this phenomenon.\nBuilding upon these insights, we introduce a disentangle variational autoencoder (D-VAE), capable of disentangling the added perturbations with learnable class-wise embeddings.\nBased on this network, a two-stage purification approach is naturally developed. 
The first stage focuses on roughly suppressing poison patterns, while the second stage produces refined, poison-free results, ensuring the effectiveness and robustness across various scenarios and datasets.\nExtensive experiments demonstrate the remarkable performance of our method across CIFAR-10, CIFAR-100, and a 100-class ImageNet-subset with multiple poison types and different perturbation levels.", "keywords": "perturbative availability poisoning attack;defense;variational autoencoders", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "Yi Yu;Yufei Wang;Song Xia;Qichen Zheng;Wenhan Yang;Shijian Lu;Yap-peng Tan;Alex Kot", "authorids": "~Yi_Yu5;~Yufei_Wang5;~Song_Xia1;~Qichen_Zheng1;~Wenhan_Yang6;~Shijian_Lu1;~Yap-peng_Tan1;~Alex_Kot1", "gender": ";M;M;M;M;M;M;", "homepage": "https://github.com/yuyi-sd;https://github.com/wyf0912/;;https://github.com/QichenZheng;https://flyywh.github.io/;https://personal.ntu.edu.sg/shijian.lu/;https://personal.ntu.edu.sg/eyptan/;https://www.ntu.edu.sg/home/eackot/", "dblp": "99/111-11.html;;;285/4546;156/2359.html;42/2718;93/4472.html;", "google_scholar": "https://scholar.google.com/citations?hl=en;jLd1l_sAAAAJ;x_CkEE8AAAAJ;d6AbpzgAAAAJ;S8nAnakAAAAJ;https://scholar.google.com.sg/scholar?hl=en;https://scholar.google.com.sg/citations?user=t9EqYQIAAAAJ;", "orcid": "0000-0003-2730-9553;;0009-0002-1224-470X;;;;0000-0002-0645-9109;", "linkedin": "%E7%9B%8A-%E4%BD%99-6b453a229;;;;;;;", "or_profile": "~Yi_Yu5;~Yufei_Wang5;~Song_Xia1;~Qichen_Zheng1;~Wenhan_Yang6;~Shijian_Lu1;~Yap-peng_Tan1;~Alex_Kot1", "aff": "Nanyang Technological University;Nanyang Technological University;Nanyang Technological University;Nanyang Technological University;Peng Cheng Laboratory;Nanyang Technological University;Nanyang Technological University;Nanyang Technological University", "aff_domain": "ntu.edu.sg;ntu.edu.sg;ntu.edu.sg;ntu.edu;pcl.ac.cn;ntu.edu.sg;ntu.edu.sg;ntu.edu.sg", "position": "PhD student;PhD student;PhD student;PhD student;Researcher;Associate Professor;Full Professor;Full Professor", "bibtex": "@misc{\nyu2024purify,\ntitle={Purify Perturbative Availability Poisons via Rate-Constrained Variational Autoencoders},\nauthor={Yi Yu and Yufei Wang and Song Xia and Qichen Zheng and Wenhan Yang and Shijian Lu and Yap-peng Tan and Alex Kot},\nyear={2024},\nurl={https://openreview.net/forum?id=5pKLogzjQP}\n}", "github": "", "project": "", "reviewers": "h4wy;D3kf;kPQt;PyJm", "site": "https://openreview.net/forum?id=5pKLogzjQP", "pdf_size": 4195767, "rating": "5;5;5;6", "confidence": "2;3;2;4", "soundness": "2;2;3;3", "contribution": "2;2;3;3", "presentation": "2;1;1;3", "wc_summary": "28;114;34;63", "wc_strengths": "31;200;11;53", "wc_weaknesses": "108;912;131;306", "wc_questions": "8;103;2;106", "wc_review": "175;1329;178;528", "wc_reply_reviewers": "27;458;0;301", "wc_reply_authors": "611;4327;1109;805", "reply_reviewers": "1;2;0;3", "reply_authors": "2;9;3;3", "rating_avg": [ 5.25, 0.4330127018922193 ], "confidence_avg": [ 2.75, 0.82915619758885 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 1.75, 0.82915619758885 ], "wc_summary_avg": [ 59.75, 34.00275724114149 ], "wc_strengths_avg": [ 73.75, 74.38875923148605 ], "wc_weaknesses_avg": [ 364.25, 325.3816028911284 ], "wc_questions_avg": [ 54.75, 49.806500579743606 ], "wc_review_avg": [ 552.5, 470.7199273453377 ], "wc_reply_reviewers_avg": [ 196.5, 191.47127721932603 ], "wc_reply_authors_avg": [ 1713.0, 
1519.5953408720363 ], "reply_reviewers_avg": [ 1.5, 1.118033988749895 ], "reply_authors_avg": [ 4.25, 2.7726341266023544 ], "replies_avg": [ 30, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": 0.8703882797784891, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:DfoaPqEgb1wJ:scholar.google.com/&scioq=Purify+Perturbative+Availability+Poisons+via+Rate-Constrained+Variational+Autoencoders&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;0;0;0;1;0;0;0", "aff_unique_norm": "Nanyang Technological University;Pengcheng Laboratory", "aff_unique_dep": ";Peng Cheng Laboratory", "aff_unique_url": "https://www.ntu.edu.sg;http://www.pcl.ac.cn", "aff_unique_abbr": "NTU;PCL", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;1;0;0;0", "aff_country_unique": "Singapore;China" }, { "id": "5qxdlSyyB3", "title": "S$^6$-DAMON: Unlocking Structured Sparsity in Self-Supervised Speech Models via Data-Model Co-Compression", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Driven by the increasing demand for deploying deep neural network (DNN)-powered automatic speech recognition (ASR) systems on mobile platforms, speech models pretrained through self-supervised learning (SSL) have emerged to reduce reliance on the availability of transcribed speech data. However, this has enlarged the gap between the prohibitive model complexity and the limited resources of mobile devices. Therefore, there is a strong desire to streamline the complexity of speech SSL models for real-time acceleration on mobile platforms, which is particularly challenging as the pretrained speech representation may undergo significant degradation. To this end, we develop a framework dubbed S$^6$-DAMON to unlock structured sparsity in speech SSL models via data-model co-compression. On the data side, leveraging both the duration of each phoneme and the pauses between phonemes of human utterances, we develop a salient audio token detector, dubbed SALAD, to remove redundant input audio tokens; On the model side, we identify that the failure of SOTA ASR pruning methods under structured sparsity is caused by a sparsity discrepancy between finetuning/deployment and their limited adaptability of sparsity distributions. We address this through a new ASR pruning pipeline named SAFARI, which adopts a three-step pipeline - sparsify, finetune, and adjust sparsity. Extensive experiments validate that S$^6$-DAMON can significantly accelerate speech SSL models on mobile devices with limited transcribed speech data while maintaining decent ASR accuracy. 
All source code will be released.", "keywords": "Automated Speech Recognition;Model Compression", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Yonggan Fu;Zhifan Ye;Zhongzhi Yu;Yingyan Celine Lin", "authorids": "~Yonggan_Fu1;~Zhifan_Ye1;~Zhongzhi_Yu1;~Yingyan_Celine_Lin1", "gender": "M;M;M;F", "homepage": "https://www.yongganfu.com/;https://github.com/LemonAndRabbit;;https://eiclab.scs.gatech.edu/", "dblp": "244/8166;168/9226.html;198/8338;120/6981", "google_scholar": "https://scholar.google.com/citations?hl=en;zlPfnWEAAAAJ;KjvcaBQAAAAJ;dio8IesAAAAJ", "orcid": ";0000-0003-0755-8843;;", "linkedin": "yonggan-fu-b211831b0;zhifan-ye/;zhongzhi-yu/;yingyan-celine-lin-a281211a/", "or_profile": "~Yonggan_Fu1;~Zhifan_Ye1;~Zhongzhi_Yu1;~Yingyan_Lin1", "aff": "Georgia Institute of Technology;Georgia Institute of Technology;Nvidia Research;Georgia Institute of Technology", "aff_domain": "gatech.edu;gatech.edu;nivida.com;gatech.edu", "position": "PhD student;PhD student;Research Intern;Associate Professor", "bibtex": "@misc{\nfu2024sdamon,\ntitle={S\\${\\textasciicircum}6\\$-{DAMON}: Unlocking Structured Sparsity in Self-Supervised Speech Models via Data-Model Co-Compression},\nauthor={Yonggan Fu and Zhifan Ye and Zhongzhi Yu and Yingyan Celine Lin},\nyear={2024},\nurl={https://openreview.net/forum?id=5qxdlSyyB3}\n}", "github": "", "project": "", "reviewers": "FqdU;7VsP;NUX3;NFEu", "site": "https://openreview.net/forum?id=5qxdlSyyB3", "pdf_size": 776522, "rating": "3;3;5;5", "confidence": "5;5;3;4", "soundness": "4;2;2;2", "contribution": "3;2;3;3", "presentation": "1;2;2;3", "wc_summary": "122;27;118;102", "wc_strengths": "117;29;56;44", "wc_weaknesses": "825;155;118;268", "wc_questions": "133;4;157;50", "wc_review": "1197;215;449;464", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 4.25, 0.82915619758885 ], "soundness_avg": [ 2.5, 0.8660254037844386 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 2.0, 0.7071067811865476 ], "wc_summary_avg": [ 92.25, 38.408169703853375 ], "wc_strengths_avg": [ 61.5, 33.44024521441193 ], "wc_weaknesses_avg": [ 341.5, 284.565018932405 ], "wc_questions_avg": [ 86.0, 61.78592072632729 ], "wc_review_avg": [ 581.25, 368.9596014470961 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.9045340337332909, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:EBcqKKesHNYJ:scholar.google.com/&scioq=S%24%5E6%24-DAMON:+Unlocking+Structured+Sparsity+in+Self-Supervised+Speech+Models+via+Data-Model+Co-Compression&hl=en&as_sdt=0,30", "gs_version_total": 0, "aff_unique_index": "0;0;1;0", "aff_unique_norm": "Georgia Institute of Technology;NVIDIA", "aff_unique_dep": ";NVIDIA Research", "aff_unique_url": "https://www.gatech.edu;https://www.nvidia.com/research", "aff_unique_abbr": "Georgia Tech;NVIDIA", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "id": "5rhgOIu4Tr", "title": "BOT: Bootstrapped Optimal Transport for Multi-label Noise Learning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Multi-label learning with label noise is a practical but more challenging problem, as the 
underlying label dependency complicates the modeling from clean labels to noisy variants. Progress in this area is usually explored from the perspectives of semi-supervised learning, robust loss functions, or noise transition, which are less effective on complicated datasets or highly sensitive to transition matrix estimation. To refine the noisy labels in a general framework, we propose a simple but effective method, named Bootstrapped Optimal Transport method (BOT). Unlike the \\emph{explicit} linear transition matrix with stringent conditions, BOT considers the modeling between true labels and noisy labels as an \\emph{implicit} optimal transport procedure which has a more powerful degree of freedom. We show that with the proper reference by bootstrapping and adversarial orientation, the underlying true labels can be effectively estimated for training by the Sinkhorn-Knopp algorithm. Despite the simplicity, extensive experiments on a range of benchmark datasets prove that BOT consistently outperforms state-of-the-art methods, and comprehensive ablations explain the success behind BOT.", "keywords": "multi-label learning;label noise", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Lefei Zhang;Geng Yu;Jiangchao Yao;Yew-Soon Ong;Yanfeng Wang;Ivor Tsang", "authorids": "~Lefei_Zhang2;~Geng_Yu1;~Jiangchao_Yao1;~Yew-Soon_Ong1;~Yanfeng_Wang1;~Ivor_Tsang1", "gender": "M;M;M;M;M;M", "homepage": ";https://warriors-30.github.io/;https://sunarker.github.io/;https://cmic.sjtu.edu.cn/wangyanfeng/;https://www.a-star.edu.sg/cfar/about-cfar/management/prof-ivor-tsang;http://www.ntu.edu.sg/home/asysong/", "dblp": ";;166/5900;55/5407-1.html;35/5873;64/4136", "google_scholar": "https://scholar.google.com/citations?hl=en;SNp2hXIAAAAJ;w8oDh9QAAAAJ;https://scholar.google.com/citations?hl=zh-CN;rJMOlVsAAAAJ;https://scholar.google.com.tw/citations?user=h9oWOsEAAAAJ", "orcid": ";;;0000-0002-3196-2347;;0000-0002-4480-169X", "linkedin": ";;;;;", "or_profile": "~Lefei_Zhang2;~Geng_Yu1;~Jiangchao_Yao1;~Yanfeng_Wang1;~Ivor_W_Tsang1;~Yew_Soon_Ong1", "aff": "School of Computer Science and Engineering, Nanyang Technological University;Shanghai Jiaotong University;Shanghai Artificial Intelligence Laboratory;Shanghai Jiaotong University;A*STAR;Nanyang Technological University", "aff_domain": "scse.ntu.edu.sg;sjtu.edu.cn;pjlab.org.cn;sjtu.edu.cn;cfar.a-star.edu.sg;ntu.edu.sg", "position": "PhD student;MS student;Researcher;Full Professor;Principal Researcher;Full Professor", "bibtex": "@misc{\nzhang2024bot,\ntitle={{BOT}: Bootstrapped Optimal Transport for Multi-label Noise Learning},\nauthor={Lefei Zhang and Geng Yu and Jiangchao Yao and Yew-Soon Ong and Yanfeng Wang and Ivor Tsang},\nyear={2024},\nurl={https://openreview.net/forum?id=5rhgOIu4Tr}\n}", "github": "", "project": "", "reviewers": "5LvG;DxXQ;hG8D;8aJ1", "site": "https://openreview.net/forum?id=5rhgOIu4Tr", "pdf_size": 609405, "rating": "3;3;3;6", "confidence": "3;3;3;4", "soundness": "3;1;3;3", "contribution": "2;1;2;3", "presentation": "2;1;2;4", "wc_summary": "54;22;46;145", "wc_strengths": "18;16;47;220", "wc_weaknesses": "27;96;475;71", "wc_questions": "89;104;224;122", "wc_review": "188;238;792;558", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 3.75, 1.299038105676658 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.8660254037844386 ], 
"contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 2.25, 1.0897247358851685 ], "wc_summary_avg": [ 66.75, 46.687123492457744 ], "wc_strengths_avg": [ 75.25, 84.4670793859951 ], "wc_weaknesses_avg": [ 167.25, 179.38837058181892 ], "wc_questions_avg": [ 134.75, 52.83642209688313 ], "wc_review_avg": [ 444.0, 246.00406500706447 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 1.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:ydKVBCjku4kJ:scholar.google.com/&scioq=BOT:+Bootstrapped+Optimal+Transport+for+Multi-label+Noise+Learning&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1;2;1;3;0", "aff_unique_norm": "Nanyang Technological University;Shanghai Jiao Tong University;Shanghai Artificial Intelligence Laboratory;Agency for Science, Technology and Research", "aff_unique_dep": "School of Computer Science and Engineering;;;", "aff_unique_url": "https://www.ntu.edu.sg;https://www.sjtu.edu.cn;http://www.shailab.org/;https://www.a-star.edu.sg", "aff_unique_abbr": "NTU;SJTU;Shanghai AI Lab;A*STAR", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;1;1;0;0", "aff_country_unique": "Singapore;China" }, { "id": "5rrYpa2vts", "title": "EA2N: Evidence-based AMR Attention Network for Fake News Detection", "track": "main", "status": "Reject", "tldr": "", "abstract": "Proliferation of fake news has become a critical issue in today's information-driven society. Our study includes external knowledge from Wikidata and deviates from the reliance on social information to detect fake news, that many state-of-the-art (SOTA) fact-checking models adopt. This paper introduces EA$^2$N, an Evidence-based AMR Attention Network for Fake News Detection. EA$^2$N leverages Abstract Meaning Representation (AMR) and incorporates knowledge from Wikidata using proposed evidence linking algorithm, pushing the boundaries of fake news detection. The proposed framework encompasses a combination of novel language encoder and graph encoder to detect the fake news. While the language encoder effectively combines transformer encoded textual features with affective lexical features, the graph encoder encodes AMR with evidence through external knowledge, referred as WikiAMR graph. A path-aware graph learning module is designed to capture crucial semantic relationships among entities over evidences. Extensive experiments supports our model's superior performance, surpassing SOTA methodologies. 
This research not only advances the field of Fake News Detection but also showcases the potential of AMR and external knowledge for robust NLP applications, promising a more trustworthy information landscape.", "keywords": "Fake News Detection;AMR Network;Natural Language Processing", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Shubham Gupta;Abhishek Rajora;Suman Kundu", "authorids": "~Shubham_Gupta5;~Abhishek_Rajora1;~Suman_Kundu1", "gender": "M;M;M", "homepage": "https://www.csa-iitj.group/author/shubham-gupta/;https://brillard.netlify.app/;https://sumankundu.info", "dblp": ";;45/9812", "google_scholar": "z1lEsUgAAAAJ;;https://scholar.google.co.in/citations?user=2h2t9cEAAAAJ", "orcid": ";;0000-0002-7856-4768", "linkedin": ";abhishek-rajora/;drskundu/", "or_profile": "~Shubham_Gupta5;~Abhishek_Rajora1;~Suman_Kundu1", "aff": "Indian Institute of Technology, Jodhpur;Indian Institute of Technology Jodhpur;Indian Institute of Technology Jodhpur", "aff_domain": "iitj.ac.in;iitj.ac.in;iitj.ac.in", "position": "PhD student;Undergrad student;Assistant Professor", "bibtex": "@misc{\ngupta2024ean,\ntitle={{EA}2N: Evidence-based {AMR} Attention Network for Fake News Detection},\nauthor={Shubham Gupta and Abhishek Rajora and Suman Kundu},\nyear={2024},\nurl={https://openreview.net/forum?id=5rrYpa2vts}\n}", "github": "", "project": "", "reviewers": "PY31;b3Lz;hTw2;cpwY", "site": "https://openreview.net/forum?id=5rrYpa2vts", "pdf_size": 4474923, "rating": "3;3;5;5", "confidence": "4;4;2;4", "soundness": "2;3;3;3", "contribution": "1;2;2;2", "presentation": "2;3;3;3", "wc_summary": "187;44;62;127", "wc_strengths": "44;28;36;58", "wc_weaknesses": "350;97;15;200", "wc_questions": "933;2;1;62", "wc_review": "1514;171;114;447", "wc_reply_reviewers": "175;0;16;0", "wc_reply_authors": "2630;1171;170;1125", "reply_reviewers": "1;0;1;0", "reply_authors": "6;3;2;3", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 3.5, 0.8660254037844386 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 105.0, 56.519907997094265 ], "wc_strengths_avg": [ 41.5, 11.07925990308017 ], "wc_weaknesses_avg": [ 165.5, 125.07297869643946 ], "wc_questions_avg": [ 249.5, 395.39126191659824 ], "wc_review_avg": [ 561.5, 564.1615460131965 ], "wc_reply_reviewers_avg": [ 47.75, 73.75762672429204 ], "wc_reply_authors_avg": [ 1274.0, 878.9712737058021 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 3.5, 1.5 ], "replies_avg": [ 23, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:vKKJu-GsGLYJ:scholar.google.com/&scioq=EA2N:+Evidence-based+AMR+Attention+Network+for+Fake+News+Detection&hl=en&as_sdt=0,47", "gs_version_total": 3, "aff_unique_index": "0;1;1", "aff_unique_norm": "Indian Institute of Technology;Indian Institute of Technology Jodhpur", "aff_unique_dep": ";", "aff_unique_url": "https://www.iitj.ac.in;https://www.iitj.ac.in", "aff_unique_abbr": "IIT Jodhpur;IIT Jodhpur", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Jodhpur", "aff_country_unique_index": "0;0;0", "aff_country_unique": "India" }, { "title": "Whittle Index with Multiple Actions and State Constraint for Inventory Management", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19412", "id": 
"5sixirvG0I", "author_site": "Chuheng Zhang, Xiangsen Wang, Wei Jiang, Xianliang Yang, Siwei Wang, Lei Song, Jiang Bian", "tldr": "", "abstract": "Whittle index is a heuristic tool that leads to good performance for the restless bandits problem. In this paper, we extend Whittle index to a new multi-agent reinforcement learning (MARL) setting with multiple discrete actions and a possibly changing constraint on the state space, resulting in WIMS (Whittle Index with Multiple actions and State constraint). This setting is common for inventory management where each agent chooses a replenishing quantity level for the corresponding stock-keeping-unit (SKU) such that the total profit is maximized while the total inventory does not exceed a certain limit. Accordingly, we propose a deep MARL algorithm based on WIMS for inventory management. Empirically, our algorithm is evaluated on real large-scale inventory management problems with up to 2307 SKUs and outperforms operation-research-based methods and baseline MARL algorithms.", "keywords": "MARL;Inventory Management;Whittle Index", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/12a415ec19b65954850e84b6c838bc6cb9025594.pdf", "author": "Chuheng Zhang;Xiangsen Wang;Wei Jiang;Xianliang Yang;Siwei Wang;Lei Song;Jiang Bian", "authorids": "~Chuheng_Zhang1;~Xiangsen_Wang1;~Wei_Jiang12;~Xianliang_Yang1;~Siwei_Wang2;~Lei_Song3;~Jiang_Bian1", "gender": "M;M;;M;M;M;M", "homepage": ";https://github.com/sanmuyang;;https://github.com/VictorYXL;https://www.microsoft.com/en-us/research/people/siweiwang/publications/;;https://sites.google.com/view/jiangbian", "dblp": "241/9716;341/5749;21/3839-24;;51/8279-2;76/893-1.html;09/851-2.html", "google_scholar": "q7M83KQAAAAJ;;hDMnEDEAAAAJ;;;pXDSOocAAAAJ;pZBEnY8AAAAJ", "orcid": ";0000-0002-5349-9170;;;;;0000-0002-9472-600X", "linkedin": ";;wei-jiang-b364121ab/;;;;jbian/", "or_profile": "~Chuheng_Zhang1;~Xiangsen_Wang1;~Wei_Jiang12;~Xianliang_Yang1;~Siwei_Wang2;~Lei_Song3;~Jiang_Bian1", "aff": "Microsoft;;University of Illinois Urbana-Champaign;Microsoft;Microsoft;Microsoft;Microsoft", "aff_domain": "microsoft.com;;illinois.edu;microsoft.com;microsoft.com;microsoft.com;microsoft.com", "position": "Researcher;;MS student;Researcher;Researcher;Principal Researcher;Partner Research Manager", "bibtex": "@inproceedings{\nzhang2024whittle,\ntitle={Whittle Index with Multiple Actions and State Constraint for Inventory Management},\nauthor={Chuheng Zhang and Xiangsen Wang and Wei Jiang and Xianliang Yang and Siwei Wang and Lei Song and Jiang Bian},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=5sixirvG0I}\n}", "github": "", "project": "", "reviewers": "xHVA;qxXR;spvh", "pdf_size": 498190, "rating": "3;5;8", "confidence": "4;3;3", "soundness": "2;3;3", "contribution": "2;2;3", "presentation": "2;3;4", "wc_summary": "67;156;130", "wc_strengths": "36;87;234", "wc_weaknesses": "301;119;296", "wc_questions": "4;76;251", "wc_review": "408;438;911", "wc_reply_reviewers": "505;211;0", "wc_reply_authors": "1251;1221;1365", "reply_reviewers": "1;1;0", "reply_authors": "4;4;3", "rating_avg": [ 5.333333333333333, 2.0548046676563256 ], "confidence_avg": [ 3.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 3.0, 0.816496580927726 ], "wc_summary_avg": [ 117.66666666666667, 37.366057086910075 ], 
"wc_strengths_avg": [ 119.0, 83.94045508573325 ], "wc_weaknesses_avg": [ 238.66666666666666, 84.64172861078761 ], "wc_questions_avg": [ 110.33333333333333, 103.7186364910162 ], "wc_review_avg": [ 585.6666666666666, 230.37119804543468 ], "wc_reply_reviewers_avg": [ 238.66666666666666, 207.09149883297695 ], "wc_reply_authors_avg": [ 1279.0, 62.03224967708329 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 3.6666666666666665, 0.4714045207910317 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.8029550685469661, "gs_citation": 11, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5813781585575829176&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 0, "openreview": "https://openreview.net/forum?id=5sixirvG0I", "pdf": "https://openreview.net/pdf?id=5sixirvG0I", "email": "microsoft.com;;illinois.edu;microsoft.com;microsoft.com;microsoft.com;microsoft.com", "author_num": 7, "aff_unique_index": "0;1;0;0;0;0", "aff_unique_norm": "Microsoft;University of Illinois Urbana-Champaign", "aff_unique_dep": "Microsoft Corporation;", "aff_unique_url": "https://www.microsoft.com;https://illinois.edu", "aff_unique_abbr": "Microsoft;UIUC", "aff_campus_unique_index": "1", "aff_campus_unique": ";Urbana-Champaign", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "United States" }, { "title": "Robust Angular Synchronization via Directed Graph Neural Networks", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19411", "id": "5sjxMwWmk8", "author_site": "Yixuan He, Gesine Reinert, David Wipf, Mihai Cucuringu", "tldr": "", "abstract": "The angular synchronization problem aims to accurately estimate (up to a constant additive phase) a set of unknown angles $\\theta_1, \\dots, \\theta_n\\in[0, 2\\pi)$ from $m$ noisy measurements of their offsets $\\theta_i-\\theta_j$ mod $2\\pi.$ Applications include, for example, sensor network localization, phase retrieval, and distributed clock synchronization. \nAn extension of the problem to the heterogeneous setting (dubbed $k$-synchronization) is to estimate $k$ groups of angles simultaneously, given noisy observations (with unknown group assignment) from each group. Existing methods for angular synchronization usually perform poorly in high-noise regimes, which are common in applications. In this paper, we leverage neural networks for the angular synchronization problem, and its heterogeneous extension, by proposing GNNSync, a theoretically-grounded end-to-end trainable framework using directed graph neural networks. In addition, new loss functions are devised to encode synchronization objectives. 
Experimental results on extensive data sets demonstrate that GNNSync attains competitive, and often superior, performance against a comprehensive set of baselines for the angular synchronization problem and its extension, validating the robustness of GNNSync even at high noise levels.", "keywords": "group synchronization;angular synchronization;neural networks;directed graphs;deep learning;cycle consistency", "primary_area": "learning on graphs and other geometries & topologies", "supplementary_material": "", "author": "Yixuan He;Gesine Reinert;David Wipf;Mihai Cucuringu", "authorids": "~Yixuan_He2;~Gesine_Reinert1;~David_Wipf1;~Mihai_Cucuringu1", "gender": "F;F;M;M", "homepage": "https://sherylhyx.github.io/;http://www.stats.ox.ac.uk/~reinert/;http://www.davidwipf.com/;https://www.math.ucla.edu/~mihai/", "dblp": "226/6494;86/1736;81/6421;58/6857", "google_scholar": "SWme_nYAAAAJ;2gvyN5oAAAAJ;YJx1WSgAAAAJ;GFvVRzwAAAAJ", "orcid": "0000-0002-5990-0658;;;", "linkedin": "yixuan-he-sheryl/;gesine-reinert-77b64913/?originalSubdomain=uk;;mihai-cucuringu-9a866634/", "or_profile": "~Yixuan_He2;~Gesine_Reinert1;~David_Wipf1;~Mihai_Cucuringu1", "aff": "University of Oxford;University of Oxford;Amazon AI Research Lab;The Alan Turing Institute", "aff_domain": "ox.ac.uk;ox.ac.uk;amazon.com;turing.ac.uk", "position": "PhD student;Professor;Principal Research Scientist;Fellow", "bibtex": "@inproceedings{\nhe2024robust,\ntitle={Robust Angular Synchronization via Directed Graph Neural Networks},\nauthor={Yixuan He and Gesine Reinert and David Wipf and Mihai Cucuringu},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=5sjxMwWmk8}\n}", "github": "", "project": "", "reviewers": "BzAL;LD2r;UofK;tjS3", "pdf_size": 14152854, "rating": "5;6;6;8", "confidence": "2;2;3;2", "soundness": "3;3;3;3", "contribution": "2;2;2;3", "presentation": "2;3;2;3", "wc_summary": "146;49;90;102", "wc_strengths": "14;43;41;86", "wc_weaknesses": "13;17;236;46", "wc_questions": "30;62;86;39", "wc_review": "203;171;453;273", "wc_reply_reviewers": "0;0;15;0", "wc_reply_authors": "371;330;1339;196", "reply_reviewers": "0;0;1;0", "reply_authors": "1;1;3;1", "rating_avg": [ 6.25, 1.0897247358851685 ], "confidence_avg": [ 2.25, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 96.75, 34.56425176392511 ], "wc_strengths_avg": [ 46.0, 25.777897509300484 ], "wc_weaknesses_avg": [ 78.0, 92.10591729091026 ], "wc_questions_avg": [ 54.25, 21.72987574745884 ], "wc_review_avg": [ 275.0, 109.1879114188013 ], "wc_reply_reviewers_avg": [ 3.75, 6.49519052838329 ], "wc_reply_authors_avg": [ 559.0, 454.95988834181856 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.5, 0.8660254037844386 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.13245323570650439, "gs_citation": 11, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=4650950799787545403&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=5sjxMwWmk8", "pdf": "https://openreview.net/pdf?id=5sjxMwWmk8", "email": "ox.ac.uk;ox.ac.uk;amazon.com;turing.ac.uk", "author_num": 4, "aff_unique_index": "0;0;1;2", "aff_unique_norm": "University of Oxford;Amazon;Alan Turing Institute", "aff_unique_dep": ";Amazon AI Research Lab;", "aff_unique_url": 
"https://www.ox.ac.uk;https://www.amazon.com;https://www.turing.ac.uk", "aff_unique_abbr": "Oxford;Amazon AI;ATI", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;1;0", "aff_country_unique": "United Kingdom;United States" }, { "title": "Pose Modulated Avatars from Video", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19410", "id": "5t44vPlv9x", "author_site": "Chunjin Song, Bastian Wandt, Helge Rhodin", "tldr": "", "abstract": "It is now possible to reconstruct dynamic human motion and shape from a sparse set of cameras using Neural Radiance Fields (NeRF) driven by an underlying skeleton. However, a challenge remains to model the deformation of cloth and skin in relation to skeleton pose. Unlike existing avatar models that are learned implicitly or rely on a proxy surface, our approach is motivated by the observation that different poses necessitate unique frequency assignments. Neglecting this distinction yields noisy artifacts in smooth areas or blurs fine-grained texture and shape details in sharp regions. We develop a two-branch neural network that is adaptive and explicit in the frequency domain. The first branch is a graph neural network that models correlations among body parts locally, taking skeleton pose as input. The second branch combines these correlation features to a set of global frequencies and then modulates the feature encoding. Our experiments demonstrate that our network outperforms state-of-the-art methods in terms of preserving details and generalization capabilities. Our code is available at https://github.com/ChunjinSong/PM-Avatars.", "keywords": "NeRF;Neural Rendering;Dynamic Avatars;Frequency Modulation", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/e4ee940037bf645fa5a64eb09b228220e3b9f496.zip", "author": "Chunjin Song;Bastian Wandt;Helge Rhodin", "authorids": "~Chunjin_Song1;~Bastian_Wandt2;~Helge_Rhodin5", "gender": "F;M;", "homepage": "https://chunjinsong.github.io/;http://bastianwandt.de;", "dblp": "230/8001;;", "google_scholar": ";z4aXEBYAAAAJ;", "orcid": ";;", "linkedin": ";;", "or_profile": "~Chunjin_Song1;~Bastian_Wandt2;~Helge_Rhodin5", "aff": "University of British Columbia;Link\u00f6ping University;", "aff_domain": "cs.ubc.ca;liu.se;", "position": "PhD student;Assistant Professor;", "bibtex": "@inproceedings{\nsong2024pose,\ntitle={Pose Modulated Avatars from Video},\nauthor={Chunjin Song and Bastian Wandt and Helge Rhodin},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=5t44vPlv9x}\n}", "github": "", "project": "", "reviewers": "PkgA;SAAP;McVe", "pdf_size": 8773642, "rating": "6;6;6", "confidence": "4;5;4", "soundness": "3;2;3", "contribution": "2;2;2", "presentation": "3;3;4", "wc_summary": "58;56;143", "wc_strengths": "35;41;115", "wc_weaknesses": "287;84;205", "wc_questions": "7;9;95", "wc_review": "387;190;558", "wc_reply_reviewers": "43;134;0", "wc_reply_authors": "818;1719;746", "reply_reviewers": "1;1;0", "reply_authors": "3;4;1", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 4.333333333333333, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 3.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 85.66666666666667, 40.54901012629312 ], "wc_strengths_avg": [ 63.666666666666664, 36.38070306571267 
], "wc_weaknesses_avg": [ 192.0, 83.3826520726384 ], "wc_questions_avg": [ 37.0, 41.02032016777376 ], "wc_review_avg": [ 378.3333333333333, 150.36030800122157 ], "wc_reply_reviewers_avg": [ 59.0, 55.86292748027682 ], "wc_reply_authors_avg": [ 1094.3333333333333, 442.68298162705804 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 2.6666666666666665, 1.247219128924647 ], "replies_avg": [ 21, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=1398260736606413018&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=5t44vPlv9x", "pdf": "https://openreview.net/pdf?id=5t44vPlv9x", "email": "cs.ubc.ca;liu.se;", "author_num": 3, "aff_unique_index": "0;1", "aff_unique_norm": "University of British Columbia;Link\u00f6ping University", "aff_unique_dep": ";", "aff_unique_url": "https://www.ubc.ca;https://www.liu.se", "aff_unique_abbr": "UBC;LiU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1", "aff_country_unique": "Canada;Sweden" }, { "title": "Learning to Relax: Setting Solver Parameters Across a Sequence of Linear System Instances", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19409", "id": "5t57omGVMw", "author_site": "Mikhail Khodak, Edmond Chow, Nina Balcan, Ameet Talwalkar", "tldr": "", "abstract": "Solving a linear system ${\\bf Ax}={\\bf b}$ is a fundamental scientific computing primitive for which numerous solvers and preconditioners have been developed. \n\tThese come with parameters whose optimal values depend on the system being solved and are often impossible or too expensive to identify;\n\tthus in practice sub-optimal heuristics are used.\n\tWe consider the common setting in which many related linear systems need to be solved, e.g. 
during a single numerical simulation.\n\tIn this scenario, can we sequentially choose parameters that attain a near-optimal overall number of iterations, without extra matrix computations?\n\tWe answer in the affirmative for Successive Over-Relaxation (SOR), a standard solver whose parameter $\\omega$ has a strong impact on its runtime.\n\tFor this method, we prove that a bandit online learning algorithm\u2014using only the number of iterations as feedback\u2014can select parameters for a sequence of instances such that the overall cost approaches that of the best fixed $\\omega$ as the sequence length increases.\n\tFurthermore, when given additional structural information, we show that a _contextual_ bandit method asymptotically achieves the performance of the _instance-optimal_ policy, which selects the best $\\omega$ for each instance.\n\tOur work provides the first learning-theoretic treatment of high-precision linear system solvers and the first end-to-end guarantees for data-driven scientific computing, demonstrating theoretically the potential to speed up numerical methods using well-understood learning algorithms.", "keywords": "scientific computing;data-driven algorithm design;online learning;multi-armed bandits;contextual bandits;numerical analysis;learning-augmented algorithms;algorithms with predictions", "primary_area": "learning theory", "supplementary_material": "/attachment/33e10f5af5711e4f2e735654e9558c08c4e7e509.zip", "author": "Mikhail Khodak;Edmond Chow;Maria Florina Balcan;Ameet Talwalkar", "authorids": "~Mikhail_Khodak1;~Edmond_Chow1;~Maria_Florina_Balcan1;~Ameet_Talwalkar1", "gender": ";M;;M", "homepage": ";https://faculty.cc.gatech.edu/~echow/;;http://www.cs.cmu.edu/~atalwalk/", "dblp": ";96/2502;;56/5528", "google_scholar": ";jGqGKGMAAAAJ;;https://scholar.google.com.tw/citations?user=TW7U1W0AAAAJ", "orcid": ";;;", "linkedin": ";;;", "or_profile": "~Mikhail_Khodak1;~Edmond_Chow1;~Maria_Florina_Balcan1;~Ameet_Talwalkar1", "aff": ";Georgia Institute of Technology;;Carnegie Mellon University", "aff_domain": ";gatech.edu;;cmu.edu", "position": ";Full Professor;;Associate Professor", "bibtex": "@inproceedings{\nkhodak2024learning,\ntitle={Learning to Relax: Setting Solver Parameters Across a Sequence of Linear System Instances},\nauthor={Mikhail Khodak and Edmond Chow and Maria Florina Balcan and Ameet Talwalkar},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=5t57omGVMw}\n}", "github": "", "project": "", "reviewers": "655G;vVy3;7bs2;9VfQ", "pdf_size": 3100334, "rating": "8;8;8;8", "confidence": "2;3;3;3", "soundness": "3;3;3;3", "contribution": "3;4;3;3", "presentation": "3;3;4;3", "wc_summary": "27;155;415;73", "wc_strengths": "31;304;93;49", "wc_weaknesses": "34;293;81;52", "wc_questions": "112;343;234;14", "wc_review": "204;1095;823;188", "wc_reply_reviewers": "14;116;0;0", "wc_reply_authors": "323;798;764;179", "reply_reviewers": "1;1;0;0", "reply_authors": "1;2;1;1", "rating_avg": [ 8.0, 0.0 ], "confidence_avg": [ 2.75, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 3.25, 0.4330127018922193 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 167.5, 150.0691507272564 ], "wc_strengths_avg": [ 119.25, 109.02379327467926 ], "wc_weaknesses_avg": [ 115.0, 104.12732590439457 ], "wc_questions_avg": [ 175.75, 124.0894334744099 ], "wc_review_avg": [ 577.5, 393.474586218729 ], "wc_reply_reviewers_avg": [ 32.5, 48.54636958620078 ], 
"wc_reply_authors_avg": [ 516.0, 270.1138648792394 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 6, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=17888411012785696749&as_sdt=5,31&sciodt=0,31&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=5t57omGVMw", "pdf": "https://openreview.net/pdf?id=5t57omGVMw", "email": ";gatech.edu;;cmu.edu", "author_num": 4, "aff_unique_index": "0;1", "aff_unique_norm": "Georgia Institute of Technology;Carnegie Mellon University", "aff_unique_dep": ";", "aff_unique_url": "https://www.gatech.edu;https://www.cmu.edu", "aff_unique_abbr": "Georgia Tech;CMU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "title": "Prompt Risk Control: A Rigorous Framework for Responsible Deployment of Large Language Models", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19408", "id": "5tGGWOijvq", "author_site": "Thomas Zollo, Todd Morrill, Zhun Deng, Jake Snell, Toniann Pitassi, Richard Zemel", "tldr": "", "abstract": "With the explosion of the zero-shot capabilities of (and thus interest in) pre-trained large language models, there has come accompanying interest in how best to prompt a language model to perform a given task. While it may be tempting to choose a prompt based on empirical results on a validation set, this can lead to a deployment where an unexpectedly high loss occurs. To mitigate this prospect, we propose a lightweight framework, Prompt Risk Control, for selecting a prompt based on rigorous upper bounds on families of informative risk measures. We provide and compare different methods for producing bounds on a diverse set of risk metrics like mean, CVaR, and the Gini coefficient of the loss distribution. In addition, we extend the underlying statistical bounding techniques to accommodate the possibility of distribution shifts in deployment. 
Extensive experiments on high-impact applications like chatbots, medical question answering, and news summarization highlight why such a framework is necessary to reduce exposure to the worst outcomes.", "keywords": "distribution-free uncertainty quantification;large language models;responsible AI", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/3c5a3c65a364905473f9e6916dd413b2fa2576d4.zip", "author": "Thomas P Zollo;Todd Morrill;Zhun Deng;Jake Snell;Toniann Pitassi;Richard Zemel", "authorids": "~Thomas_P_Zollo1;~Todd_Morrill1;~Zhun_Deng1;~Jake_Snell1;~Toniann_Pitassi3;~Richard_Zemel1", "gender": "M;Not Specified;M;M;F;M", "homepage": "https://www.thomaszollo.com/;http://toddmorrill.github.io/;https://www.zhundeng.org/;https://www.jakesnell.com;http://www.cs.columbia.edu/~toni;http://www.cs.columbia.edu/~zemel", "dblp": "336/8946;;204/4353;172/1406;p/TPitassi;16/6366", "google_scholar": "Xp7LgAwAAAAJ;;nkmi-moAAAAJ;MbXKAK8AAAAJ;;https://scholar.google.ca/citations?user=iBeDoRAAAAAJ", "orcid": ";;;;;", "linkedin": "thomas-zollo/;todd-morrill-a0b47b2a/;;;;", "or_profile": "~Thomas_P_Zollo1;~Todd_Morrill1;~Zhun_Deng1;~Jake_Snell1;~Toniann_Pitassi3;~Richard_Zemel1", "aff": "Columbia University;Columbia University;Columbia University;Princeton University;Columbia University;Department of Computer Science, University of Toronto", "aff_domain": "columbia.edu;columbia.edu;columbia.edu;princeton.edu;columbia.edu;cs.toronto.edu", "position": "PhD student;MS student;Postdoc;Postdoc;Full Professor;Full Professor", "bibtex": "@inproceedings{\nzollo2024prompt,\ntitle={Prompt Risk Control: A Rigorous Framework for Responsible Deployment of Large Language Models},\nauthor={Thomas P Zollo and Todd Morrill and Zhun Deng and Jake Snell and Toniann Pitassi and Richard Zemel},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=5tGGWOijvq}\n}", "github": "", "project": "", "reviewers": "FU87;sC6o;YTab;CoFo", "pdf_size": 2319945, "rating": "6;6;6;8", "confidence": "3;4;4;3", "soundness": "3;3;3;3", "contribution": "3;2;3;3", "presentation": "3;2;4;3", "wc_summary": "92;82;135;216", "wc_strengths": "117;56;23;82", "wc_weaknesses": "64;178;59;113", "wc_questions": "86;193;178;218", "wc_review": "359;509;395;629", "wc_reply_reviewers": "0;0;10;6", "wc_reply_authors": "328;761;480;472", "reply_reviewers": "0;0;1;1", "reply_authors": "1;2;1;1", "rating_avg": [ 6.5, 0.8660254037844386 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 131.25, 52.826958080131774 ], "wc_strengths_avg": [ 69.5, 34.48550420104076 ], "wc_weaknesses_avg": [ 103.5, 47.90876746483883 ], "wc_questions_avg": [ 168.75, 49.866697303912154 ], "wc_review_avg": [ 473.0, 105.72606112023658 ], "wc_reply_reviewers_avg": [ 4.0, 4.242640687119285 ], "wc_reply_authors_avg": [ 510.25, 156.89865359524282 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 10, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=15589174670380778205&as_sdt=40005&sciodt=0,10&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=5tGGWOijvq", "pdf": "https://openreview.net/pdf?id=5tGGWOijvq", "email": 
"columbia.edu;columbia.edu;columbia.edu;princeton.edu;columbia.edu;cs.toronto.edu", "author_num": 6, "aff_unique_index": "0;0;0;1;0;2", "aff_unique_norm": "Columbia University;Princeton University;University of Toronto", "aff_unique_dep": ";;Department of Computer Science", "aff_unique_url": "https://www.columbia.edu;https://www.princeton.edu;https://www.utoronto.ca", "aff_unique_abbr": "Columbia;Princeton;U of T", "aff_campus_unique_index": "1", "aff_campus_unique": ";Toronto", "aff_country_unique_index": "0;0;0;0;0;1", "aff_country_unique": "United States;Canada" }, { "id": "5tSLtvkHCh", "title": "Learning Temporal Causal Representation under Non-Invertible Generation Process", "track": "main", "status": "Reject", "tldr": "", "abstract": "Identifying the underlying time-delayed latent causal processes in sequential data is vital for grasping temporal dynamics and making downstream reasoning. While some recent methods can robustly identify these latent causal variables, they rely on strict assumptions about the invertible generation process from latent variables to observed data. These assumptions are often hard to satisfy in real-world applications containing information loss. For instance, the visual perception process translates a 3D space into 2D images, or the phenomenon of persistence of vision incorporates historical data into current perceptions. To address this challenge, we establish an identifiability theory that allows for the recovery of independent latent components even when they come from a nonlinear and non-invertible mix. Using this theory as a foundation, we propose a principled approach, CaRiNG, to learn the Causal Representation of Non-invertible Generative temporal data with identifiability guarantees. Specifically, we utilize the temporal context to recover lost latent information and employ the conditions in our theory to guide the training process. Through experiments conducted on synthetic datasets, we validate that the causal process is reliably identified by CaRiNG, even when the generation process is non-invertible. 
Moreover, we show that our approach considerably improves temporal understanding and reasoning in practical applications.", "keywords": "Causal Representation Learning;Uninvertible Mixing Function;Temporal Series;Indentifiability", "primary_area": "causal reasoning", "supplementary_material": "/attachment/4ff61499968ef63f351f65f927be1c1538469adb.zip", "author": "Guangyi Chen;Yifan Shen;Zhenhao Chen;Xiangchen Song;Yuewen Sun;Weiran Yao;Xiao Liu;Kun Zhang", "authorids": "~Guangyi_Chen1;~Yifan_Shen4;~Zhenhao_Chen1;~Xiangchen_Song1;~Yuewen_Sun1;~Weiran_Yao1;~Xiao_Liu23;~Kun_Zhang1", "gender": "M;M;M;M;F;M;M;M", "homepage": "https://chengy12.github.io/;https://sanshuiii.github.io/about/;https://zhenhaochenofficial.github.io/;https://xiangchensong.github.io/;https://yuewen-sun.github.io/;;;http://www.andrew.cmu.edu/user/kunz1/", "dblp": "c/GuangyiChen-2;59/7950-4;192/7717;261/9024;219/9893;192/3295;;96/3115-1", "google_scholar": "https://scholar.google.com/citations?hl=zh-CN;PMKkElwAAAAJ;xOAtM0YAAAAJ;foR8BIoAAAAJ;https://scholar.google.com/citations?hl=en;rr_leUAAAAAJ;;RGoypN4AAAAJ", "orcid": ";0000-0003-2358-1146;;;;;;", "linkedin": ";;;;;;xiao-l-699069205/;", "or_profile": "~Guangyi_Chen1;~Yifan_Shen4;~Zhenhao_Chen1;~Xiangchen_Song1;~Yuewen_Sun1;~Weiran_Yao1;~Xiao_Liu23;~Kun_Zhang1", "aff": "Carnegie Mellon University;Mohamed bin Zayed University of Artificial Intelligence;Mohamed bin Zayed University of Artificial Intelligence;Carnegie Mellon University;Mohamed bin Zayed University of Artificial Intelligence;SalesForce.com;Technische Universit\u00e4t Darmstadt;Carnegie Mellon University", "aff_domain": "cmu.edu;mbzuai.ac.ae;mbzuai.ac.ae;cmu.edu;mbzuai.ac.ae;salesforce.com;tu-darmstadt.de;cmu.edu", "position": "Postdoc;MS student;PhD student;PhD student;Postdoc;Researcher;Researcher;Associate Professor", "bibtex": "@misc{\nchen2024learning,\ntitle={Learning Temporal Causal Representation under Non-Invertible Generation Process},\nauthor={Guangyi Chen and Yifan Shen and Zhenhao Chen and Xiangchen Song and Yuewen Sun and Weiran Yao and Xiao Liu and Kun Zhang},\nyear={2024},\nurl={https://openreview.net/forum?id=5tSLtvkHCh}\n}", "github": "", "project": "", "reviewers": "ur5z;5cYn;WQAA;uMXb", "site": "https://openreview.net/forum?id=5tSLtvkHCh", "pdf_size": 3436455, "rating": "3;5;6;8", "confidence": "4;3;3;2", "soundness": "2;3;3;3", "contribution": "3;2;4;3", "presentation": "1;3;3;3", "wc_summary": "591;99;101;114", "wc_strengths": "76;32;58;32", "wc_weaknesses": "1269;346;383;85", "wc_questions": "44;125;35;304", "wc_review": "1980;602;577;535", "wc_reply_reviewers": "349;151;166;14", "wc_reply_authors": "3789;2347;2290;1130", "reply_reviewers": "2;1;3;1", "reply_authors": "8;7;8;3", "rating_avg": [ 5.5, 1.8027756377319946 ], "confidence_avg": [ 3.0, 0.7071067811865476 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 3.0, 0.7071067811865476 ], "presentation_avg": [ 2.5, 0.8660254037844386 ], "wc_summary_avg": [ 226.25, 210.66724353823972 ], "wc_strengths_avg": [ 49.5, 18.621224449536072 ], "wc_weaknesses_avg": [ 520.75, 447.009158183588 ], "wc_questions_avg": [ 127.0, 108.03471664238306 ], "wc_review_avg": [ 923.5, 610.4402100124139 ], "wc_reply_reviewers_avg": [ 170.0, 119.11549017655092 ], "wc_reply_authors_avg": [ 2389.0, 942.9536043729829 ], "reply_reviewers_avg": [ 1.75, 0.82915619758885 ], "reply_authors_avg": [ 6.5, 2.0615528128088303 ], "replies_avg": [ 39, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": -0.9805806756909202, "gs_citation": 0, 
"gs_cited_by_link": "https://scholar.google.com/scholar?q=related:abend1rZPOMJ:scholar.google.com/&scioq=Learning+Temporal+Causal+Representation+under+Non-Invertible+Generation+Process&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;1;1;0;1;2;3;0", "aff_unique_norm": "Carnegie Mellon University;Mohamed bin Zayed University of Artificial Intelligence;Salesforce;Technische Universit\u00e4t Darmstadt", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.cmu.edu;https://mbzuai.ac.ae;https://www.salesforce.com;https://www.tu-darmstadt.de", "aff_unique_abbr": "CMU;MBZUAI;Salesforce;TUD", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;1;0;1;0;2;0", "aff_country_unique": "United States;United Arab Emirates;Germany" }, { "id": "5tYTCyYI27", "title": "Calibration Bottleneck: What Makes Neural Networks less Calibratable?", "track": "main", "status": "Reject", "tldr": "", "abstract": "While modern deep neural networks have achieved remarkable success, they have exhibited a notable deficiency in reliably estimating uncertainty. Many existing studies address the uncertainty calibration problem by incorporating regularization techniques to penalize the overconfident outputs during training. In this study, we shift the focus from the miscalibration encountered in the training phase to an investigation of the concept of calibratability, assessing how amenable a model is to be recalibrated in post-training phase. We find that the use of regularization techniques might compromise calibratability, subsequently leading to a decline in final calibration performance after recalibration. To identify the underlying causes leading to poor calibratability, we delve into the calibration of intermediate features across neural networks\u2019 hidden layers. Our study demonstrates that the overtraining of the top layers in neural networks poses a significant obstacle to calibration, while these layers typically offer minimal improvement to the discriminability of features. Based on this observation, we introduce a weak classifier hypothesis: Given a weak classification head, the bottom layers of a neural network can be learned better for producing calibratable features. Consequently, we propose a progressively layer-peeled training (PLT) method to exploit this hypothesis, thereby enhancing model calibratability. 
Comprehensive experiments show the effectiveness of our method, which improves model calibration and also yields competitive predictive performance.", "keywords": "Uncertainty Calibration;Post-hoc Calibration", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Deng-Bao Wang;Min-Ling Zhang", "authorids": "~Deng-Bao_Wang1;~Min-Ling_Zhang2", "gender": "M;M", "homepage": "https://dengbaowang.github.io/;http://palm.seu.edu.cn/zhangml/", "dblp": "204/2255;84/271.html", "google_scholar": "QCA7j2cAAAAJ;uFHCIM0AAAAJ", "orcid": ";0000-0003-1880-5918", "linkedin": ";", "or_profile": "~Deng-Bao_Wang1;~Min-Ling_Zhang2", "aff": "Southeast University;Southeast University", "aff_domain": "seu.edu.cn;seu.edu.cn", "position": "PhD student;Full Professor", "bibtex": "@misc{\nwang2024calibration,\ntitle={Calibration Bottleneck: What Makes Neural Networks less Calibratable?},\nauthor={Deng-Bao Wang and Min-Ling Zhang},\nyear={2024},\nurl={https://openreview.net/forum?id=5tYTCyYI27}\n}", "github": "", "project": "", "reviewers": "VAxV;x8eC;7Hnm", "site": "https://openreview.net/forum?id=5tYTCyYI27", "pdf_size": 1609285, "rating": "3;5;8", "confidence": "5;4;4", "soundness": "2;1;3", "contribution": "2;3;3", "presentation": "2;2;4", "wc_summary": "55;70;238", "wc_strengths": "35;35;144", "wc_weaknesses": "208;208;72", "wc_questions": "6;29;569", "wc_review": "304;342;1023", "wc_reply_reviewers": "140;170;0", "wc_reply_authors": "636;850;990", "reply_reviewers": "1;1;0", "reply_authors": "3;3;3", "rating_avg": [ 5.333333333333333, 2.0548046676563256 ], "confidence_avg": [ 4.333333333333333, 0.4714045207910317 ], "soundness_avg": [ 2.0, 0.816496580927726 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.9428090415820634 ], "wc_summary_avg": [ 121.0, 82.95782060782456 ], "wc_strengths_avg": [ 71.33333333333333, 51.383092766222454 ], "wc_weaknesses_avg": [ 162.66666666666666, 64.1110148275803 ], "wc_questions_avg": [ 201.33333333333334, 260.1491025461275 ], "wc_review_avg": [ 556.3333333333334, 330.34762834861635 ], "wc_reply_reviewers_avg": [ 103.33333333333333, 74.08703590297624 ], "wc_reply_authors_avg": [ 825.3333333333334, 145.56861688640936 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 3.0, 0.0 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.8029550685469661, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:Hcc0M9RomiEJ:scholar.google.com/&scioq=Calibration+Bottleneck:+What+Makes+Neural+Networks+less+Calibratable%3F&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "Southeast University", "aff_unique_dep": "", "aff_unique_url": "https://www.seu.edu.cn/", "aff_unique_abbr": "SEU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "China" }, { "id": "5twh6pM4SR", "title": "Automating Continual Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "General-purpose learning systems should improve themselves in open-ended fashion in ever-changing environments. Conventional learning algorithms for neural networks, however, suffer from the so-called catastrophic forgetting (CF) problem---previously acquired skills are forgotten when a new task is learned. 
Developing continual learning algorithms to address CF remains an open research question.\nInstead of hand-crafting such algorithms, our new Automated Continual Learning (ACL) trains self-referential neural networks to meta-learn their own in-context continual (meta-)learning algorithms. ACL encodes all desiderata---good performance on both old and new tasks---into its learning objectives. We demonstrate the effectiveness and promise of ACL on multiple few-shot and standard image classification tasks adopted for continual learning: Mini-ImageNet, Omniglot, FC100, MNIST-families, and CIFAR-10.", "keywords": "continual learning;in-context learning;meta-learning;self-referential learning;linear Transformers", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "/attachment/925a674e61a8908054ac10f952d54a9d6cb7b1ee.zip", "author": "Kazuki Irie;R\u00f3bert Csord\u00e1s;J\u00fcrgen Schmidhuber", "authorids": "~Kazuki_Irie1;~R\u00f3bert_Csord\u00e1s1;~J\u00fcrgen_Schmidhuber1", "gender": ";M;M", "homepage": "https://sites.harvard.edu/kazuki-irie/;https://robertcsordas.github.io/;http://people.idsia.ch/~juergen/", "dblp": "148/9667;166/4773.html;s/JurgenSchmidhuber", "google_scholar": "https://scholar.google.de/citations?user=-gZ-BdwAAAAJ;av1lplwAAAAJ;https://scholar.google.ch/citations?user=gLnCTgIAAAAJ", "orcid": "0000-0003-0923-691X;;", "linkedin": ";robertcsordas/;", "or_profile": "~Kazuki_Irie1;~R\u00f3bert_Csord\u00e1s1;~J\u00fcrgen_Schmidhuber1", "aff": "Harvard University;IDSIA;IDSIA", "aff_domain": "fas.harvard.edu;idsia.ch;idsia.ch", "position": "Postpostdoc;Postdoc;Scientific Director", "bibtex": "@misc{\nirie2024automating,\ntitle={Automating Continual Learning},\nauthor={Kazuki Irie and R{\\'o}bert Csord{\\'a}s and J{\\\"u}rgen Schmidhuber},\nyear={2024},\nurl={https://openreview.net/forum?id=5twh6pM4SR}\n}", "github": "", "project": "", "reviewers": "StyD;jN2L;WhrD", "site": "https://openreview.net/forum?id=5twh6pM4SR", "pdf_size": 492759, "rating": "5;5;6", "confidence": "4;4;3", "soundness": "3;2;2", "contribution": "2;2;2", "presentation": "2;3;4", "wc_summary": "44;102;60", "wc_strengths": "56;35;80", "wc_weaknesses": "327;48;115", "wc_questions": "79;455;55", "wc_review": "506;640;310", "wc_reply_reviewers": "834;405;15", "wc_reply_authors": "2585;2136;551", "reply_reviewers": "2;2;1", "reply_authors": "5;6;2", "rating_avg": [ 5.333333333333333, 0.4714045207910317 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 3.0, 0.816496580927726 ], "wc_summary_avg": [ 68.66666666666667, 24.458581770458856 ], "wc_strengths_avg": [ 57.0, 18.384776310850235 ], "wc_weaknesses_avg": [ 163.33333333333334, 118.91827258901617 ], "wc_questions_avg": [ 196.33333333333334, 183.1671974514602 ], "wc_review_avg": [ 485.3333333333333, 135.51219707301465 ], "wc_reply_reviewers_avg": [ 418.0, 334.4816885869838 ], "wc_reply_authors_avg": [ 1757.3333333333333, 872.4793534647238 ], "reply_reviewers_avg": [ 1.6666666666666667, 0.4714045207910317 ], "reply_authors_avg": [ 4.333333333333333, 1.699673171197595 ], "replies_avg": [ 25, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.9999999999999997, "gs_citation": 4, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=16950957273444981926&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "aff_unique_index": "0;1;1", "aff_unique_norm": "Harvard 
University;Institute of Digital Technologies", "aff_unique_dep": ";", "aff_unique_url": "https://www.harvard.edu;https://www.idsia.ch", "aff_unique_abbr": "Harvard;IDSIA", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;1", "aff_country_unique": "United States;Switzerland" }, { "id": "5vJe8XKFv0", "title": "CoNO: Complex Neural Operator for Continuous Dynamical Systems", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Neural operators extend data-driven models to map between infinite-dimensional functional spaces. These models have successfully solved continuous dynamical systems represented by differential equations, viz weather forecasting, fluid flow, or solid mechanics. However, the existing operators still rely on real space, thereby losing rich representations potentially captured in the complex space by functional transforms. In this paper, we introduce a Complex Neural Operator (CoNO), that parameterizes the integral kernel in the complex fractional Fourier domain. Additionally, the model employing a complex-valued neural network along with aliasing-free activation functions preserves the complex values and complex algebraic properties, thereby enabling improved representation, robustness to noise, and generalization. We show that the model effectively captures the underlying partial differential equation with a single complex fractional Fourier transform. We perform an extensive empirical evaluation of CoNO on several datasets and additional tasks such as zero-shot super-resolution, evaluation of out-of-distribution data, data efficiency, and robustness to noise. CoNO exhibits comparable or superior performance to all the state-of-the-art models in these tasks. Altogether, CoNO presents a robust and superior model for modeling continuous dynamical systems, providing a fillip to scientific machine learning. 
Our code implementation is available at https://anonymous.4open.science/r/anonymous-cono.", "keywords": "Complex valued neural network;neural operator;partial differential equations;dynamical systems", "primary_area": "applications to physical sciences (physics, chemistry, biology, etc.)", "supplementary_material": "", "author": "Karn Tiwari;N M Anoop Krishnan;Prathosh AP", "authorids": "~Karn_Tiwari1;~N_M_Anoop_Krishnan1;~Prathosh_AP1", "gender": "M;M;M", "homepage": ";;https://sites.google.com/view/prathosh", "dblp": ";;218/5887", "google_scholar": ";https://scholar.google.co.in/citations?user=fGnjHcEAAAAJ;https://scholar.google.co.in/citations?user=OEwV4bsAAAAJ", "orcid": ";0000-0003-1500-4947;", "linkedin": "karn3003/;;prathosh-ap-phd-50ab9511/", "or_profile": "~Karn_Tiwari1;~N_M_Anoop_Krishnan1;~Prathosh_AP1", "aff": "Indian Institute of Science, Indian institute of science, Bangalore;Indian Institute of Technology Delhi;Indian Institute of Science, Indian institute of science, Bangalore", "aff_domain": "iisc.ac.in;iitd.ac.in;iisc.ac.in", "position": "PhD student;Associate Professor;Assistant Professor", "bibtex": "@misc{\ntiwari2024cono,\ntitle={Co{NO}: Complex Neural Operator for Continuous Dynamical Systems},\nauthor={Karn Tiwari and N M Anoop Krishnan and Prathosh AP},\nyear={2024},\nurl={https://openreview.net/forum?id=5vJe8XKFv0}\n}", "github": "", "project": "", "reviewers": "Ubji;CUfC;8MNi;HK2j", "site": "https://openreview.net/forum?id=5vJe8XKFv0", "pdf_size": 2293479, "rating": "3;3;5;5", "confidence": "4;4;4;4", "soundness": "2;2;3;3", "contribution": "2;2;3;2", "presentation": "1;1;3;2", "wc_summary": "47;54;290;76", "wc_strengths": "17;42;152;80", "wc_weaknesses": "361;130;276;180", "wc_questions": "39;89;2;272", "wc_review": "464;315;720;608", "wc_reply_reviewers": "0;0;0;21", "wc_reply_authors": "135;284;261;396", "reply_reviewers": "0;0;0;1", "reply_authors": "1;1;1;1", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 1.75, 0.82915619758885 ], "wc_summary_avg": [ 116.75, 100.59665749914357 ], "wc_strengths_avg": [ 72.75, 50.957703048705014 ], "wc_weaknesses_avg": [ 236.75, 88.87456047711291 ], "wc_questions_avg": [ 100.5, 103.71716347837517 ], "wc_review_avg": [ 526.75, 152.25205253132057 ], "wc_reply_reviewers_avg": [ 5.25, 9.093266739736606 ], "wc_reply_authors_avg": [ 269.0, 92.70113267916417 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 10, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11430387391731248986&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "aff_unique_index": "0;1;0", "aff_unique_norm": "Indian Institute of Science;Indian Institute of Technology Delhi", "aff_unique_dep": ";", "aff_unique_url": "https://www.iisc.ac.in;https://www.iitd.ac.in", "aff_unique_abbr": "IISc;IIT Delhi", "aff_campus_unique_index": "0;1;0", "aff_campus_unique": "Bangalore;Delhi", "aff_country_unique_index": "0;0;0", "aff_country_unique": "India" }, { "id": "5vXDQ65dzH", "title": "ParFam - Symbolic Regression Based on Continuous Global Optimization", "track": "main", "status": "Reject", "tldr": "", "abstract": "The problem of symbolic regression (SR) arises in many different applications, such as identifying physical laws or deriving mathematical equations describing the behavior of financial markets from 
given data. Various methods exist to address the problem of SR, often based on genetic programming. However, these methods are usually quite complicated and require a lot of hyperparameter tuning and computational resources. \nIn this paper, we present our new method ParFam that utilizes parametric families of suitable symbolic functions to translate the discrete symbolic regression problem into a continuous one, resulting in a more straightforward setup compared to current state-of-the-art methods. \nIn combination with a powerful global optimizer, this approach results in an effective method to tackle the problem of SR. \nFurthermore, it can be easily extended to more advanced algorithms, e.g., by adding a deep neural network to find good-fitting parametric families. \nWe prove the performance of ParFam with extensive numerical experiments based on the common SR benchmark suit SRBench, showing that we achieve state-of-the-art results. Our code can be found at https://anonymous.4open.science/r/parfam-90FC/README.md.", "keywords": "symbolic regression;global optimization;deep learning", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Philipp Scholl;Katharina Bieker;Hillary Hauger;Gitta Kutyniok", "authorids": "~Philipp_Scholl2;~Katharina_Bieker1;~Hillary_Hauger3;~Gitta_Kutyniok2", "gender": "M;;F;F", "homepage": ";;;https://www.ai.math.lmu.de/kutyniok", "dblp": "31/6987;;;13/2736", "google_scholar": "https://scholar.google.com/citations?hl=en;;;https://scholar.google.de/citations?user=JHs9LssAAAAJ", "orcid": ";;;0000-0001-9738-2487", "linkedin": ";;hillary-hauger-391a7721b;gitta-kutyniok-2606b215/?originalSubdomain=de", "or_profile": "~Philipp_Scholl2;~Katharina_Bieker1;~Hillary_Hauger3;~Gitta_Kutyniok2", "aff": "University of Munich, Ludwig-Maximilians-Universit\u00e4t M\u00fcnchen;;Technische Universit\u00e4t M\u00fcnchen;LMU Munich", "aff_domain": "campus.lmu.de;;tum.de;uni-muenchen.de", "position": "PhD student;;MS student;Full Professor", "bibtex": "@misc{\nscholl2024parfam,\ntitle={ParFam - Symbolic Regression Based on Continuous Global Optimization},\nauthor={Philipp Scholl and Katharina Bieker and Hillary Hauger and Gitta Kutyniok},\nyear={2024},\nurl={https://openreview.net/forum?id=5vXDQ65dzH}\n}", "github": "", "project": "", "reviewers": "1Ff3;LMH9;5PDr;8mnU", "site": "https://openreview.net/forum?id=5vXDQ65dzH", "pdf_size": 510269, "rating": "5;5;5;6", "confidence": "4;3;4;2", "soundness": "1;2;2;2", "contribution": "2;2;2;2", "presentation": "3;2;3;2", "wc_summary": "30;135;105;67", "wc_strengths": "22;33;46;28", "wc_weaknesses": "166;469;101;187", "wc_questions": "90;27;103;31", "wc_review": "308;664;355;313", "wc_reply_reviewers": "56;60;0;0", "wc_reply_authors": "1091;544;577;1443", "reply_reviewers": "1;1;0;0", "reply_authors": "2;1;1;2", "rating_avg": [ 5.25, 0.4330127018922193 ], "confidence_avg": [ 3.25, 0.82915619758885 ], "soundness_avg": [ 1.75, 0.4330127018922193 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 84.25, 39.51819201329939 ], "wc_strengths_avg": [ 32.25, 8.842369591913696 ], "wc_weaknesses_avg": [ 230.75, 141.16014841307017 ], "wc_questions_avg": [ 62.75, 34.09087121210017 ], "wc_review_avg": [ 410.0, 147.77855054100374 ], "wc_reply_reviewers_avg": [ 29.0, 29.03446228191595 ], "wc_reply_authors_avg": [ 913.75, 374.7128066933395 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 4, 0 
], "corr_rating_confidence": -0.8703882797784891, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=7557527737156987216&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 2, "aff_unique_index": "0;1;2", "aff_unique_norm": "Ludwig-Maximilians-Universit\u00e4t M\u00fcnchen;Technische Universit\u00e4t M\u00fcnchen;Ludwig Maximilian University of Munich", "aff_unique_dep": ";;", "aff_unique_url": "https://www.lmu.de;https://www.tum.de;https://www.lmu.de", "aff_unique_abbr": "LMU;TUM;LMU", "aff_campus_unique_index": "1", "aff_campus_unique": ";Munich", "aff_country_unique_index": "0;0;0", "aff_country_unique": "Germany" }, { "id": "5vY0HNpy9F", "title": "PyTrial: Machine Learning Software and Benchmark for Clinical Trial Applications", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Clinical trials are conducted to test the effectiveness and safety of potential drugs in humans for regulatory approval. Machine learning (ML) has recently emerged as a new tool to assist in clinical trials. Despite this progress, there have been few efforts to document and benchmark ML4Trial algorithms available to the ML research community. Additionally, the accessibility to clinical trial-related datasets is limited, and there is a lack of well-defined clinical tasks to facilitate the development of new algorithms.\n\nTo fill this gap, we have developed PyTrial that provides benchmarks and open-source implementations of a series of ML algorithms for clinical trial design and operations. In this paper, we thoroughly investigate 34 ML algorithms for clinical trials across 6 different tasks, including patient outcome prediction, trial site selection, trial outcome prediction, patient-trial matching, trial similarity search, and synthetic data generation. We have also collected and prepared 23 ML-ready datasets as well as their working examples in Jupyter Notebooks for quick implementation and testing.\n\nPyTrial defines each task through a simple four-step process: data loading, model specification, model training, and model evaluation, all achievable with just a few lines of code. 
Furthermore, our modular API architecture empowers practitioners to expand the framework to incorporate new algorithms and tasks effortlessly.", "keywords": "Drug development;Clinical trial;Healthcare;Machine Learning;Deep Learning", "primary_area": "datasets and benchmarks", "supplementary_material": "", "author": "Zifeng Wang;Brandon Philip Theodorou;Tianfan Fu;Cao Xiao;Jimeng Sun", "authorids": "~Zifeng_Wang3;~Brandon_Philip_Theodorou1;~Tianfan_Fu1;~Cao_Xiao2;~Jimeng_Sun3", "gender": "M;M;M;F;", "homepage": "https://zifengwang.xyz;;https://futianfan.github.io/;https://sites.google.com/view/danicaxiao/home;http://sunlab.org", "dblp": ";;;170/1833;", "google_scholar": "kMlWwTAAAAAJ;xWjAUGsAAAAJ;KPQ49w4AAAAJ;ahaV25EAAAAJ;9jmmp5sAAAAJ", "orcid": ";;;;0000-0003-1512-6426", "linkedin": ";brandon-theodorou-284b6b148;;caoxiao/;jimengsun/", "or_profile": "~Zifeng_Wang3;~Brandon_Philip_Theodorou1;~Tianfan_Fu1;~Cao_Xiao2;~Jimeng_Sun3", "aff": "University of Illinois, Urbana Champaign;University of Illinois, Urbana Champaign;Rensselaer Polytechnic Institute;GE Healthcare;Georgia Institute of Technology", "aff_domain": "illinois.edu;illinois.edu;rpi.edu;ge.com;gatech.edu", "position": "PhD student;PhD student;Assistant Professor;VP of AI;Associate Professor", "bibtex": "@misc{\nwang2024pytrial,\ntitle={PyTrial: Machine Learning Software and Benchmark for Clinical Trial Applications},\nauthor={Zifeng Wang and Brandon Philip Theodorou and Tianfan Fu and Cao Xiao and Jimeng Sun},\nyear={2024},\nurl={https://openreview.net/forum?id=5vY0HNpy9F}\n}", "github": "", "project": "", "reviewers": "dwRR;cWL5;BJYq;nm57", "site": "https://openreview.net/forum?id=5vY0HNpy9F", "pdf_size": 1515128, "rating": "5;5;5;5", "confidence": "3;5;4;3", "soundness": "2;2;3;3", "contribution": "2;3;2;3", "presentation": "2;3;3;3", "wc_summary": "51;45;105;148", "wc_strengths": "110;40;64;160", "wc_weaknesses": "292;261;60;148", "wc_questions": "13;3;158;152", "wc_review": "466;349;387;608", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 5.0, 0.0 ], "confidence_avg": [ 3.75, 0.82915619758885 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 87.25, 42.14483954175173 ], "wc_strengths_avg": [ 93.5, 45.89934640057525 ], "wc_weaknesses_avg": [ 190.25, 92.34277177992873 ], "wc_questions_avg": [ 81.5, 73.61555542139175 ], "wc_review_avg": [ 452.5, 99.20307454912877 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=9688703640964513495&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 3, "aff_unique_index": "0;0;1;2;3", "aff_unique_norm": "University of Illinois Urbana-Champaign;Rensselaer Polytechnic Institute;GE Healthcare;Georgia Institute of Technology", "aff_unique_dep": ";;;", "aff_unique_url": "https://illinois.edu;https://www.rpi.edu;https://www.gehealthcare.com;https://www.gatech.edu", "aff_unique_abbr": "UIUC;RPI;GEHC;Georgia Tech", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Urbana-Champaign;", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "5vcqlmDokC", "title": "Enhanced Gradient Aligned Continual Learning via Pareto Optimization", "track": "main", 
"status": "Withdraw", "tldr": "", "abstract": "Catastrophic forgetting remains a core challenge in continual learning (CL), whereby the models struggle to retain previous knowledge when learning new tasks. While existing gradient-alignment-based CL methods have been proposed to tackle this challenge by aligning gradients between previous and current tasks, they do not carefully consider the interdependence between previously learned tasks and fully explore the potential of seen tasks. Against this issue, we first adopt the MiniMax theorem and reformulate the existing commonly-adopted gradient alignment optimization problem in a gradient weighting framework. Then we incorporate the Pareto optimality to capture the interrelationship among previously learned tasks, and design a Pareto regularized gradient alignment algorithm (PRGA), which effectively enhances the overall performance of past tasks while ensuring the performance of the current task. Comprehensive empirical results demonstrate that the proposed PRGA outperforms current state-of-the-art continual learning methods across multiple datasets and different settings.", "keywords": "continual learning", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "", "author": "Yichen Wu;Hong Wang;Long-Kai Huang;Yefeng Zheng;Peilin Zhao;Ying Wei", "authorids": "~Yichen_Wu2;~Hong_Wang5;~Long-Kai_Huang1;~Yefeng_Zheng2;~Peilin_Zhao2;~Ying_Wei1", "gender": "M;F;;M;;F", "homepage": "https://wuyichen-97.github.io/;https://hongwang01.github.io/;https://sites.google.com/site/longkaihugo/home;https://en.westlake.edu.cn/faculty/yefeng-zheng.html;;https://wei-ying.net/", "dblp": ";83/5522-21;133/2006;44/6510;84/8411;14/4899-1", "google_scholar": "https://scholar.google.com/citations?hl=zh-CN;I5RH0CwAAAAJ;CaP64WUAAAAJ;vAIECxgAAAAJ;https://scholar.google.com.hk/citations?user=HPeX_YcAAAAJ;5UpFdKsAAAAJ", "orcid": "0000-0003-2859-3285;;0000-0001-5263-1443;0000-0003-2195-2847;0000-0001-8543-3953;", "linkedin": ";;;yefeng-zheng-bb45641/?originalSubdomain=cn;;", "or_profile": "~Yichen_Wu2;~Hong_Wang5;~Long-Kai_Huang1;~Yefeng_Zheng2;~Peilin_Zhao2;~Ying_Wei1", "aff": "City University of Hong Kong;Tencent ;Tencent;Tencent Jarvis Lab;Tencent;Nanyang Technological University", "aff_domain": "cityu.edu.hk;tencent.com;tencent.com;tencent.com;tencent.com;ntu.edu.sg", "position": "PhD student;Senior Researcher;Researcher;Director;Researcher;Assistant Professor", "bibtex": "@misc{\nwu2024enhanced,\ntitle={Enhanced Gradient Aligned Continual Learning via Pareto Optimization},\nauthor={Yichen Wu and Hong Wang and Long-Kai Huang and Yefeng Zheng and Peilin Zhao and Ying Wei},\nyear={2024},\nurl={https://openreview.net/forum?id=5vcqlmDokC}\n}", "github": "", "project": "", "reviewers": "hYp1;FMNS;UYXS;F5TA", "site": "https://openreview.net/forum?id=5vcqlmDokC", "pdf_size": 766962, "rating": "3;5;5;5", "confidence": "4;5;4;5", "soundness": "1;3;2;3", "contribution": "2;2;2;2", "presentation": "1;3;3;3", "wc_summary": "131;99;48;59", "wc_strengths": "92;24;37;47", "wc_weaknesses": "739;208;129;42", "wc_questions": "11;1;5;229", "wc_review": "973;332;219;377", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.5, 0.8660254037844386 ], "confidence_avg": [ 4.5, 0.5 ], "soundness_avg": [ 2.25, 0.82915619758885 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.5, 0.8660254037844386 ], "wc_summary_avg": [ 84.25, 32.99526481178777 ], 
"wc_strengths_avg": [ 50.0, 25.583197610932064 ], "wc_weaknesses_avg": [ 279.5, 271.71170383330934 ], "wc_questions_avg": [ 61.5, 96.77163840712835 ], "wc_review_avg": [ 475.25, 293.0839256936484 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.5773502691896257, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=2804882248122467226&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 0, "aff_unique_index": "0;1;1;1;1;2", "aff_unique_norm": "City University of Hong Kong;Tencent;Nanyang Technological University", "aff_unique_dep": ";Tencent Holdings Limited;", "aff_unique_url": "https://www.cityu.edu.hk;https://www.tencent.com;https://www.ntu.edu.sg", "aff_unique_abbr": "CityU;Tencent;NTU", "aff_campus_unique_index": "0", "aff_campus_unique": "Hong Kong SAR;", "aff_country_unique_index": "0;0;0;0;0;1", "aff_country_unique": "China;Singapore" }, { "id": "5xKixQzhDE", "title": "Calibrated Dataset Condensation for Faster Hyperparameter Search", "track": "main", "status": "Reject", "tldr": "", "abstract": "Dataset condensation can be used to reduce the computational cost of training multiple models on a large dataset by condensing the training dataset into a small synthetic set. State-of-the-art approaches rely on matching the model gradients between the real and synthetic data. However, there is no theoretical guarantee of the generalizability of the condensed data: data condensation often generalizes poorly across hyperparameters/architectures in practice. This paper considers a different condensation objective specifically geared toward hyperparameter search. We aim to generate a synthetic validation dataset so that the validation-performance rankings of the models, with different hyperparameters, on the condensed and original datasets are comparable. We propose a novel hyperparameter-calibrated dataset condensation (HCDC) algorithm, which obtains the synthetic validation dataset by matching the hyperparameter gradients computed via implicit differentiation and efficient inverse Hessian approximation. 
Experiments demonstrate that the proposed framework effectively maintains the validation-performance rankings of models and speeds up hyperparameter/architecture search for tasks on both images and graphs.", "keywords": "Dataset Condensation;Hyperparameter Optimization", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/a037174fabd3da720c05c302437ab54913168f58.pdf", "author": "Mucong Ding;Yuancheng Xu;Tahseen Rabbani;Xiaoyu Liu;Brian Gravelle;Teresa Ranadive;tai-ching tuan;Furong Huang", "authorids": "~Mucong_Ding1;~Yuancheng_Xu1;~Tahseen_Rabbani1;~Xiaoyu_Liu3;bjgrave@lps.umd.edu;~Teresa_Ranadive1;~tai-ching_tuan1;~Furong_Huang1", "gender": "M;M;M;F;;F;M;F", "homepage": "http://www.cs.umd.edu/~mcding/;https://yuancheng-xu.github.io;https://www.cs.umd.edu/people/trabbani;;;;;https://furong-huang.com", "dblp": "232/1754.html;;280/2362;;;;24/2795;72/8513", "google_scholar": "_bVao2MAAAAJ;OPB0QgwAAAAJ;;;;;;13yyuCcAAAAJ", "orcid": "0000-0002-6173-8055;;;0000-0003-3385-4726;;0000-0001-5418-6259;;", "linkedin": "mucong-ding-489296104;yuancheng-xu/;;;;;;", "or_profile": "~Mucong_Ding1;~Yuancheng_Xu1;~Tahseen_Rabbani1;~Xiaoyu_Liu3;bjgrave@lps.umd.edu;~Teresa_Ranadive1;~tai-ching_tuan1;~Furong_Huang1", "aff": "Department of Computer Science, University of Maryland, College Park;University of Maryland, College Park;University of Maryland, College Park;University of Maryland, College Park;;Laboratory for Physical Sciences;laboratory for Physical Sciences;University of Maryland", "aff_domain": "cs.umd.edu;umd.edu;umd.edu;umd.edu;;lps.umd.edu;lps.umd.edu;cs.umd.edu", "position": "PhD student;PhD student;PhD student;PhD student;;Researcher;Principal Researcher;Assistant Professor", "bibtex": "@misc{\nding2024calibrated,\ntitle={Calibrated Dataset Condensation for Faster Hyperparameter Search},\nauthor={Mucong Ding and Yuancheng Xu and Tahseen Rabbani and Xiaoyu Liu and Brian Gravelle and Teresa Ranadive and tai-ching tuan and Furong Huang},\nyear={2024},\nurl={https://openreview.net/forum?id=5xKixQzhDE}\n}", "github": "", "project": "", "reviewers": "UefQ;4Foe;EsH1;sKjo", "site": "https://openreview.net/forum?id=5xKixQzhDE", "pdf_size": 1016051, "rating": "3;5;6;6", "confidence": "4;4;5;3", "soundness": "2;3;4;3", "contribution": "3;3;4;3", "presentation": "2;3;4;3", "wc_summary": "84;56;103;77", "wc_strengths": "55;54;88;54", "wc_weaknesses": "149;64;259;89", "wc_questions": "5;90;4;5", "wc_review": "293;264;454;225", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "904;862;1107;639", "reply_reviewers": "0;0;0;0", "reply_authors": "2;2;2;1", "rating_avg": [ 5.0, 1.224744871391589 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 3.25, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 80.0, 16.80773631397161 ], "wc_strengths_avg": [ 62.75, 14.58380951603524 ], "wc_weaknesses_avg": [ 140.25, 75.19765621347517 ], "wc_questions_avg": [ 26.0, 36.952672433803755 ], "wc_review_avg": [ 309.0, 87.12347559642005 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 878.0, 166.2031888984083 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.75, 0.4330127018922193 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=9391495782177684095&as_sdt=5,33&sciodt=0,33&hl=en", 
"gs_version_total": 3, "aff_unique_index": "0;1;1;1;2;0;1", "aff_unique_norm": "University of Maryland, College Park;University of Maryland;Laboratory for Physical Sciences", "aff_unique_dep": "Department of Computer Science;;", "aff_unique_url": "https://www/umd.edu;https://www/umd.edu;", "aff_unique_abbr": "UMD;UMD;", "aff_campus_unique_index": "0;0;0;0;0", "aff_campus_unique": "College Park;", "aff_country_unique_index": "0;0;0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "5xV0yTP50n", "title": "Inductive Link Prediction in Knowledge Graphs using Path-based Neural Networks", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Link prediction is a crucial research area in knowledge graphs, with many downstream applications. In many real-world scenarios, inductive link prediction is required, where predictions have to be made among unseen entities. Embedding-based models usually need fine-tuning on new entity embeddings, and hence are difficult to be directly applied to inductive link prediction tasks. Logical rules captured by rule-based models can be directly applied to new entities with the same graph typologies, but the captured rules are discrete and usually lack generosity. Graph neural networks (GNNs) can generalize topological information to new graphs taking advantage of deep neural networks, which however may still need fine-tuning on new entity embeddings. In this paper, we propose SiaILP, a path-based model for inductive link prediction using light-weight siamese neural networks. Our model only depends on relation and path embeddings, which can be generalized to new entities without fine-tuning. Experiments show that our model achieves several new state-of-the-art performances in link prediction tasks using inductive versions of WN18RR, FB15k-237, and Nell995.", "keywords": "Knowledge Graph;Inductive Link Prediction;Siamese Neural Network;Transfer Learning", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "/attachment/3fd339e98cf1614ef5c6c593576a80da58bd3c90.zip", "author": "Canlin Zhang;Qian Liu;Xiuwen Liu", "authorids": "~Canlin_Zhang1;~Qian_Liu10;~Xiuwen_Liu1", "gender": "M;F;M", "homepage": "https://www.linkedin.com/in/canlin-zhang-44a902107/;https://scholar.google.com/citations?user=KEUynwwAAAAJ&hl=en;http://www.cs.fsu.edu/~liux", "dblp": "234/3478;;89/3077", "google_scholar": "jBt4_QYAAAAJ;KEUynwwAAAAJ;2GH5rWkAAAAJ", "orcid": "0000-0001-7747-2848;;0000-0002-9320-3872", "linkedin": "canlin-zhang-44a902107/;;", "or_profile": "~Canlin_Zhang1;~Qian_Liu10;~Xiuwen_Liu1", "aff": "Sorenson Communications;;Florida State University", "aff_domain": "sorenson.com;;fsu.edu", "position": "Researcher;;full Professor", "bibtex": "@misc{\nzhang2024inductive,\ntitle={Inductive Link Prediction in Knowledge Graphs using Path-based Neural Networks},\nauthor={Canlin Zhang and Qian Liu and Xiuwen Liu},\nyear={2024},\nurl={https://openreview.net/forum?id=5xV0yTP50n}\n}", "github": "", "project": "", "reviewers": "yt8Z;cRRq;QF3p;GEeR", "site": "https://openreview.net/forum?id=5xV0yTP50n", "pdf_size": 415903, "rating": "3;3;3;3", "confidence": "5;4;5;3", "soundness": "2;2;2;2", "contribution": "2;2;1;1", "presentation": "2;1;3;1", "wc_summary": "71;47;125;57", "wc_strengths": "25;23;14;40", "wc_weaknesses": "206;100;447;243", "wc_questions": "57;3;1;39", "wc_review": "359;173;587;379", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": 
[ 3.0, 0.0 ], "confidence_avg": [ 4.25, 0.82915619758885 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 1.5, 0.5 ], "presentation_avg": [ 1.75, 0.82915619758885 ], "wc_summary_avg": [ 75.0, 30.099833886584822 ], "wc_strengths_avg": [ 25.5, 9.340770846134703 ], "wc_weaknesses_avg": [ 249.0, 125.78751925370021 ], "wc_questions_avg": [ 25.0, 23.874672772626646 ], "wc_review_avg": [ 374.5, 146.6449794571911 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=15702917113674669699&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 6, "aff_unique_index": "0;1", "aff_unique_norm": "Sorenson Communications;Florida State University", "aff_unique_dep": ";", "aff_unique_url": "https://www.sorenson.com;https://www.fsu.edu", "aff_unique_abbr": ";FSU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "title": "Scale-Adaptive Diffusion Model for Complex Sketch Synthesis", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19407", "id": "5xadJmgwix", "author_site": "Jijin Hu, Ke Li, Yonggang Qi, Yi-Zhe Song", "tldr": "", "abstract": "While diffusion models have revolutionized generative AI, their application to human sketch generation, especially in the creation of complex yet concise and recognizable sketches, remains largely unexplored. Existing efforts have primarily focused on vector-based sketches, limiting their ability to handle intricate sketch data. This paper introduces an innovative extension of diffusion models to pixellevel sketch generation, addressing the challenge of dynamically optimizing the guidance scale for classifier-guided diffusion. Our approach achieves a delicate balance between recognizability and complexity in generated sketches through scale-adaptive classifier-guided diffusion models, a scaling indicator, and the concept of a residual sketch. We also propose a three-phase sampling strategy to enhance sketch diversity and quality. 
Experiments on the QuickDraw dataset showcase the potential of diffusion models to push the boundaries of sketch generation, particularly in complex scenarios unattainable by vector-based methods.", "keywords": "Generative model;Classifier-based Diffusion Model;Sketch", "primary_area": "generative models", "supplementary_material": "", "author": "Jijin Hu;Ke Li;Yonggang Qi;Yi-Zhe Song", "authorids": "~Jijin_Hu1;~Ke_Li2;~Yonggang_Qi2;~Yi-Zhe_Song2", "gender": "F;M;M;M", "homepage": "https://github.com/HuJijin;https://keli-sketchx.github.io/;https://qugank.github.io/;http://personal.ee.surrey.ac.uk/Personal/Y.Song/", "dblp": "382/4015;75/6627-4;139/7002;98/1684", "google_scholar": ";KZOFaz4AAAAJ;https://scholar.google.com.hk/citations?user=pQNpf7cAAAAJ;https://scholar.google.co.uk/citations?user=irZFP_AAAAAJ", "orcid": ";0000-0002-9739-7969;;", "linkedin": ";;;", "or_profile": "~Jijin_Hu1;~Ke_Li2;~Yonggang_Qi2;~Yi-Zhe_Song2", "aff": "Beijing University of Posts and Telecommunications;Beijing University of Posts and Telecommunications;Beijing University of Posts and Telecommunications;University of Surrey", "aff_domain": "bupt.edu.cn;bupt.edu.cn;bupt.edu.cn;surrey.ac.uk", "position": "MS student;Associate Professor;Associate Professor;Professor", "bibtex": "@inproceedings{\nhu2024scaleadaptive,\ntitle={Scale-Adaptive Diffusion Model for Complex Sketch Synthesis},\nauthor={Jijin Hu and Ke Li and Yonggang Qi and Yi-Zhe Song},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=5xadJmgwix}\n}", "github": "", "project": "", "reviewers": "st3k;SPRZ;t4As;bpbS", "pdf_size": 7113197, "rating": "5;6;6;6", "confidence": "4;3;4;4", "soundness": "2;3;3;3", "contribution": "2;2;3;2", "presentation": "3;3;3;3", "wc_summary": "96;129;50;86", "wc_strengths": "25;56;75;39", "wc_weaknesses": "82;166;118;119", "wc_questions": "7;115;21;113", "wc_review": "210;466;264;357", "wc_reply_reviewers": "0;0;21;67", "wc_reply_authors": "415;733;394;949", "reply_reviewers": "0;0;1;1", "reply_authors": "1;1;2;2", "rating_avg": [ 5.75, 0.4330127018922193 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 90.25, 28.16358464400439 ], "wc_strengths_avg": [ 48.75, 18.713297411199342 ], "wc_weaknesses_avg": [ 121.25, 29.82762980861872 ], "wc_questions_avg": [ 64.0, 50.24937810560445 ], "wc_review_avg": [ 324.25, 97.27377601388773 ], "wc_reply_reviewers_avg": [ 22.0, 27.358728040608906 ], "wc_reply_authors_avg": [ 622.75, 231.3443050952411 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.3333333333333333, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12043012526220433934&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 2, "openreview": "https://openreview.net/forum?id=5xadJmgwix", "pdf": "https://openreview.net/pdf?id=5xadJmgwix", "email": "bupt.edu.cn;bupt.edu.cn;bupt.edu.cn;surrey.ac.uk", "author_num": 4, "aff_unique_index": "0;0;0;1", "aff_unique_norm": "Beijing University of Posts and Telecommunications;University of Surrey", "aff_unique_dep": ";", "aff_unique_url": "http://www.bupt.edu.cn/;https://www.surrey.ac.uk", "aff_unique_abbr": "BUPT;Surrey", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Beijing;", "aff_country_unique_index": "0;0;0;1", 
"aff_country_unique": "China;United Kingdom" }, { "id": "5zNJQV60Wm", "title": "Natural Language Embedded Programs for Hybrid Language Symbolic Reasoning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "How can we perform computations over natural language representations to solve tasks that require symbolic and numeric reasoning? We propose natural language embedded programs (NLEP) as a unifying framework for addressing math/symbolic reasoning, natural language understanding, and instruction following tasks. Our approach prompts a language model to generate full Python programs that define functions over data structures which contain natural language representations of structured knowledge. A Python interpreter then executes the generated code and prints the output. Despite using a task-general prompt, we find that this approach can improve upon strong baselines across a range of different tasks including math and symbolic reasoning, text classification, question answering, and instruction following. We further find the generated programs are often interpretable and enable post-hoc verification of the intermediate reasoning steps.", "keywords": "natural language embedded program (NLEP);large language model", "primary_area": "neurosymbolic & hybrid AI systems (physics-informed, logic & formal reasoning, etc.)", "supplementary_material": "", "author": "Tianhua Zhang;Jiaxin Ge;Hongyin Luo;Yung-Sung Chuang;Mingye Gao;Yuan Gong;Xixin Wu;Yoon Kim;Helen M. Meng;James R. Glass", "authorids": "~Tianhua_Zhang2;~Jiaxin_Ge1;~Hongyin_Luo1;~Yung-Sung_Chuang1;~Mingye_Gao1;~Yuan_Gong3;~Xixin_Wu1;~Yoon_Kim1;~Helen_M._Meng1;~James_R._Glass1", "gender": "F;F;M;M;F;M;;;F;", "homepage": ";https://jiaxin.ge/;;https://people.csail.mit.edu/yungsung/;https://onelab.mit.edu/people;;https://www1.se.cuhk.edu.hk/~wuxx/;https://people.csail.mit.edu/yoonkim/;http://www.se.cuhk.edu.hk/people/academic-staff/prof-meng-mei-ling-helen/;", "dblp": "01/8403;;147/4317;64/3095;;;125/2836;;92/3270;", "google_scholar": "https://scholar.google.com.hk/citations?user=dEfp5vQAAAAJ;I6P0SwgAAAAJ;;3ar1DOwAAAAJ;;MuhvvOkAAAAJ;;n_ts4eYAAAAJ;;", "orcid": ";;;0000-0002-1723-5063;;;;;;", "linkedin": ";;;yschuang;;;;;;", "or_profile": "~Tianhua_Zhang2;~Jiaxin_Ge1;~Hongyin_Luo1;~Yung-Sung_Chuang1;~Mingye_Gao1;~Yuan_Gong3;~Xixin_Wu1;~Yoon_Kim1;~Helen_M._Meng1;~James_R._Glass1", "aff": "Chinese University of Hong Kong, The Chinese University of Hong Kong;Peking University;Massachusetts Institute of Technology;Massachusetts Institute of Technology;Massachusetts Institute of Technology;Massachusetts Institute of Technology;The Chinese University of Hong Kong;Massachusetts Institute of Technology;The Chinese University of Hong Kong;", "aff_domain": "se.cuhk.edu.hk;pku.edu.cn;mit.edu;mit.edu;mit.edu;mit.edu;cuhk.edu.hk;mit.edu;cuhk.edu.hk;", "position": "PhD student;Undergrad student;Postdoc;PhD student;PhD student;Researcher;Assistant Professor;Assistant Professor;Full Professor;", "bibtex": "@misc{\nzhang2024natural,\ntitle={Natural Language Embedded Programs for Hybrid Language Symbolic Reasoning},\nauthor={Tianhua Zhang and Jiaxin Ge and Hongyin Luo and Yung-Sung Chuang and Mingye Gao and Yuan Gong and Xixin Wu and Yoon Kim and Helen M. Meng and James R. 
Glass},\nyear={2024},\nurl={https://openreview.net/forum?id=5zNJQV60Wm}\n}", "github": "", "project": "", "reviewers": "ZKfU;pxPW;2MWH;T68U", "site": "https://openreview.net/forum?id=5zNJQV60Wm", "pdf_size": 724845, "rating": "3;3;5;8", "confidence": "3;3;3;4", "soundness": "3;2;2;3", "contribution": "2;2;1;3", "presentation": "2;3;3;3", "wc_summary": "16;52;79;92", "wc_strengths": "19;109;245;98", "wc_weaknesses": "143;82;117;91", "wc_questions": "141;14;1;84", "wc_review": "319;257;442;365", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.75, 2.0463381929681126 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 59.75, 29.089302157322372 ], "wc_strengths_avg": [ 117.75, 81.25692278200054 ], "wc_weaknesses_avg": [ 108.25, 23.826193569263218 ], "wc_questions_avg": [ 60.0, 56.422513237182194 ], "wc_review_avg": [ 345.75, 67.50324066294891 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 10, 0 ], "corr_rating_confidence": 0.9169493006161777, "gs_citation": 13, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=13668199448688252438&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 5, "aff_unique_index": "0;1;2;2;2;2;0;2;0", "aff_unique_norm": "Chinese University of Hong Kong;Peking University;Massachusetts Institute of Technology", "aff_unique_dep": ";;", "aff_unique_url": "https://www.cuhk.edu.hk;http://www.pku.edu.cn;https://web.mit.edu", "aff_unique_abbr": "CUHK;Peking U;MIT", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Hong Kong SAR;", "aff_country_unique_index": "0;0;1;1;1;1;0;1;0", "aff_country_unique": "China;United States" }, { "id": "5zwrpqYIK5", "title": "Outlier-Robust Orthogonal Regression on Manifolds", "track": "main", "status": "Reject", "tldr": "", "abstract": "Motivated by machine learning and computer vision applications, we formulate the problem of Outlier-Robust Orthogonal Regression to find a point in a manifold that satisfies as many linear equations as possible. Existing approaches addressing special cases of our formulation either lack theoretical support, are computationally costly, or somewhat ignore the manifold constraint; the latter two limit them from many applications. In this paper, we propose a unified approach based on solving a non-convex and non-smooth $\\ell^1$ optimization problem over the manifold. We give conditions on the geometry of the input data, the manifold, and their interplay, under which the minimizers recover the ground truth; notably the conditions can hold even when the inliers are skewed within the true hyperplane. We provide a Riemannian subgradient method and an iteratively reweighted least squares method, suiting different computational oracles, and prove their linear/sub-linear convergence to minimizers/critical points. 
Experiments demonstrate that respecting the manifold constraints increases robustness against outliers in robust essential matrix estimation and robust rotation search.", "keywords": "Optimization over manifolds;orthogonal regression;subspace learning", "primary_area": "optimization", "supplementary_material": "/attachment/ca6e39aeb74ddee277a38a1368ef376029c3c5b1.pdf", "author": "Tianjiao Ding;Liangzu Peng;Rene Vidal", "authorids": "~Tianjiao_Ding1;~Liangzu_Peng2;~Rene_Vidal1", "gender": "M;M;", "homepage": "https://tianjiaoding.com/;https://liangzu.github.io/;http://www.vision.jhu.edu", "dblp": "230/1227;228/7974;v/ReneVidal", "google_scholar": "L3wy9QMAAAAJ;A39MlcYAAAAJ;https://scholar.google.com/citations?hl=en", "orcid": ";0000-0003-0708-7543;", "linkedin": ";;rene-vidal-74844928/", "or_profile": "~Tianjiao_Ding1;~Liangzu_Peng2;~Rene_Vidal1", "aff": "University of Pennsylvania;University of Pennsylvania;Amazon", "aff_domain": "seas.upenn.edu;upenn.edu;amazon.com", "position": "PhD student;PhD student;Principal Researcher", "bibtex": "@misc{\nding2024outlierrobust,\ntitle={Outlier-Robust Orthogonal Regression on Manifolds},\nauthor={Tianjiao Ding and Liangzu Peng and Rene Vidal},\nyear={2024},\nurl={https://openreview.net/forum?id=5zwrpqYIK5}\n}", "github": "", "project": "", "reviewers": "CDEb;ovBv;BNmQ;6ASC", "site": "https://openreview.net/forum?id=5zwrpqYIK5", "pdf_size": 1817912, "rating": "3;3;3;5", "confidence": "4;4;3;3", "soundness": "2;2;3;3", "contribution": "2;2;3;2", "presentation": "2;3;3;2", "wc_summary": "29;118;666;79", "wc_strengths": "22;56;10;226", "wc_weaknesses": "219;228;41;143", "wc_questions": "10;166;7;90", "wc_review": "280;568;724;538", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 3.5, 0.8660254037844386 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 223.0, 257.70428789603017 ], "wc_strengths_avg": [ 78.5, 86.81445732134712 ], "wc_weaknesses_avg": [ 157.75, 75.05789432165014 ], "wc_questions_avg": [ 68.25, 65.52241982710956 ], "wc_review_avg": [ 527.5, 159.38867588382809 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 6, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:HTxhkrJJgzkJ:scholar.google.com/&scioq=Outlier-Robust+Orthogonal+Regression+on+Manifolds&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;0;1", "aff_unique_norm": "University of Pennsylvania;Amazon", "aff_unique_dep": ";Amazon.com, Inc.", "aff_unique_url": "https://www.upenn.edu;https://www.amazon.com", "aff_unique_abbr": "UPenn;Amazon", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "60e1hl06Ec", "title": "Mitigating Simplicity Bias in Deep Learning for Improved OOD Generalization and Robustness", "track": "main", "status": "Reject", "tldr": "", "abstract": "Neural networks (NNs) are known to exhibit simplicity bias where they tend to prefer learning 'simple' features over more 'complex' ones, even when the latter may be more informative. 
Simplicity bias can lead to the model making biased predictions which have poor out-of-distribution (OOD) generalization. To address this, we propose a framework that encourages the model to use a more diverse set of features to make predictions. We first train a simple model, and then regularize the conditional mutual information with respect to it to obtain the final model. We demonstrate the effectiveness of this framework in various problem settings and real-world applications, showing that it effectively addresses simplicity bias and leads to more features being used, enhances OOD generalization, and improves subgroup robustness and fairness. We complement these results with theoretical analyses of the effect of the regularization and its OOD generalization properties.", "keywords": "Simplicity Bias;Spurious Features;OOD Generalization;Subgroup Robustness", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/c1b7359eecd0506e40bcc843665a244e810c081e.zip", "author": "Bhavya Vasudeva;Kameron Shahabi;Vatsal Sharan", "authorids": "~Bhavya_Vasudeva1;~Kameron_Shahabi1;~Vatsal_Sharan1", "gender": ";M;M", "homepage": "https://estija.github.io;https://kyshahab.github.io/;https://vatsalsharan.github.io/", "dblp": "250/9545;281/6744;126/2543", "google_scholar": "https://scholar.google.co.in/citations?user=ZCSsIokAAAAJ;;Ize17HEAAAAJ", "orcid": ";;", "linkedin": ";kameron-shahabi-76784218b/;", "or_profile": "~Bhavya_Vasudeva1;~Kameron_Shahabi1;~Vatsal_Sharan1", "aff": "University of Southern California;University of Southern California;University of Southern California", "aff_domain": "usc.edu;usc.edu;usc.edu", "position": "PhD student;MS student;Assistant Professor", "bibtex": "@misc{\nvasudeva2024mitigating,\ntitle={Mitigating Simplicity Bias in Deep Learning for Improved {OOD} Generalization and Robustness},\nauthor={Bhavya Vasudeva and Kameron Shahabi and Vatsal Sharan},\nyear={2024},\nurl={https://openreview.net/forum?id=60e1hl06Ec}\n}", "github": "", "project": "", "reviewers": "Q6kW;pjci;h3b4;5jvr", "site": "https://openreview.net/forum?id=60e1hl06Ec", "pdf_size": 1593024, "rating": "5;6;6;6", "confidence": "4;4;4;4", "soundness": "3;3;3;2", "contribution": "1;2;2;3", "presentation": "3;3;3;3", "wc_summary": "51;27;36;102", "wc_strengths": "31;61;30;62", "wc_weaknesses": "456;764;347;263", "wc_questions": "85;45;45;3", "wc_review": "623;897;458;430", "wc_reply_reviewers": "207;0;68;0", "wc_reply_authors": "909;518;180;278", "reply_reviewers": "1;0;1;0", "reply_authors": "3;2;2;2", "rating_avg": [ 5.75, 0.4330127018922193 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 54.0, 29.008619408720573 ], "wc_strengths_avg": [ 46.0, 15.508062419270823 ], "wc_weaknesses_avg": [ 457.5, 189.72677723505453 ], "wc_questions_avg": [ 44.5, 28.99568933479596 ], "wc_review_avg": [ 602.0, 185.59768317519485 ], "wc_reply_reviewers_avg": [ 68.75, 84.50850548909264 ], "wc_reply_authors_avg": [ 471.25, 281.0617147531837 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 2.25, 0.4330127018922193 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 5, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=4331722416726197918&as_sdt=80000005&sciodt=0,23&hl=en", "gs_version_total": 5, "aff_unique_index": "0;0;0", "aff_unique_norm": "University of 
Southern California", "aff_unique_dep": "", "aff_unique_url": "https://www.usc.edu", "aff_unique_abbr": "USC", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Los Angeles", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "title": "NeurRev: Train Better Sparse Neural Network Practically via Neuron Revitalization", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19406", "id": "60lNoatp7u", "author_site": "Gen Li, Lu Yin, Jie Ji, Wei Niu, Minghai Qin, Bin Ren, Linke Guo, Shiwei Liu, Xiaolong Ma", "tldr": "", "abstract": "Dynamic Sparse Training (DST) employs a greedy search mechanism to identify an optimal sparse subnetwork by periodically pruning and growing network connections during training. To guarantee effectiveness, DST algorithms rely on high search frequency, which consequently, requires large learning rate and batch size to enforce stable neuron learning. Such settings demand extreme memory consumption, as well as generating significant system overheads that limit the wide deployment of deep learning-based applications on resource-constraint platforms. To reconcile such, we propose $\\underline{Neur}$on $\\underline{Rev}$italization framework for DST (NeurRev), based on an innovative finding that dormant neurons exist with the presence of weight sparsity, and cannot be revitalized (i.e., activated for learning) even with high sparse mask search frequency. These dormant neurons produce a large quantity of zeros during training, which contribute relatively little to the outputs of succeeding layers or to the final results. Different from most existing DST algorithms that spare no effort designing weight growing criteria, NeurRev focuses on optimizing the long-neglected pruning part, which awakes dormant neurons by pruning and incurs no additional computation costs. As such, NeurRev advances more effective neuron learning, which not only achieves outperforming accuracy in a variety of networks and datasets, but also promoting a low-cost dynamism at system-level. Systematical evaluations on training speed and system overhead are conducted on the mobile devices, where the proposed NeurRev framework consistently outperforms representative state-of-the-arts. 
Code will be released.", "keywords": "Dynamic Sparse Training; Neuron Revitalization", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Gen Li;Lu Yin;Jie Ji;Wei Niu;Minghai Qin;Bin Ren;Linke Guo;Shiwei Liu;Xiaolong Ma", "authorids": "~Gen_Li4;~Lu_Yin1;~Jie_Ji1;~Wei_Niu3;~Minghai_Qin1;~Bin_Ren1;~Linke_Guo2;~Shiwei_Liu2;~Xiaolong_Ma2", "gender": "M;;;M;M;M;M;M;M", "homepage": "https://coulsonlee.github.io;https://luuyin.com/;;https://www.niuwei.info;https://sites.google.com/site/minghaiqin/home;http://www.cs.wm.edu/~bren/;http://cecas.clemson.edu/~linkeg/index.html;https://shiweiliuiiiiiii.github.io/;https://xiaolongma2016.com", "dblp": "28/538-12;87/2528-6;;68/828-2.html;;;;234/8697-3.html;", "google_scholar": ";G4Xe1NkAAAAJ;;w1RoaOMAAAAJ;MSgWKbYAAAAJ;9Uqwy4UAAAAJ;https://scholar.google.com/citations?hl=en;73IbXtsAAAAJ;https://scholar.google.com/citations?hl=en", "orcid": ";;;;;;;;0000-0003-3753-7648", "linkedin": ";;;;;;;;xiaolong-ma-66b98910b/", "or_profile": "~Gen_Li4;~Lu_Yin1;~Jie_Ji1;~Wei_Niu3;~Minghai_Qin1;~Bin_Ren1;~Linke_Guo2;~Shiwei_Liu2;~Xiaolong_Ma2", "aff": "Clemson University;University of Aberdeen;;University of Georgia;Western Digital Corporation;William & Mary;Clemson University;University of Oxford;Clemson University", "aff_domain": "clemson.edu;abdn.ac.uk;;uga.edu;wdc.com;cs.wm.edu;clemson.edu;ox.ac.uk;clemson.edu", "position": "PhD student;Assistant Professor;;Assistant Professor;senior technologist;Associate Professor;Associate Professor;Postdoc;Assistant Professor", "bibtex": "@inproceedings{\nli2024neurrev,\ntitle={NeurRev: Train Better Sparse Neural Network Practically via Neuron Revitalization},\nauthor={Gen Li and Lu Yin and Jie Ji and Wei Niu and Minghai Qin and Bin Ren and Linke Guo and Shiwei Liu and Xiaolong Ma},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=60lNoatp7u}\n}", "github": "", "project": "", "reviewers": "AQcf;5GHY;Fgjo", "pdf_size": 3353694, "rating": "6;6;8", "confidence": "3;4;4", "soundness": "2;3;4", "contribution": "2;3;3", "presentation": "3;3;4", "wc_summary": "46;95;71", "wc_strengths": "42;40;80", "wc_weaknesses": "93;87;78", "wc_questions": "42;176;2", "wc_review": "223;398;231", "wc_reply_reviewers": "23;230;0", "wc_reply_authors": "759;1277;416", "reply_reviewers": "1;2;0", "reply_authors": "2;3;1", "rating_avg": [ 6.666666666666667, 0.9428090415820634 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 3.0, 0.816496580927726 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 3.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 70.66666666666667, 20.00555478416488 ], "wc_strengths_avg": [ 54.0, 18.40289832245635 ], "wc_weaknesses_avg": [ 86.0, 6.164414002968976 ], "wc_questions_avg": [ 73.33333333333333, 74.41027408153317 ], "wc_review_avg": [ 284.0, 80.67630796377996 ], "wc_reply_reviewers_avg": [ 84.33333333333333, 103.42898798477898 ], "wc_reply_authors_avg": [ 817.3333333333334, 353.9136743457207 ], "reply_reviewers_avg": [ 1.0, 0.816496580927726 ], "reply_authors_avg": [ 2.0, 0.816496580927726 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 9, 0 ], "corr_rating_confidence": 0.49999999999999983, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6553735554510376726&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 6, "openreview": 
"https://openreview.net/forum?id=60lNoatp7u", "pdf": "https://openreview.net/pdf?id=60lNoatp7u", "email": "clemson.edu;abdn.ac.uk;;uga.edu;wdc.com;cs.wm.edu;clemson.edu;ox.ac.uk;clemson.edu", "author_num": 9, "aff_unique_index": "0;1;2;3;4;0;5;0", "aff_unique_norm": "Clemson University;University of Aberdeen;University of Georgia;Western Digital Corporation;College of William & Mary;University of Oxford", "aff_unique_dep": ";;;;;", "aff_unique_url": "https://www.clemson.edu;https://www.abdn.ac.uk;https://www.uga.edu;https://www.westerndigital.com;https://www.wm.edu;https://www.ox.ac.uk", "aff_unique_abbr": "Clemson;Aberdeen;UGA;WDC;WM;Oxford", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;0;0;0;0;1;0", "aff_country_unique": "United States;United Kingdom" }, { "id": "61DYdiyQqk", "title": "Two Heads Are Better Than One: Exploiting Both Sequence and Graph Models in AMR-To-Text Generation", "track": "main", "status": "Reject", "tldr": "", "abstract": "Abstract meaning representation (AMR) is a special semantic representation language, which can capture the core meaning of a sentence with a syntax-irrelevant graph.\nAMR-to-text generation, which aims to generate a sentence according to a given AMR graph, is a well-studied task and has shown its helpfulness in various other NLP tasks.\nExisting AMR-to-text generation methods can be roughly divided into two categories, while either has its own advantages and disadvantages.\nThe first one adopts a sequence-to-sequence model, especially a pretrained language model (PLM). \nIt has good text generation ability but cannot cope with the structural information of AMR graphs well.\nThe second category of method is based on graph neural networks (GNNs), whose advantages and disadvantages are exactly the opposite. \nTo combine the strengths of the two kinds of models, in this paper, we propose a dual encoder-decoder model named \\modelName, which integrates a specially designed GNN into a pre-trained sequence-to-sequence model.\nWe conduct extensive experiments as well as human evaluation and a case study, finding that it achieves the desired effect and yields state-of-the-art performance in the AMR-to-text generation task. 
\nWe also demonstrate that it outperforms the most powerful general-purpose PLM GPT-4.", "keywords": "graph-to-text generation;abstract mearning representation;dual-encoder", "primary_area": "generative models", "supplementary_material": "/attachment/fb5440a758542d3938393eefc08f2902dfa32201.zip", "author": "Yining Hong;Fanchao Qi;Maosong Sun", "authorids": "~Yining_Hong3;~Fanchao_Qi1;~Maosong_Sun1", "gender": "F;M;M", "homepage": "https://hyn0027.github.io/;;https://www.cs.tsinghua.edu.cn/csen/info/1312/4394.htm", "dblp": ";228/5500;95/3291-1", "google_scholar": ";https://scholar.google.com/citations?hl=zh-CN;https://scholar.google.com.tw/citations?user=zIgT0HMAAAAJ", "orcid": ";0000-0002-4400-4033;", "linkedin": ";%E5%87%A1%E8%B6%85-%E5%B2%82-885770a4/;", "or_profile": "~Yining_Hong3;~Fanchao_Qi1;~Maosong_Sun1", "aff": "Tsinghua University;Tsinghua University;Tsinghua University", "aff_domain": "tsinghua.edu.cn;tsinghua.edu.cn;tsinghua.edu.cn", "position": "Undergrad student;Postdoc;Full Professor", "bibtex": "@misc{\nhong2024two,\ntitle={Two Heads Are Better Than One: Exploiting Both Sequence and Graph Models in {AMR}-To-Text Generation},\nauthor={Yining Hong and Fanchao Qi and Maosong Sun},\nyear={2024},\nurl={https://openreview.net/forum?id=61DYdiyQqk}\n}", "github": "", "project": "", "reviewers": "Koxu;FACa;PF3i", "site": "https://openreview.net/forum?id=61DYdiyQqk", "pdf_size": 2743551, "rating": "5;5;6", "confidence": "2;5;4", "soundness": "3;3;3", "contribution": "2;2;2", "presentation": "2;3;3", "wc_summary": "74;64;109", "wc_strengths": "58;50;113", "wc_weaknesses": "248;106;219", "wc_questions": "73;1;49", "wc_review": "453;221;490", "wc_reply_reviewers": "0;0;53", "wc_reply_authors": "556;500;1571", "reply_reviewers": "0;0;2", "reply_authors": "1;1;4", "rating_avg": [ 5.333333333333333, 0.4714045207910317 ], "confidence_avg": [ 3.6666666666666665, 1.247219128924647 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 82.33333333333333, 19.293061504650375 ], "wc_strengths_avg": [ 73.66666666666667, 28.003967972810962 ], "wc_weaknesses_avg": [ 191.0, 61.25901294231459 ], "wc_questions_avg": [ 41.0, 29.93325909419153 ], "wc_review_avg": [ 388.0, 119.04900951568924 ], "wc_reply_reviewers_avg": [ 17.666666666666668, 24.984439601924677 ], "wc_reply_authors_avg": [ 875.6666666666666, 492.2061447085854 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.9428090415820634 ], "reply_authors_avg": [ 2.0, 1.4142135623730951 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.1889822365046136, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:GLWuaFHGhu4J:scholar.google.com/&scioq=Two+Heads+Are+Better+Than+One:+Exploiting+Both+Sequence+and+Graph+Models+in+AMR-To-Text+Generation&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;0", "aff_unique_norm": "Tsinghua University", "aff_unique_dep": "", "aff_unique_url": "https://www.tsinghua.edu.cn", "aff_unique_abbr": "THU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "China" }, { "id": "61TRLIS5A0", "title": "Enhancing Medical Image Generation with Anatomical Precision: A Multi-Headed VAE-Based Diffusion Model", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Score-based image generation models, also known as diffusion models, can generate highly realistic and diverse natural images. 
However, a common challenge emerges when applying diffusion models to medical image generation and segmentation. While these models excel at producing realistic local textures, they struggle to accurately capture global anatomical priors, such as organ shape and location. Furthermore, the model lacks the capability for controlled recalibration to transform an anatomically unrealistic image into a realistic one. Here we present a new diffusion model where the generated images exhibit both realistic style and anatomically accurate position. Specifically, this is done by guiding the reverse diffusion process with our specially designed multi-headed VAE, which produces the image's disentangled style and position embeddings. We use the position embedding to define a grid deformation function that deforms a simple position prior to a predicted segmentation mask. Then, we apply the same grid deformation on the style embedding for image generation. This alleviates the style embedding from the burden of learning position features, thereby promoting disentangling. Our proposed approach showcases promising performance in controlled image generation across a range of medical image tasks, such as skin lesions and fetal head. Furthermore, our model delivers state-of-the-art segmentation performance.", "keywords": "medical image processing;image segmentation;variational auto-encoder;diffusion modelling;controlled image generation", "primary_area": "generative models", "supplementary_material": "", "author": "Hongfei Yang;YoungSeok Jeon;Mengling Feng", "authorids": "~Hongfei_Yang2;~YoungSeok_Jeon1;~Mengling_Feng1", "gender": "M;M;M", "homepage": ";https://www.mornin-feng.com/;https://www.mornin-feng.com", "dblp": ";;31/7025", "google_scholar": ";ppl10bsAAAAJ;F2ET1WsAAAAJ", "orcid": "0000-0002-8150-9364;;0000-0002-5338-6248", "linkedin": ";;mengling-mornin-feng-9400811a/", "or_profile": "~Hongfei_Yang2;~YoungSeok_Jeon1;~Mengling_Feng1", "aff": "National University of Singapore;National University of Singapore;National University of Singapore", "aff_domain": "nus.edu;nus.edu;nus.edu.sg", "position": "Postdoc;Postdoc;Assistant Professor", "bibtex": "@misc{\nyang2024enhancing,\ntitle={Enhancing Medical Image Generation with Anatomical Precision: A Multi-Headed {VAE}-Based Diffusion Model},\nauthor={Hongfei Yang and YoungSeok Jeon and Mengling Feng},\nyear={2024},\nurl={https://openreview.net/forum?id=61TRLIS5A0}\n}", "github": "", "project": "", "reviewers": "PEau;nez1;etX6", "site": "https://openreview.net/forum?id=61TRLIS5A0", "pdf_size": 12491106, "rating": "3;5;5", "confidence": "4;4;5", "soundness": "2;3;2", "contribution": "2;2;2", "presentation": "2;4;2", "wc_summary": "30;108;92", "wc_strengths": "34;71;95", "wc_weaknesses": "216;243;42", "wc_questions": "59;140;49", "wc_review": "339;562;278", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 4.333333333333333, 0.9428090415820634 ], "confidence_avg": [ 4.333333333333333, 0.4714045207910317 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.6666666666666665, 0.9428090415820634 ], "wc_summary_avg": [ 76.66666666666667, 33.6386021641143 ], "wc_strengths_avg": [ 66.66666666666667, 25.090945688745084 ], "wc_weaknesses_avg": [ 167.0, 89.07300376657341 ], "wc_questions_avg": [ 82.66666666666667, 40.74582459862878 ], "wc_review_avg": [ 393.0, 122.06828689986055 ], "wc_reply_reviewers_avg": [ 0, 0 ], 
"wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 3, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.4999999999999999, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:-JTrD89olNcJ:scholar.google.com/&scioq=Enhancing+Medical+Image+Generation+with+Anatomical+Precision:+A+Multi-Headed+VAE-Based+Diffusion+Model&hl=en&as_sdt=0,14", "gs_version_total": 0, "aff_unique_index": "0;0;0", "aff_unique_norm": "National University of Singapore", "aff_unique_dep": "", "aff_unique_url": "https://www.nus.edu.sg", "aff_unique_abbr": "NUS", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "Singapore" }, { "id": "61hDIuox86", "title": "Latent Lie Group Representations", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Symmetry detection tasks rely on identifying transformations of data points that keep some task-related quality, such as classification label, identical. These symmetries are useful during model selection for neural networks, as even a conceptually simple symmetry (e.g., translation invariance) can lead to superior performance-efficiency tradeoffs (e.g., CNNs). Leveraging neural networks to learn these transformations can lead to approaches that yield representations of the transformations in latent space, rather than just the data itself.\nIn this work, we propose a latent variable framework for learning one-parameter subgroups of Lie group symmetries from observations, improving the accuracy of the learned transformation with respect to the one in pixel-space, even including situations in which this might not even be desirable.", "keywords": "deep learning;symmetry;lie groups", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Alex Gabel;Rick Quax;Efstratios Gavves", "authorids": "~Alex_Gabel1;r.quax@uva.nl;~Efstratios_Gavves1", "gender": "M;;M", "homepage": "https://www.uva.nl/en/profile/g/a/a.gabel/a.gabel.html;;https://www.egavves.com", "dblp": ";;03/8693", "google_scholar": "u8IK1h0AAAAJ;;https://scholar.google.nl/citations?user=QqfCvsgAAAAJ", "orcid": "0009-0008-0964-8918;;", "linkedin": "https://nl.linkedin.com/in/alex-gabel;;", "or_profile": "~Alex_Gabel1;r.quax@uva.nl;~Efstratios_Gavves1", "aff": "University of Amsterdam;;University of Amsterdam", "aff_domain": "uva.nl;;uva.nl", "position": "PhD student;;Associate Professor", "bibtex": "@misc{\ngabel2024latent,\ntitle={Latent Lie Group Representations},\nauthor={Alex Gabel and Rick Quax and Efstratios Gavves},\nyear={2024},\nurl={https://openreview.net/forum?id=61hDIuox86}\n}", "github": "", "project": "", "reviewers": "bdCU;8A7f;FZBr", "site": "https://openreview.net/forum?id=61hDIuox86", "pdf_size": 590200, "rating": "1;5;5", "confidence": "3;4;3", "soundness": "2;4;3", "contribution": "2;3;3", "presentation": "1;3;3", "wc_summary": "74;74;56", "wc_strengths": "37;79;10", "wc_weaknesses": "299;210;48", "wc_questions": "2;127;24", "wc_review": "412;490;138", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 3.6666666666666665, 1.8856180831641267 ], "confidence_avg": [ 3.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 3.0, 0.816496580927726 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.3333333333333335, 
0.9428090415820634 ], "wc_summary_avg": [ 68.0, 8.48528137423857 ], "wc_strengths_avg": [ 42.0, 28.39013913315678 ], "wc_weaknesses_avg": [ 185.66666666666666, 103.90487102259559 ], "wc_questions_avg": [ 51.0, 54.48547206977899 ], "wc_review_avg": [ 346.6666666666667, 150.94664252274342 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 3, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.4999999999999999, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:mFJZKUPoIaYJ:scholar.google.com/&scioq=Latent+Lie+Group+Representations&hl=en&as_sdt=0,10", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "University of Amsterdam", "aff_unique_dep": "", "aff_unique_url": "https://www.uva.nl", "aff_unique_abbr": "UvA", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "Netherlands" }, { "id": "61mnwO4Mzp", "title": "Denoising Diffusion Variational Inference", "track": "main", "status": "Reject", "tldr": "", "abstract": "Latent variable methods are a powerful tool for representation learning that greatly benefit from expressive variational posteriors, including generative models based on normalizing flows or adversarial networks.\nIn this work, we propose denoising diffusion variational inference, which relies on diffusion models---recent generative algorithms with state-of-the-art sample quality---to fit a complex posterior by performing diffusion in latent space. Our method augments a variational posterior with auxiliary latent variables via a user-specified noising process that transforms a complex latent into a simple auxiliary latent. The approximate posterior then reverses this noising process by optimizing a lower bound on the marginal likelihood inspired by the wake-sleep algorithm. Our method can be used to fit deep latent variable models, which yields the DiffVAE algorithm. This algorithm is especially effective at dimensionality reduction and representation learning, where it outperforms methods based on adversarial training or invertible flow-based posteriors. 
We use this algorithm on a motivating task in biology---inferring latent ancestry from human genomes---and show that it outperforms strong baselines on the 1000 Genomes dataset.", "keywords": "visualization;vae;diffusion models;representation learning", "primary_area": "generative models", "supplementary_material": "", "author": "Top Piriyakulkij;Yingheng Wang;Volodymyr Kuleshov", "authorids": "~Top_Piriyakulkij1;~Yingheng_Wang1;~Volodymyr_Kuleshov1", "gender": "M;M;", "homepage": "https://www.cs.cornell.edu/~wp237/;https://isjakewong.github.io/publications/;https://www.cs.cornell.edu/~kuleshov/", "dblp": "305/7203;265/6357;81/8612", "google_scholar": "nlO1TkkAAAAJ;4WEa7tMAAAAJ;RY_t8XAAAAAJ", "orcid": ";;", "linkedin": ";;", "or_profile": "~Top_Piriyakulkij1;~Yingheng_Wang1;~Volodymyr_Kuleshov1", "aff": "Cornell University;Cornell University;Cornell University", "aff_domain": "cs.cornell.edu;cornell.edu;cornell.edu", "position": "PhD student;PhD student;Assistant Professor", "bibtex": "@misc{\npiriyakulkij2024denoising,\ntitle={Denoising Diffusion Variational Inference},\nauthor={Top Piriyakulkij and Yingheng Wang and Volodymyr Kuleshov},\nyear={2024},\nurl={https://openreview.net/forum?id=61mnwO4Mzp}\n}", "github": "", "project": "", "reviewers": "3sxG;18s7;t61r;Qkoy", "site": "https://openreview.net/forum?id=61mnwO4Mzp", "pdf_size": 3067837, "rating": "3;5;5;5", "confidence": "3;4;3;4", "soundness": "2;2;2;3", "contribution": "2;2;2;2", "presentation": "2;2;2;3", "wc_summary": "77;65;205;107", "wc_strengths": "24;33;125;50", "wc_weaknesses": "100;316;184;136", "wc_questions": "83;124;36;272", "wc_review": "284;538;550;565", "wc_reply_reviewers": "0;203;129;12", "wc_reply_authors": "1996;1789;1091;1425", "reply_reviewers": "0;1;1;1", "reply_authors": "4;3;3;3", "rating_avg": [ 4.5, 0.8660254037844386 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 113.5, 54.99772722576816 ], "wc_strengths_avg": [ 58.0, 39.79321550214308 ], "wc_weaknesses_avg": [ 184.0, 81.82909018191513 ], "wc_questions_avg": [ 128.75, 88.37243631359271 ], "wc_review_avg": [ 484.25, 116.00942849613561 ], "wc_reply_reviewers_avg": [ 86.0, 84.27633119684316 ], "wc_reply_authors_avg": [ 1575.25, 346.33536853749143 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 3.25, 0.4330127018922193 ], "replies_avg": [ 23, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.5773502691896257, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:uq11FH4MoRQJ:scholar.google.com/&scioq=Denoising+Diffusion+Variational+Inference&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;0", "aff_unique_norm": "Cornell University", "aff_unique_dep": "", "aff_unique_url": "https://www.cornell.edu", "aff_unique_abbr": "Cornell", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "title": "In-Context Learning Dynamics with Random Binary Sequences", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19405", "id": "62K7mALO2q", "author_site": "Eric Bigelow, Ekdeep Singh Lubana, Robert Dick, Hidenori Tanaka, Tomer Ullman", "tldr": "", "abstract": "Large language models (LLMs) trained on huge text datasets demonstrate intriguing capabilities, achieving state-of-the-art performance on tasks they were not explicitly trained for. 
The precise nature of LLM capabilities is often mysterious, and different prompts can elicit different capabilities through in-context learning. We propose a framework that enables us to analyze in-context learning dynamics to understand latent concepts underlying LLMs\u2019 behavioral patterns. This provides a more nuanced understanding than success-or-failure evaluation benchmarks, but does not require observing internal activations as a mechanistic interpretation of circuits would. Inspired by the cognitive science of human randomness perception, we use random binary sequences as context and study dynamics of in-context learning by manipulating properties of context data, such as sequence length. In the latest GPT-3.5+ models, we find emergent abilities to generate seemingly random numbers and learn basic formal languages, with striking in-context learning dynamics where model outputs transition sharply from seemingly random behaviors to deterministic repetition.", "keywords": "In-Context Learning;Large Language Models;Interpretability;Computational Cognitive Science", "primary_area": "visualization or interpretation of learned representations", "supplementary_material": "", "author": "Eric J Bigelow;Ekdeep Singh Lubana;Robert P. Dick;Hidenori Tanaka;Tomer Ullman", "authorids": "~Eric_J_Bigelow1;~Ekdeep_Singh_Lubana1;~Robert_P._Dick1;~Hidenori_Tanaka1;~Tomer_Ullman1", "gender": ";M;M;;", "homepage": ";https://ekdeepslubana.github.io/;http://robertdick.org/;https://sites.google.com/view/htanaka/home;", "dblp": ";228/2683;84/523.html;;", "google_scholar": ";https://scholar.google.co.in/citations?user=OP7S3vsAAAAJ;;f_pWOGIAAAAJ;", "orcid": ";;;;", "linkedin": ";;;;", "or_profile": "~Eric_J_Bigelow1;~Ekdeep_Singh_Lubana1;~Robert_P._Dick1;~Hidenori_Tanaka1;~Tomer_Ullman1", "aff": ";University of Michigan;University of Michigan;Physics & Informatics Lab, NTT Research, Inc.;", "aff_domain": ";umich.edu;umich.edu;ntt-research.com;", "position": ";PhD student;Full Professor;Senior Research Scientist;", "bibtex": "@inproceedings{\nbigelow2024incontext,\ntitle={In-Context Learning Dynamics with Random Binary Sequences},\nauthor={Eric J Bigelow and Ekdeep Singh Lubana and Robert P. 
Dick and Hidenori Tanaka and Tomer Ullman},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=62K7mALO2q}\n}", "github": "", "project": "", "reviewers": "rqBo;F7kD;xnie;272r", "pdf_size": 6470996, "rating": "6;6;6;6", "confidence": "4;2;3;3", "soundness": "2;2;2;3", "contribution": "3;3;2;2", "presentation": "3;3;3;2", "wc_summary": "229;292;266;49", "wc_strengths": "28;179;266;55", "wc_weaknesses": "138;679;351;188", "wc_questions": "156;197;156;162", "wc_review": "551;1347;1039;454", "wc_reply_reviewers": "9;193;328;37", "wc_reply_authors": "1949;2310;998;1030", "reply_reviewers": "1;1;1;1", "reply_authors": "3;4;2;2", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 3.0, 0.7071067811865476 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 209.0, 95.04998684902591 ], "wc_strengths_avg": [ 132.0, 96.05987716002973 ], "wc_weaknesses_avg": [ 339.0, 211.51004704268777 ], "wc_questions_avg": [ 167.75, 17.06421694658152 ], "wc_review_avg": [ 847.75, 363.6367521304743 ], "wc_reply_reviewers_avg": [ 141.75, 128.36544511666682 ], "wc_reply_authors_avg": [ 1571.75, 572.2789420378842 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 2.75, 0.82915619758885 ], "replies_avg": [ 21, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 5, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11402233474497562685&as_sdt=5,34&sciodt=0,34&hl=en", "gs_version_total": 9, "openreview": "https://openreview.net/forum?id=62K7mALO2q", "pdf": "https://openreview.net/pdf?id=62K7mALO2q", "email": ";umich.edu;umich.edu;ntt-research.com;", "author_num": 5, "aff_unique_index": "0;0;1", "aff_unique_norm": "University of Michigan;NTT Research, Inc.", "aff_unique_dep": ";Physics & Informatics Lab", "aff_unique_url": "https://www.umich.edu;https://www.ntt-research.com", "aff_unique_abbr": "UM;NTT Research", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "639DcBewcJ", "title": "Low-Rank Robust Graph Contrastive Learning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Graph Neural Networks (GNNs) have been widely used to learn node representations and with outstanding performance on various tasks such as node classification. However, noise, which inevitably exists in real-world graph data, would considerably degrade the performance of GNNs revealed by recent studies. In this work, we propose a novel and robust method, Low-Rank Robust Graph Contrastive Learning (LR-RGCL). LR-RGCL performs transductive node classification in two steps. First, a robust GCL encoder named RGCL is trained by prototypical contrastive learning with Bayesian nonparametric Prototype Learning (BPL). Next, using the robust features produced by RGCL, a novel and provable low-rank transductive classification algorithm is used to classify the unlabeled nodes in the graph. Our low-rank transductive classification algorithm is inspired by the low frequency property of the graph data and its labels, and theoretical result on the generalization of our algorithm is provided. To the best of our knowledge, our theoretical result is among the first to demonstrate the advantage of low-rank learning in transductive classification.
Extensive experiments on public benchmarks demonstrate the superior performance of LR-RGCL and the robustness of the learned node representations. The code of LR-RGCL is available at \\url{https://anonymous.4open.science/r/LRR-GCL-3B3C/}.", "keywords": "Low Rank Robust Graph Contrastive Learning;Bayesian Nonparametric Method;Generation Bound;Transductive Learning", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Yancheng Wang;Yingzhen Yang", "authorids": "~Yancheng_Wang2;~Yingzhen_Yang1", "gender": "M;M", "homepage": ";http://yingzhenyang.com", "dblp": ";66/3838.html", "google_scholar": "https://scholar.google.com/citations?hl=en;", "orcid": ";", "linkedin": ";yingzhen-yang-9b869122", "or_profile": "~Yancheng_Wang2;~Yingzhen_Yang1", "aff": "Arizona State University;Arizona State University", "aff_domain": "asu.edu;asu.edu", "position": "PhD student;Assistant Professor", "bibtex": "@misc{\nwang2024lowrank,\ntitle={Low-Rank Robust Graph Contrastive Learning},\nauthor={Yancheng Wang and Yingzhen Yang},\nyear={2024},\nurl={https://openreview.net/forum?id=639DcBewcJ}\n}", "github": "", "project": "", "reviewers": "9AcT;wZD8;X4pk;FuBV", "site": "https://openreview.net/forum?id=639DcBewcJ", "pdf_size": 2367883, "rating": "1;3;3;6", "confidence": "5;4;4;4", "soundness": "1;2;2;3", "contribution": "1;2;1;2", "presentation": "1;1;3;2", "wc_summary": "41;85;22;68", "wc_strengths": "18;48;16;86", "wc_weaknesses": "169;73;142;226", "wc_questions": "2;318;67;133", "wc_review": "230;524;247;513", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 3.25, 1.7853571071357126 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 2.0, 0.7071067811865476 ], "contribution_avg": [ 1.5, 0.5 ], "presentation_avg": [ 1.75, 0.82915619758885 ], "wc_summary_avg": [ 54.0, 24.238399287081645 ], "wc_strengths_avg": [ 42.0, 28.39013913315678 ], "wc_weaknesses_avg": [ 152.5, 55.01136246267674 ], "wc_questions_avg": [ 130.0, 118.0105927448888 ], "wc_review_avg": [ 378.5, 140.18291622020138 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.7276068751089989, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:C6-2RMC3mtsJ:scholar.google.com/&scioq=Low-Rank+Robust+Graph+Contrastive+Learning&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "Arizona State University", "aff_unique_dep": "", "aff_unique_url": "https://www.asu.edu", "aff_unique_abbr": "ASU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "id": "63r6HyqyRm", "title": "A Vision-free Baseline for Multimodal Grammar Induction", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Past work has shown that paired vision-language signals substantially improve grammar induction in multimodal datasets such as MSCOCO. We investigate whether advancements in large language models (LLMs) that are only trained with text could provide strong assistance for grammar induction in multimodal settings. 
We find that our text-only approach, an LLM-based C-PCFG (LC-PCFG), outperforms previous multi-modal methods, and achieves state-of-the-art grammar induction performance for various multimodal datasets. Compared to image-aided grammar induction, LC-PCFG outperforms the prior state-of-the-art by $7.9$ Corpus-F1 points, with an $85$\\% reduction in parameter count and $1.7\\times$ faster training speed. Across three video-assisted grammar induction benchmarks, LC-PCFG outperforms prior state-of-the-art by up to $7.7$ Corpus-F1, with $8.8\\times$ faster training. These results shed light on the notion that text-only language models might include visually grounded cues that aid in grammar induction in multimodal contexts. Moreover, our results emphasize the importance of establishing a robust vision-free baseline when evaluating the benefit of multimodal approaches.", "keywords": "Grammar Induction;Multimodal;Language Models", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/26a52c375b7f08f3c661dd1c97c6c87f56a7a0cf.pdf", "author": "Boyi Li;Rodolfo Corona;Karttikeya Mangalam;Catherine Chen;Daniel Flaherty;Serge Belongie;Kilian Q Weinberger;Jitendra Malik;Trevor Darrell;Dan Klein", "authorids": "~Boyi_Li1;~Rodolfo_Corona1;~Karttikeya_Mangalam1;~Catherine_Chen2;~Daniel_Flaherty1;~Serge_Belongie1;~Kilian_Q_Weinberger1;~Jitendra_Malik2;~Trevor_Darrell2;~Dan_Klein1", "gender": "F;;M;;;M;M;M;;", "homepage": "https://sites.google.com/site/boyilics/home;https://rcorona.github.io/;http://karttikeya.github.io/;;;https://di.ku.dk/english/staff/?pure=en%2Fpersons%2Fserge-belongie(0ce65383-3761-4b17-948a-83b461e371e2)%2Fpublications.html;http://www.cs.cornell.edu/~kilian/;https://people.eecs.berkeley.edu/~malik/;;http://people.eecs.berkeley.edu/~klein/", "dblp": ";212/0412;200/8205;;;http://dblp.uni-trier.de/pers/hd/b/Belongie:Serge_J=;88/4801;58/2944;;", "google_scholar": ";J2Z-ChoAAAAJ;2l1fWEoAAAAJ;;;ORr4XJYAAAAJ;jsxk8vsAAAAJ;oY9R5YQAAAAJ;;", "orcid": ";;;;;0000-0002-0388-5217;0009-0008-9313-7239;0000-0003-3695-1580;;", "linkedin": ";;;;daniel-flaherty-37a551164/;sergebelongie;;;;dan-klein/", "or_profile": "~Boyi_Li1;~Rodolfo_Corona1;~Karttikeya_Mangalam1;~Catherine_Chen2;~Daniel_Flaherty1;~Serge_Belongie1;~Kilian_Q_Weinberger1;~Jitendra_Malik2;~Trevor_Darrell2;~Dan_Klein1", "aff": "University of California, Berkeley;University of California, Berkeley;University of California, Berkeley;;;University of Copenhagen;ASAPP Inc.;University of California, Berkeley;;University of California, Berkeley", "aff_domain": "berkeley.edu;berkeley.edu;berkeley.edu;;;ku.dk;asapp.com;berkeley.edu;;berkeley.edu", "position": "Postdoc;PhD student;PhD student;;;Full Professor;Principal Researcher;Full Professor;;Full Professor", "bibtex": "@misc{\nli2024a,\ntitle={A Vision-free Baseline for Multimodal Grammar Induction},\nauthor={Boyi Li and Rodolfo Corona and Karttikeya Mangalam and Catherine Chen and Daniel Flaherty and Serge Belongie and Kilian Q Weinberger and Jitendra Malik and Trevor Darrell and Dan Klein},\nyear={2024},\nurl={https://openreview.net/forum?id=63r6HyqyRm}\n}", "github": "", "project": "", "reviewers": "5YMo;gdiQ;qYkX", "site": "https://openreview.net/forum?id=63r6HyqyRm", "pdf_size": 650980, "rating": "1;3;3", "confidence": "4;5;2", "soundness": "1;2;1", "contribution": "2;2;1", "presentation": "3;3;2", "wc_summary": "37;114;46", "wc_strengths": "13;38;18", "wc_weaknesses": "449;248;149", "wc_questions": "29;2;27", "wc_review": "528;402;240", 
"wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 2.3333333333333335, 0.9428090415820634 ], "confidence_avg": [ 3.6666666666666665, 1.247219128924647 ], "soundness_avg": [ 1.3333333333333333, 0.4714045207910317 ], "contribution_avg": [ 1.6666666666666667, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 65.66666666666667, 34.373762603991366 ], "wc_strengths_avg": [ 23.0, 10.801234497346433 ], "wc_weaknesses_avg": [ 282.0, 124.8118584109699 ], "wc_questions_avg": [ 19.333333333333332, 12.283683848458853 ], "wc_review_avg": [ 390.0, 117.881296226331 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 10, 0 ], "corr_rating_confidence": -0.18898223650461357, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=2350422626928522004&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 2, "aff_unique_index": "0;0;0;1;2;0;0", "aff_unique_norm": "University of California, Berkeley;University of Copenhagen;ASAPP Inc.", "aff_unique_dep": ";;", "aff_unique_url": "https://www.berkeley.edu;https://www.ku.dk;https://www.asapp.com", "aff_unique_abbr": "UC Berkeley;UCPH;ASAPP", "aff_campus_unique_index": "0;0;0;0;0", "aff_campus_unique": "Berkeley;", "aff_country_unique_index": "0;0;0;1;0;0;0", "aff_country_unique": "United States;Denmark" }, { "id": "648Mq6Neuo", "title": "Guide Your Anomaly with Language", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Anomaly detection is the task of identifying data that is different from what is considered normal.\nRecent advances in deep learning have improved the performance of anomaly detection and are used in many applications.\nHowever, it can be difficult to create a model that reflects the desired normality due to various issues, including lack of data and nuisance factors.\nTo address this, there have been studies that provide the desired knowledge to the model in various ways, but there are limitations, such as the need to understand deep learning. 
\nIn this work, we propose a method to guide the desired normality boundary in an image anomaly detection task using natural language.\nBy leveraging the robust generalization capabilities of the vision-language model, we present Language-Assisted Feature Transformation.\nLAFT transforms image features to suit the task through natural language using the shared image-text embedding space of CLIP.\nWe extensively analyze the effectiveness of the concept on a toy dataset and show that it works effectively on real-world datasets.", "keywords": "anomaly detection;vision-language model;language guidance;out-of-distribution detection", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "EungGu Yun;Heonjin Ha;Yeongwoo Nam;Bryan Dongik Lee", "authorids": "~EungGu_Yun1;~Heonjin_Ha1;~Yeongwoo_Nam2;~Bryan_Dongik_Lee1", "gender": "M;M;M;", "homepage": "https://yuneg11.github.io;https://github.com/Heonjin;;https://bryandlee.me", "dblp": ";;271/2576;", "google_scholar": "r7-847MAAAAJ;;8BYFKbYAAAAJ;", "orcid": "0000-0002-4648-1415;;;", "linkedin": "yuneg/;;;", "or_profile": "~EungGu_Yun1;~Heonjin_Ha1;~Yeongwoo_Nam2;~Bryan_Dongik_Lee1", "aff": "SAIGE;LG UPLUS;Saige Research;Saige", "aff_domain": "saige.ai;lguplus.co.kr;saigeresearch.ai;saige.ai", "position": "Researcher;Researcher;Researcher;Researcher", "bibtex": "@misc{\nyun2024guide,\ntitle={Guide Your Anomaly with Language},\nauthor={EungGu Yun and Heonjin Ha and Yeongwoo Nam and Bryan Dongik Lee},\nyear={2024},\nurl={https://openreview.net/forum?id=648Mq6Neuo}\n}", "github": "", "project": "", "reviewers": "e9uy;AWhP;rVqL;h8da", "site": "https://openreview.net/forum?id=648Mq6Neuo", "pdf_size": 796590, "rating": "3;3;3;5", "confidence": "5;4;5;3", "soundness": "2;1;2;3", "contribution": "2;1;2;2", "presentation": "1;2;2;3", "wc_summary": "48;100;115;33", "wc_strengths": "64;23;47;39", "wc_weaknesses": "282;175;312;159", "wc_questions": "2;4;5;93", "wc_review": "396;302;479;324", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 3.5, 0.8660254037844386 ], "confidence_avg": [ 4.25, 0.82915619758885 ], "soundness_avg": [ 2.0, 0.7071067811865476 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 2.0, 0.7071067811865476 ], "wc_summary_avg": [ 74.0, 34.32928778754374 ], "wc_strengths_avg": [ 43.25, 14.771171246722448 ], "wc_weaknesses_avg": [ 232.0, 66.1021936095921 ], "wc_questions_avg": [ 26.0, 38.6975451417787 ], "wc_review_avg": [ 375.25, 69.25812226735576 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.8703882797784891, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:Q94gyLMwpPkJ:scholar.google.com/&scioq=Guide+Your+Anomaly+with+Language&hl=en&as_sdt=0,7", "gs_version_total": 0, "aff_unique_index": "0;1;2;0", "aff_unique_norm": "SAIGE;LG;Saige Research", "aff_unique_dep": ";LG UPLUS;", "aff_unique_url": ";https://www.lguplus.com;", "aff_unique_abbr": ";LG UPLUS;", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "1", "aff_country_unique": ";South Korea" }, { "title": "Compressed Context Memory for Online Language Model Interaction", "status": "Poster", "track": "main", "site": 
"https://iclr.cc/virtual/2024/poster/19404", "id": "64kSvC4iPg", "author_site": "Jang-Hyun Kim, Junyoung Yeom, Sangdoo Yun, Hyun Oh Song", "tldr": "", "abstract": "This paper presents a context key/value compression method for Transformer language models in online scenarios, where the context continually expands. As the context lengthens, the attention process demands increasing memory and computations, which in turn reduces the throughput of the language model. To address this challenge, we propose a compressed context memory system that continually compresses the accumulating attention key/value pairs into a compact memory space, facilitating language model inference in a limited memory space of computing environments. Our compression process involves integrating a lightweight conditional LoRA into the language model's forward pass during inference, without the need for fine-tuning the model's entire set of weights. We achieve efficient training by modeling the recursive compression process as a single parallelized forward computation. Through evaluations on conversation, personalization, and multi-task learning, we demonstrate that our approach achieves the performance level of a full context model with $5\\times$ smaller context memory size. We further demonstrate the applicability of our approach in a streaming setting with an unlimited context length, outperforming the sliding window approach. Codes are available at https://github.com/snu-mllab/context-memory.", "keywords": "context compression;efficient inference;natural language processing;transformer", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/449f3c12ca22ab9ada2f4e1f4bd472506f80ef3e.zip", "author": "Jang-Hyun Kim;Junyoung Yeom;Sangdoo Yun;Hyun Oh Song", "authorids": "~Jang-Hyun_Kim1;~Junyoung_Yeom1;~Sangdoo_Yun1;~Hyun_Oh_Song1", "gender": "M;M;M;M", "homepage": "https://yeomjy.com;https://sangdooyun.github.io/;https://mllab.snu.ac.kr/hyunoh;https://janghyun1230.github.io/", "dblp": ";124/3009.html;05/10781;", "google_scholar": "L0TXeqoAAAAJ;o0qtjzYAAAAJ;ScoZZPsAAAAJ;8JKsHJcAAAAJ", "orcid": ";;;", "linkedin": "yeomjy;;hyun-oh-song-5a39b03;", "or_profile": "~Junyoung_Yeom1;~Sangdoo_Yun1;~Hyun_Oh_Song1;~JangHyun_Kim1", "aff": "Seoul National University;NAVER;Seoul National University;Seoul National University", "aff_domain": "snu.ac.kr;navercorp.com;snu.ac.kr;snu.ac.kr", "position": "Undergrad student;Research Scientist;Associate Professor;PhD student", "bibtex": "@inproceedings{\nkim2024compressed,\ntitle={Compressed Context Memory for Online Language Model Interaction},\nauthor={Jang-Hyun Kim and Junyoung Yeom and Sangdoo Yun and Hyun Oh Song},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=64kSvC4iPg}\n}", "github": "", "project": "", "reviewers": "UgoG;Svka;JvdE;JGpv", "pdf_size": 572156, "rating": "5;6;6;6", "confidence": "4;4;4;4", "soundness": "2;3;3;3", "contribution": "2;3;3;3", "presentation": "3;3;3;3", "wc_summary": "91;124;109;99", "wc_strengths": "34;57;153;107", "wc_weaknesses": "552;64;166;145", "wc_questions": "4;170;100;361", "wc_review": "681;415;528;712", "wc_reply_reviewers": "0;0;68;22", "wc_reply_authors": "1502;821;785;1292", "reply_reviewers": "0;0;1;1", "reply_authors": "3;2;2;3", "rating_avg": [ 5.75, 0.4330127018922193 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], 
"presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 105.75, 12.316147936753602 ], "wc_strengths_avg": [ 87.75, 45.996603135449035 ], "wc_weaknesses_avg": [ 231.75, 188.77814359718658 ], "wc_questions_avg": [ 158.75, 130.79635889427504 ], "wc_review_avg": [ 584.0, 119.88536190878351 ], "wc_reply_reviewers_avg": [ 22.5, 27.76238462380348 ], "wc_reply_authors_avg": [ 1100.0, 306.4041448805809 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 2.5, 0.5 ], "replies_avg": [ 21, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 15, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=844548132790378571&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 9, "openreview": "https://openreview.net/forum?id=64kSvC4iPg", "pdf": "https://openreview.net/pdf?id=64kSvC4iPg", "email": "snu.ac.kr;navercorp.com;snu.ac.kr;snu.ac.kr", "author_num": 4, "aff_unique_index": "0;1;0;0", "aff_unique_norm": "Seoul National University;NAVER Corporation", "aff_unique_dep": ";", "aff_unique_url": "https://www.snu.ac.kr;https://www.naver.com", "aff_unique_abbr": "SNU;NAVER", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "South Korea" }, { "id": "64t9er38Zs", "title": "Learning Deep O($n$)-Equivariant Hyperspheres", "track": "main", "status": "Reject", "tldr": "", "abstract": "This paper presents an approach to learning (deep) $n$D features equivariant under orthogonal transformations, utilizing hyperspheres and regular $n$-simplexes. Our main contributions are theoretical and tackle major challenges in geometric deep learning such as equivariance and invariance under geometric transformations. Namely, we enrich the recently developed theory of steerable 3D spherical neurons---$\\textup{SO}(3)$-equivariant filter banks based on neurons with spherical decision surfaces---by extending said neurons to $n$D, which we call deep equivariant hyperspheres, and enabling their multi-layer construction. 
Using synthetic and real-world data in $n$D, we experimentally verify our theoretical contributions and find that our approach is superior to the baselines for small training data sets in all but one case.", "keywords": "spherical neurons;rotational equivariance;regular simplexes;geometric deep learning", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/f78ef0ff2009140bd2588ae97905477588036683.zip", "author": "Pavlo Melnyk;Michael Felsberg;M\u00e5rten Wadenb\u00e4ck;Andreas Robinson;Cuong Le", "authorids": "~Pavlo_Melnyk1;~Michael_Felsberg2;~M\u00e5rten_Wadenb\u00e4ck1;~Andreas_Robinson1;~Cuong_Le1", "gender": "M;;M;M;M", "homepage": "https://pavlomelnyk.com;https://liu.se/en/employee/micfe03;https://liu.se/en/employee/marwa32;;", "dblp": "232/3322;00/78;132/2319;158/5786;", "google_scholar": "RhThiI8AAAAJ;https://scholar.google.se/citations?hl=en;6WRQpCQAAAAJ;https://scholar.google.se/citations?user=_4Mg38AAAAAJ;aGtNlKgAAAAJ", "orcid": "0000-0002-6091-861X;0000-0002-6096-3648;0000-0002-0675-2794;;", "linkedin": ";https://linkedin.com/in/michael-felsberg-668a202;;;cuong-le-8811ba16b/", "or_profile": "~Pavlo_Melnyk1;~Michael_Felsberg2;~M\u00e5rten_Wadenb\u00e4ck1;~Andreas_Robinson1;~Cuong_Le1", "aff": "Link\u00f6ping University;Link\u00f6ping University;Link\u00f6ping University;Link\u00f6ping University;Link\u00f6ping University", "aff_domain": "liu.se;liu.se;liu.se;liu.se;liu.se", "position": "PhD student;Full Professor;Assistant Professor;Researcher;PhD student", "bibtex": "@misc{\nmelnyk2024learning,\ntitle={Learning Deep O(\\$n\\$)-Equivariant Hyperspheres},\nauthor={Pavlo Melnyk and Michael Felsberg and M{\\r{a}}rten Wadenb{\\\"a}ck and Andreas Robinson and Cuong Le},\nyear={2024},\nurl={https://openreview.net/forum?id=64t9er38Zs}\n}", "github": "", "project": "", "reviewers": "MJcE;gZ3c;sbi9;RNHY", "site": "https://openreview.net/forum?id=64t9er38Zs", "pdf_size": 539048, "rating": "5;6;6;6", "confidence": "3;4;2;5", "soundness": "4;3;3;3", "contribution": "2;2;2;3", "presentation": "1;3;2;3", "wc_summary": "57;69;169;107", "wc_strengths": "49;41;37;60", "wc_weaknesses": "390;176;394;239", "wc_questions": "132;17;101;197", "wc_review": "628;303;701;603", "wc_reply_reviewers": "301;60;0;0", "wc_reply_authors": "1645;525;333;510", "reply_reviewers": "1;1;0;0", "reply_authors": "3;2;1;1", "rating_avg": [ 5.75, 0.4330127018922193 ], "confidence_avg": [ 3.5, 1.118033988749895 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.25, 0.82915619758885 ], "wc_summary_avg": [ 100.5, 43.64344166080397 ], "wc_strengths_avg": [ 46.75, 8.78564169540279 ], "wc_weaknesses_avg": [ 299.75, 94.91147190935351 ], "wc_questions_avg": [ 111.75, 64.7509652437707 ], "wc_review_avg": [ 558.75, 151.9841685834416 ], "wc_reply_reviewers_avg": [ 90.25, 124.11763573320272 ], "wc_reply_authors_avg": [ 753.25, 520.3596712851602 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.75, 0.82915619758885 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.2581988897471611, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6118510587473492375&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 8, "aff_unique_index": "0;0;0;0;0", "aff_unique_norm": "Link\u00f6ping University", "aff_unique_dep": "", "aff_unique_url": "https://www.liu.se", "aff_unique_abbr": "LiU", 
"aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "Sweden" }, { "id": "658hDy9RwC", "title": "ASPEST: Bridging the Gap Between Active Learning and Selective Prediction", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Selective prediction aims to learn a reliable model that abstains from making predictions when uncertain. These predictions can then be deferred to a humans for further evaluation. As an everlasting challenge for machine learning, in many real-world scenarios, the distribution of test data is different from the training data. This results in more inaccurate predictions, and often increased dependence on humans, which can be difficult and expensive. Active learning aims to lower the overall labeling effort, and hence human dependence, by querying the most informative examples. Selective prediction and active learning have been approached from different angles, with the connection between them missing. In this work, we introduce a new learning paradigm, *active selective prediction*, which aims to query more informative samples from the shifted target domain while increasing accuracy and coverage. For this new paradigm, we propose a simple yet effective approach, ASPEST, that utilizes ensembles of model snapshots with self-training with their aggregated outputs as pseudo labels. Extensive experiments on numerous image, text and structured datasets, which suffer from domain shifts, demonstrate that ASPEST can significantly outperform prior work on selective prediction and active learning (e.g. on the MNIST$\\to$SVHN benchmark with the labeling budget of 100, ASPEST improves the AUACC metric from 79.36% to 88.84%) and achieves more optimal utilization of humans in the loop.", "keywords": "selective prediction;active learning;distribution shifts", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/a0dad8b1c94870ac1c0c2f014a248b8964163805.zip", "author": "Jiefeng Chen;Jinsung Yoon;Sayna Ebrahimi;Sercan O Arik;Somesh Jha;Tomas Pfister", "authorids": "~Jiefeng_Chen2;~Jinsung_Yoon1;~Sayna_Ebrahimi1;~Sercan_O_Arik1;~Somesh_Jha1;~Tomas_Pfister1", "gender": "M;M;F;M;M;M", "homepage": "https://jfc43.github.io/;https://sites.google.com/corp/view/jinsungyoon;https://saynaebrahimi.github.io/;https://www.sercanarik.com/;;http://tomas.pfister.fi", "dblp": "199/3381;173/5409.html;207/7584;;j/SomeshJha;14/8360", "google_scholar": "5mOfQfAAAAAJ;kiFd6A8AAAAJ;wRyjJfMAAAAJ;;BaI7l8QAAAAJ;ahSpJOAAAAAJ", "orcid": ";;;0000-0001-6333-1729;;0009-0004-4088-8718", "linkedin": "jiefeng-chen-aa1769122/;jinsung-yoon-bb7751b8;saynaebrahimi/;;;", "or_profile": "~Jiefeng_Chen2;~Jinsung_Yoon1;~Sayna_Ebrahimi1;~Sercan_O_Arik1;~Somesh_Jha1;~Tomas_Pfister1", "aff": "Amazon;Google;Google;Google;Department of Computer Science, University of Wisconsin, Madison;Google", "aff_domain": "amazon.com;google.com;google.com;google.com;cs.wisc.edu;google.com", "position": "Applied Scientist;Research Scientist;Research Scientist;Research Scientist;Full Professor;Head of Research @ Cloud AI", "bibtex": "@misc{\nchen2024aspest,\ntitle={{ASPEST}: Bridging the Gap Between Active Learning and Selective Prediction},\nauthor={Jiefeng Chen and Jinsung Yoon and Sayna Ebrahimi and Sercan O Arik and Somesh Jha and Tomas Pfister},\nyear={2024},\nurl={https://openreview.net/forum?id=658hDy9RwC}\n}", "github": "", "project": "", "reviewers": "ZEcg;JH3X;YVeK;Fmse", "site": 
"https://openreview.net/forum?id=658hDy9RwC", "pdf_size": 793971, "rating": "3;3;5;6", "confidence": "4;3;4;4", "soundness": "2;2;3;3", "contribution": "2;2;2;3", "presentation": "3;2;3;3", "wc_summary": "86;82;216;131", "wc_strengths": "61;27;73;47", "wc_weaknesses": "62;147;302;38", "wc_questions": "38;4;139;59", "wc_review": "247;260;730;275", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.25, 1.299038105676658 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 128.75, 53.92297747713863 ], "wc_strengths_avg": [ 52.0, 17.11724276862369 ], "wc_weaknesses_avg": [ 137.25, 103.38127248201194 ], "wc_questions_avg": [ 60.0, 49.65380146574882 ], "wc_review_avg": [ 378.0, 203.4686708070803 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.5555555555555555, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=3280544099817102161&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 6, "aff_unique_index": "0;1;1;1;2;1", "aff_unique_norm": "Amazon;Google;University of Wisconsin-Madison", "aff_unique_dep": "Amazon.com, Inc.;Google;Department of Computer Science", "aff_unique_url": "https://www.amazon.com;https://www.google.com;https://www.wisc.edu", "aff_unique_abbr": "Amazon;Google;UW-Madison", "aff_campus_unique_index": "1;1;1;2;1", "aff_campus_unique": ";Mountain View;Madison", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "United States" }, { "title": "Plug-and-Play Posterior Sampling under Mismatched Measurement and Prior Models", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19403", "id": "66arKkGiFy", "author_site": "Marien Renaud, Jiaming Liu, Valentin De Bortoli, Andres Almansa, Ulugbek Kamilov", "tldr": "", "abstract": "Posterior sampling has been shown to be a powerful Bayesian approach for solving imaging inverse problems. The recent plug-and-play unadjusted Langevin algorithm (PnP-ULA) has emerged as a promising method for Monte Carlo sampling and minimum mean squared error (MMSE) estimation by combining physical measurement models with deep-learning priors specified using image denoisers. However, the intricate relationship between the sampling distribution of PnP-ULA and the mismatched data-fidelity and denoiser has not been theoretically analyzed. We address this gap by proposing a posterior-$L_2$ pseudometric and using it to quantify an explicit error bound for PnP-ULA under mismatched posterior distribution. We numerically validate our theory on several inverse problems such as sampling from Gaussian mixture models and image deblurring. 
Our results suggest that the sensitivity of the sampling distribution of PnP-ULA to a mismatch in the measurement model and the denoiser can be precisely characterized.", "keywords": "Inverse problems;plug-and-play priors;posterior sampling;unadjusted Langevin algorithm", "primary_area": "optimization", "supplementary_material": "/attachment/bc84ec14339946dbddcf750e6d2f615cf202b8d3.zip", "author": "Marien Renaud;Jiaming Liu;Valentin De Bortoli;Andres Almansa;Ulugbek Kamilov", "authorids": "~Marien_Renaud1;~Jiaming_Liu3;~Valentin_De_Bortoli1;~Andres_Almansa1;~Ulugbek_Kamilov1", "gender": ";M;;M;Not Specified", "homepage": ";https://jiamingliu-jeremy.github.io/;https://vdeborto.github.io/;http://up5.fr/almansa;https://ukmlv.github.io", "dblp": ";33/5934-1;224/9338;80/6581;73/9223", "google_scholar": ";KEucBooAAAAJ;;e1pFlV0AAAAJ;https://scholar.google.com.tw/citations?user=3qYUSDwAAAAJ", "orcid": ";0000-0002-1042-4443;;0000-0001-8196-1329;0000-0001-6770-3278", "linkedin": ";;;;", "or_profile": "~Marien_Renaud1;~Jiaming_Liu3;~Valentin_De_Bortoli1;~Andres_Almansa1;~Ulugbek_Kamilov1", "aff": ";Washington University, St. Louis;University of Oxford;Universit\u00e9 Paris Cit\u00e9;Google", "aff_domain": ";wustl.edu;ox.ac.uk;parisdescartes.fr;google.com", "position": ";PhD student;Postdoc;Principal Researcher;Visiting Faculty Researcher", "bibtex": "@inproceedings{\nrenaud2024plugandplay,\ntitle={Plug-and-Play Posterior Sampling under Mismatched Measurement and Prior Models},\nauthor={Marien Renaud and Jiaming Liu and Valentin De Bortoli and Andres Almansa and Ulugbek Kamilov},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=66arKkGiFy}\n}", "github": "", "project": "", "reviewers": "Uuqz;WmLx;rc8y;eQV2", "pdf_size": 10303544, "rating": "5;6;6;6", "confidence": "4;3;2;3", "soundness": "2;3;3;4", "contribution": "2;3;3;2", "presentation": "2;3;3;2", "wc_summary": "71;71;44;70", "wc_strengths": "41;78;41;51", "wc_weaknesses": "274;282;92;114", "wc_questions": "5;124;15;133", "wc_review": "391;555;192;368", "wc_reply_reviewers": "0;16;0;41", "wc_reply_authors": "1352;865;773;887", "reply_reviewers": "0;1;0;1", "reply_authors": "3;2;2;3", "rating_avg": [ 5.75, 0.4330127018922193 ], "confidence_avg": [ 3.0, 0.7071067811865476 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 64.0, 11.554220008291344 ], "wc_strengths_avg": [ 52.75, 15.138939857202683 ], "wc_weaknesses_avg": [ 190.5, 87.8905569444181 ], "wc_questions_avg": [ 69.25, 59.44062163201189 ], "wc_review_avg": [ 376.5, 128.63222768808757 ], "wc_reply_reviewers_avg": [ 14.25, 16.768646337734005 ], "wc_reply_authors_avg": [ 969.25, 225.08040230104442 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 2.5, 0.5 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.816496580927726, "gs_citation": 4, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=17100265567993470327&as_sdt=40005&sciodt=0,10&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=66arKkGiFy", "pdf": "https://openreview.net/pdf?id=66arKkGiFy", "email": ";wustl.edu;ox.ac.uk;parisdescartes.fr;google.com", "author_num": 5, "aff_unique_index": "0;1;2;3", "aff_unique_norm": "Washington University in St. 
Louis;University of Oxford;Universit\u00e9 Paris Cit\u00e9;Google", "aff_unique_dep": ";;;Google", "aff_unique_url": "https://wustl.edu;https://www.ox.ac.uk;https://www.universite-paris.fr;https://www.google.com", "aff_unique_abbr": "WUSTL;Oxford;UPC;Google", "aff_campus_unique_index": "0;2", "aff_campus_unique": "St. Louis;;Mountain View", "aff_country_unique_index": "0;1;2;0", "aff_country_unique": "United States;United Kingdom;France" }, { "id": "66e22qCU5i", "title": "Certified Copy: A Resistant Backdoor Attack", "track": "main", "status": "Reject", "tldr": "", "abstract": "The robustness, security, and safety of artificial intelligence systems have become a major concern in recent studies. One of the most significant threats to deep learning models is the backdoor attack, which has been thoroughly investigated. Despite numerous backdoor detection mechanisms developed for computer vision systems, our research shows that even simple backdoor attacks can bypass these defenses if the backdoor planting process and poisoning data are carefully crafted. To evade existing backdoor detection systems, we propose a new backdoored model called Certified Copy, which is trained using a novel cost function. This cost function controls the activation of neurons in the model to ensure that the activation generated by clean inputs is similar to that produced by poisoned input data. The model copies the corresponding clean model during training in all situations except when fed with poisoned inputs. We tested our model against six state-of-the-art defense mechanisms, including Neural Cleanse, TAO, ABS, TABOR, NNoculation, and STRIP. The results showed that most of these methods cannot detect the backdoored model. We conclude that deep learning models have a vast hypothesis space, which can be exploited by malicious attackers to hide malicious activation of neurons using poisoned data, leading to undetected backdoored models.", "keywords": "Backdoor attack;Deep Neural Network;Detection methods", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "Omid Rajabi Rostami;Rui Ning;Chunsheng Xin;Jin-Hee Cho;Jiang Li;Hongyi Wu", "authorids": "~Omid_Rajabi_Rostami1;~Rui_Ning2;~Chunsheng_Xin1;~Jin-Hee_Cho1;~Jiang_Li3;~Hongyi_Wu1", "gender": "M;;M;F;M;M", "homepage": "https://github.com/omidrajabi6868;https://www.lions.odu.edu/~rning/;https://ww1.odu.edu/eng/programs/ccni/people;https://people.cs.vt.edu/~jicho/;https://fs.wp.odu.edu/jli/;http://www.u.arizona.edu/~mhwu/", "dblp": ";211/2892;06/6463;;41/3068-1;78/1033", "google_scholar": ";oN4NttEAAAAJ;TaP2oq8AAAAJ;wToVkEUAAAAJ;https://scholar.google.com/citations?hl=en;rFLksrwAAAAJ", "orcid": ";;;;;", "linkedin": ";;;;jiang-li-416b0a6/;hongyi-\u201cmichael\u201d-wu-4b51a715/", "or_profile": "~Omid_Rajabi_Rostami1;~Rui_Ning2;~Chunsheng_Xin1;~Jin-Hee_Cho1;~Jiang_Li3;~Hongyi_Wu1", "aff": "Old Dominion University;Old Dominion University;Old Dominion University;Virginia Polytechnic Institute and State University;Old Dominion University;University of Arizona", "aff_domain": "odu.edu;odu.edu;odu.edu;vt.edu;odu.edu;arizona.edu", "position": "PhD student;Assistant Professor;Full Professor;Associate Professor;Full Professor;Full Professor", "bibtex": "@misc{\nrostami2024certified,\ntitle={Certified Copy: A Resistant Backdoor Attack},\nauthor={Omid Rajabi Rostami and Rui Ning and Chunsheng Xin and Jin-Hee Cho and Jiang Li and Hongyi Wu},\nyear={2024},\nurl={https://openreview.net/forum?id=66e22qCU5i}\n}", 
"github": "", "project": "", "reviewers": "Tjm9;aXtp;GNhR;eu6h;pLZf;Xd6Y;xbMP", "site": "https://openreview.net/forum?id=66e22qCU5i", "pdf_size": 999185, "rating": "1;3;3;3;3;3;5", "confidence": "4;4;4;4;5;3;4", "soundness": "2;3;3;3;3;2;2", "contribution": "1;2;2;2;1;2;3", "presentation": "2;2;3;3;1;3;3", "wc_summary": "27;88;62;75;16;90;81", "wc_strengths": "10;49;24;45;16;42;32", "wc_weaknesses": "104;149;285;122;46;298;23", "wc_questions": "8;80;47;23;12;48;120", "wc_review": "149;366;418;265;90;478;256", "wc_reply_reviewers": "0;0;0;0;0;0;0", "wc_reply_authors": "0;0;0;0;0;0;0", "reply_reviewers": "0;0;0;0;0;0;0", "reply_authors": "0;0;0;0;0;0;0", "rating_avg": [ 3.0, 1.0690449676496976 ], "confidence_avg": [ 4.0, 0.5345224838248488 ], "soundness_avg": [ 2.5714285714285716, 0.4948716593053935 ], "contribution_avg": [ 1.8571428571428572, 0.6388765649999399 ], "presentation_avg": [ 2.4285714285714284, 0.7284313590846836 ], "wc_summary_avg": [ 62.714285714285715, 27.5873381189595 ], "wc_strengths_avg": [ 31.142857142857142, 13.922526160646191 ], "wc_weaknesses_avg": [ 146.71428571428572, 99.92813744417148 ], "wc_questions_avg": [ 48.285714285714285, 37.281608969395876 ], "wc_review_avg": [ 288.85714285714283, 130.46995118902018 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 9, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:2tZ5pzue08kJ:scholar.google.com/&scioq=Certified+Copy:+A+Resistant+Backdoor+Attack&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;0;1;0;2", "aff_unique_norm": "Old Dominion University;Virginia Tech;University of Arizona", "aff_unique_dep": ";;", "aff_unique_url": "https://www.odu.edu;https://www.vt.edu;https://www.arizona.edu", "aff_unique_abbr": "ODU;VT;UA", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "66wQM45W28", "title": "CEDNet: A Cascade Encoder-Decoder Network for Dense Prediction", "track": "main", "status": "Reject", "tldr": "", "abstract": "Multi-scale features are essential for dense prediction tasks, such as object detection, instance segmentation, and semantic segmentation. The prevailing methods usually utilize a classification backbone to extract multi-scale features and then fuse these features using a lightweight module (e.g. the fusion module in FPN and BiFPN, two typical object detection methods). However, as these methods allocate most computational resources to the classification backbone, the multi-scale feature fusion in these methods is delayed, which may lead to inadequate feature fusion. While some methods perform feature fusion from early stages, they either fail to fully leverage high-level features to guide low-level feature learning or have complex structures, resulting in sub-optimal performance. We propose a streamlined cascade encoder-decoder network, dubbed CEDNet, tailored for dense prediction tasks. All stages in CEDNet share the same encoder-decoder structure and perform multi-scale feature fusion within the decoder. A hallmark of CEDNet is its ability to incorporate high-level features from early stages to guide low-level feature learning in subsequent stages, thereby enhancing the effectiveness of multi-scale feature fusion. We explored three well-known encoder-decoder structures: Hourglass, UNet, and FPN. 
When integrated into CEDNet, they performed much better than traditional methods that use a pre-designed classification backbone combined with a lightweight fusion module. Extensive experiments on object detection, instance segmentation, and semantic segmentation demonstrated the effectiveness of our method. The code will be made publicly available.", "keywords": "dense prediction tasks; encoder-decoder structure", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/037d1625ab4069131a37f36f47f579517f34b318.pdf", "author": "Gang Zhang;Ziyi Li;Chufeng Tang;Jianmin Li;Xiaolin Hu", "authorids": "~Gang_Zhang3;~Ziyi_Li3;~Chufeng_Tang1;~Jianmin_Li1;~Xiaolin_Hu1", "gender": "Not Specified;Not Specified;M;M;M", "homepage": ";https://leezeeyee.com;http://chufengt.github.io/;;http://www.xlhu.cn/", "dblp": ";;https://dblp.uni-trier.de/pid/250/9561;71/5930-1;60/6028-1", "google_scholar": "0QvcF6sAAAAJ;;GS1NtlQAAAAJ;PeF1aPkAAAAJ;PksdgoUAAAAJ", "orcid": ";;0000-0002-5794-1616;;0000-0002-4907-7354", "linkedin": ";;;;", "or_profile": "~Gang_Zhang3;~Ziyi_Li3;~Chufeng_Tang1;~Jianmin_Li1;~Xiaolin_Hu1", "aff": "Tsinghua University;Huazhong University of Science and Technology;;Tsinghua University;Tsinghua University", "aff_domain": "tsinghua.edu.cn;hust.edu.cn;;tsinghua.edu.cn;tsinghua.edu.cn", "position": "PhD student;MS student;;Associate Professor;Associate Professor", "bibtex": "@misc{\nzhang2024cednet,\ntitle={{CEDN}et: A Cascade Encoder-Decoder Network for Dense Prediction},\nauthor={Gang Zhang and Ziyi Li and Chufeng Tang and Jianmin Li and Xiaolin Hu},\nyear={2024},\nurl={https://openreview.net/forum?id=66wQM45W28}\n}", "github": "", "project": "", "reviewers": "XJYk;fhWB;Wmqn;sm4X", "site": "https://openreview.net/forum?id=66wQM45W28", "pdf_size": 257233, "rating": "3;3;5;5", "confidence": "5;5;4;5", "soundness": "3;2;2;3", "contribution": "1;2;2;3", "presentation": "2;3;2;3", "wc_summary": "39;58;29;61", "wc_strengths": "33;38;29;85", "wc_weaknesses": "368;244;83;196", "wc_questions": "5;183;5;38", "wc_review": "445;523;146;380", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 4.75, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 46.75, 13.273563952458284 ], "wc_strengths_avg": [ 46.25, 22.598395960775623 ], "wc_weaknesses_avg": [ 222.75, 102.21882165237477 ], "wc_questions_avg": [ 57.75, 73.5573755649289 ], "wc_review_avg": [ 373.5, 140.76665088010014 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 6, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 19, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10640832804271131810&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 7, "aff_unique_index": "0;1;0;0", "aff_unique_norm": "Tsinghua University;Huazhong University of Science and Technology", "aff_unique_dep": ";", "aff_unique_url": "https://www.tsinghua.edu.cn;http://www.hust.edu.cn", "aff_unique_abbr": "THU;HUST", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "China" }, { "id": "67t4ikhlvP", "title": "Agent-Centric State Discovery for Finite-Memory 
POMDPs", "track": "main", "status": "Reject", "tldr": "", "abstract": "Discovering an informative, or agent-centric, state representation that encodes only the relevant information while discarding the irrelevant is a key challenge towards scaling reinforcement learning algorithms and efficiently applying them to downstream tasks. Prior works studied this problem in high-dimensional Markovian environments, when the current observation may be a complex object but is sufficient to decode the informative state. In this work, we consider the problem of discovering the agent-centric state in the more challenging high-dimensional non-Markovian setting, when the state can be decoded from a sequence of past observations. We establish that generalized inverse models can be adapted for learning agent-centric state representation for this task. Our results include asymptotic theory as well as negative results for alternative intuitive algorithms, such as encoding with only a forward-running sequence model. We complement these findings with a thorough empirical study on the agent-centric state discovery abilities of the different alternatives we put forward. Particularly notable is our analysis of past actions, where we show that these can be a double-edged sword: making the algorithms more successful when used correctly and causing dramatic failure when used incorrectly.", "keywords": "pomdp;finitememory;exobmdp;block mdp;agent-centric states", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/e411a108ca705ec97c4c30b8ac422cdfc9ae06ec.zip", "author": "Lili Wu;Ben Evans;Riashat Islam;Raihan Seraj;Yonathan Efroni;Alex Lamb", "authorids": "~Lili_Wu1;~Ben_Evans1;~Riashat_Islam1;~Raihan_Seraj1;~Yonathan_Efroni2;~Alex_Lamb1", "gender": ";M;M;M;M;M", "homepage": ";https://riashat.github.io/;http://raihan-seraj.github.io/;https://sites.google.com/view/yonathan-efroni/;;https://bennevans.github.io/", "dblp": "91/1716;198/0459;;215/3475;;87/9175", "google_scholar": "x8fnPxAAAAAJ;https://scholar.google.ca/citations?user=2_4Rs44AAAAJ;https://scholar.google.ca/citations?user=gtWzuL0AAAAJ;pfTInEgAAAAJ;https://scholar.google.ca/citations?user=BFzFy1YAAAAJ;JPQom2sAAAAJ", "orcid": ";;;;;", "linkedin": "lili-wu-71456674;;http://linkedin.com/in/raihan-seraj/;;;bnevans/", "or_profile": "~Lili_Wu1;~Riashat_Islam1;~Raihan_Seraj1;~Yonathan_Efroni2;~Alex_Matthew_Lamb1;~Benjamin_Evans1", "aff": "Microsoft Research NYC;Saudi Data and AI Authority, Saudi Data and AI Authority;McGill University;Meta;;New York University", "aff_domain": "microsoft.com;sdaia.gov.sa;mcgill.ca;meta.com;;nyu.edu", "position": "Data and applied scientist;Researcher;PhD student;Researcher;;PhD student", "bibtex": "@misc{\nwu2024agentcentric,\ntitle={Agent-Centric State Discovery for Finite-Memory {POMDP}s},\nauthor={Lili Wu and Ben Evans and Riashat Islam and Raihan Seraj and Yonathan Efroni and Alex Lamb},\nyear={2024},\nurl={https://openreview.net/forum?id=67t4ikhlvP}\n}", "github": "", "project": "", "reviewers": "z5xp;38V6;HgfR;Yoch", "site": "https://openreview.net/forum?id=67t4ikhlvP", "pdf_size": 2673396, "rating": "1;1;5;8", "confidence": "4;3;3;3", "soundness": "2;2;3;4", "contribution": "1;1;3;3", "presentation": "2;1;2;3", "wc_summary": "113;52;108;72", "wc_strengths": "103;6;56;33", "wc_weaknesses": "747;93;239;330", "wc_questions": "54;109;225;131", "wc_review": "1017;260;628;566", "wc_reply_reviewers": "724;0;0;41", "wc_reply_authors": "908;281;380;329", "reply_reviewers": "2;0;0;1", "reply_authors": 
"2;1;1;1", "rating_avg": [ 3.75, 2.947456530637899 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.82915619758885 ], "contribution_avg": [ 2.0, 1.0 ], "presentation_avg": [ 2.0, 0.7071067811865476 ], "wc_summary_avg": [ 86.25, 25.321680433968044 ], "wc_strengths_avg": [ 49.5, 35.59845502265512 ], "wc_weaknesses_avg": [ 352.25, 243.08370471917692 ], "wc_questions_avg": [ 129.75, 61.730766235322236 ], "wc_review_avg": [ 617.75, 269.33656918435713 ], "wc_reply_reviewers_avg": [ 191.25, 308.0384513335957 ], "wc_reply_authors_avg": [ 474.5, 252.71772791001425 ], "reply_reviewers_avg": [ 0.75, 0.82915619758885 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.538672317561831, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=16438357080989642346&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 2, "aff_unique_index": "0;1;2;3;4", "aff_unique_norm": "Microsoft;Saudi Data and AI Authority;McGill University;Meta;New York University", "aff_unique_dep": "Microsoft Research;;;Meta Platforms, Inc.;", "aff_unique_url": "https://www.microsoft.com/en-us/research/group/microsoft-research-new-york-city;https://sdaia.gov.sa;https://www.mcgill.ca;https://meta.com;https://www.nyu.edu", "aff_unique_abbr": "MSR NYC;SDAIA;McGill;Meta;NYU", "aff_campus_unique_index": "0", "aff_campus_unique": "New York City;", "aff_country_unique_index": "0;1;2;0;0", "aff_country_unique": "United States;Saudi Arabia;Canada" }, { "id": "68k0KcHFrW", "title": "Stochastic Unrolled Federated Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "Algorithm unrolling has emerged as a learning-based optimization paradigm that unfolds truncated iterative algorithms in trainable neural-network optimizers. We introduce Stochastic UnRolled Federated learning (SURF), a method that expands algorithm unrolling to a federated learning scenario. Our proposed method tackles two challenges of this expansion, namely the need to feed whole datasets to the unrolled optimizers to find a descent direction and the decentralized nature of federated learning. We circumvent the former challenge by feeding stochastic mini-batches to each unrolled layer and imposing descent constraints to mitigate the randomness induced by using mini-batches. We address the latter challenge by unfolding the distributed gradient descent (DGD) algorithm in a graph neural network (GNN)-based unrolled architecture, which preserves the decentralized nature of training in federated learning. We theoretically prove that our proposed unrolled optimizer converges to a near-optimal region infinitely often. 
Through extensive numerical experiments, we also demonstrate the effectiveness of the proposed framework in collaborative training of image classifiers.", "keywords": "Algorithm Unrolling;Learning to Optimize;GNNs;Federated Learning", "primary_area": "optimization", "supplementary_material": "", "author": "Samar Hadou;Navid NaderiAlizadeh;Alejandro Ribeiro", "authorids": "~Samar_Hadou1;~Navid_NaderiAlizadeh2;~Alejandro_Ribeiro1", "gender": "F;M;M", "homepage": ";https://alelab.seas.upenn.edu;https://www.seas.upenn.edu/~nnaderi/", "dblp": "304/2692.html;32/15;126/5064.html", "google_scholar": "https://scholar.google.com.eg/citations?user=FwL_RdEAAAAJ;7mrPM4kAAAAJ;roVp_WwAAAAJ", "orcid": ";0000-0003-4230-9906;0000-0002-4891-6726", "linkedin": ";;navid-naderi-alizadeh/", "or_profile": "~Samar_Hadou1;~Alejandro_Ribeiro1;~Navid_Naderializadeh1", "aff": "University of Pennsylvania;University of Pennsylvania;Duke University", "aff_domain": "seas.upenn.edu;upenn.edu;duke.edu", "position": "PhD student;Full Professor;Assistant Research Professor", "bibtex": "@misc{\nhadou2024stochastic,\ntitle={Stochastic Unrolled Federated Learning},\nauthor={Samar Hadou and Navid NaderiAlizadeh and Alejandro Ribeiro},\nyear={2024},\nurl={https://openreview.net/forum?id=68k0KcHFrW}\n}", "github": "", "project": "", "reviewers": "94iK;DuLq;WDdi", "site": "https://openreview.net/forum?id=68k0KcHFrW", "pdf_size": 509193, "rating": "5;6;6", "confidence": "4;4;2", "soundness": "4;3;3", "contribution": "3;2;2", "presentation": "4;3;3", "wc_summary": "65;134;49", "wc_strengths": "59;150;84", "wc_weaknesses": "219;305;87", "wc_questions": "9;68;84", "wc_review": "352;657;304", "wc_reply_reviewers": "170;0;0", "wc_reply_authors": "1511;605;355", "reply_reviewers": "1;0;0", "reply_authors": "4;1;1", "rating_avg": [ 5.666666666666667, 0.4714045207910317 ], "confidence_avg": [ 3.3333333333333335, 0.9428090415820634 ], "soundness_avg": [ 3.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 3.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 82.66666666666667, 36.88119062912994 ], "wc_strengths_avg": [ 97.66666666666667, 38.38691906829143 ], "wc_weaknesses_avg": [ 203.66666666666666, 89.65613321029534 ], "wc_questions_avg": [ 53.666666666666664, 32.25247621845836 ], "wc_review_avg": [ 437.6666666666667, 156.32515970103967 ], "wc_reply_reviewers_avg": [ 56.666666666666664, 80.13876853447539 ], "wc_reply_authors_avg": [ 823.6666666666666, 496.61878963871493 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 2.0, 1.4142135623730951 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.4999999999999999, "gs_citation": 6, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=15721589579304828873&as_sdt=80000005&sciodt=0,23&hl=en", "gs_version_total": 4, "aff_unique_index": "0;0;1", "aff_unique_norm": "University of Pennsylvania;Duke University", "aff_unique_dep": ";", "aff_unique_url": "https://www.upenn.edu;https://www.duke.edu", "aff_unique_abbr": "UPenn;Duke", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "69eQ7n4mam", "title": "Autoencoders with Intrinsic Dimension Constraints for Learning Low Dimensional Image Representations", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Autoencoders have achieved great success in various computer vision applications. 
The autoencoder learns appropriate low-dimensional image representations through the self-supervised paradigm, i.e., reconstruction. Existing studies mainly focus on minimizing the pixel-level reconstruction error of an image, while mostly ignoring the preservation of the property that reveals the manifold structure of data, such as Intrinsic Dimension (ID). The learning process of most autoencoders is observed to involve dimensionality compression first, and then dimensionality expansion, which plays a crucial role in acquiring low-dimensional image representations. Motivated by the important role of ID, in this work, we propose a novel deep representation learning approach with autoencoder, which incorporates regularization of the global and local ID constraints into the reconstruction of data representations. This approach not only preserves the global manifold structure of the whole dataset but also maintains the local manifold structure of the feature maps of each point, which makes the learned low-dimensional features more discriminant and improves the performance of the downstream tasks. To the best of our knowledge, existing works are rare and limited in exploiting both global and local ID invariant properties on the regularization of DNNs. Numerical experimental results on benchmark datasets (Extended Yale B, Caltech101 and ImageNet) show that the resulting regularized learning models achieve better discriminative representations for downstream tasks including image classification and clustering.", "keywords": "Self-supervised Representation Learning;Intrinsic Dimension", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/280a5184344e7d6ea7b4298a7f9bf96cde229757.pdf", "author": "Jianzhang Zheng;Hao Shen;Xuan Tang;Mingsong Chen;peidong liang;Xian Wei", "authorids": "~Jianzhang_Zheng1;~Hao_Shen1;~Xuan_Tang3;~Mingsong_Chen1;~peidong_liang1;~Xian_Wei1", "gender": ";M;F;M;M;M", "homepage": ";;https://faculty.ecnu.edu.cn/_s15/tx2_21642/main.psp;https://faculty.ecnu.edu.cn/_s43/cms/main.psp;http://hitqz.com;https://www.researchgate.net/", "dblp": ";26/2210-2;;95/573.html;;139/0725", "google_scholar": ";Kce9W-8AAAAJ;mFj-I10AAAAJ;93A6b7YAAAAJ;;https://scholar.google.com/citations?hl=en", "orcid": ";;;0000-0002-3922-0989;;", "linkedin": ";;;;;", "or_profile": "~Jianzhang_Zheng1;~Hao_Shen1;~Xuan_Tang3;~Mingsong_Chen1;~peidong_liang1;~Xian_Wei1", "aff": ";Fortiss GmbH;East China Normal University;East China Normal University;Fujian(Quanzhou)Advanced Manufacturing Institute;East China Normal University", "aff_domain": ";fortiss.org;ecnu.edu.cn;ecnu.edu.cn;hitqz.com;ecnu.edu.cn", "position": ";Principal Researcher;Associate Professor;Full Professor;Researcher;Principal Researcher", "bibtex": "@misc{\nzheng2024autoencoders,\ntitle={Autoencoders with Intrinsic Dimension Constraints for Learning Low Dimensional Image Representations},\nauthor={Jianzhang Zheng and Hao Shen and Xuan Tang and Mingsong Chen and peidong liang and Xian Wei},\nyear={2024},\nurl={https://openreview.net/forum?id=69eQ7n4mam}\n}", "github": "", "project": "", "reviewers": "dwAb;mtEJ;XqLA;3713;UAX2", "site": "https://openreview.net/forum?id=69eQ7n4mam", "pdf_size": 4120403, "rating": "3;3;5;5;6", "confidence": "4;4;3;4;4", "soundness": "3;2;3;2;3", "contribution": "1;1;2;2;3", "presentation": "2;2;3;3;3", "wc_summary": "191;33;83;29;156", "wc_strengths": "42;19;89;34;137", "wc_weaknesses": "327;123;510;29;127", "wc_questions": 
"64;39;325;269;5", "wc_review": "624;214;1007;361;425", "wc_reply_reviewers": "0;0;0;0;0", "wc_reply_authors": "0;0;0;0;0", "reply_reviewers": "0;0;0;0;0", "reply_authors": "0;0;0;0;0", "rating_avg": [ 4.4, 1.2 ], "confidence_avg": [ 3.8, 0.39999999999999997 ], "soundness_avg": [ 2.6, 0.4898979485566356 ], "contribution_avg": [ 1.8, 0.7483314773547883 ], "presentation_avg": [ 2.6, 0.4898979485566356 ], "wc_summary_avg": [ 98.4, 65.15090175891658 ], "wc_strengths_avg": [ 64.2, 43.27308632394967 ], "wc_weaknesses_avg": [ 223.2, 173.2263259438357 ], "wc_questions_avg": [ 140.4, 130.43557796858954 ], "wc_review_avg": [ 526.2, 274.12945846807486 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.25000000000000006, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:JEQt4nYzxHkJ:scholar.google.com/&scioq=Autoencoders+with+Intrinsic+Dimension+Constraints+for+Learning+Low+Dimensional+Image+Representations&hl=en&as_sdt=0,44", "gs_version_total": 3, "aff_unique_index": "0;1;1;2;1", "aff_unique_norm": "fortiss GmbH;East China Normal University;Fujian Advanced Manufacturing Institute", "aff_unique_dep": ";;", "aff_unique_url": "https://www.fortiss.org;http://www.ecnu.edu.cn;", "aff_unique_abbr": "Fortiss;ECNU;", "aff_campus_unique_index": "1", "aff_campus_unique": ";Quanzhou", "aff_country_unique_index": "0;1;1;1;1", "aff_country_unique": "Germany;China" }, { "title": "DreamClean: Restoring Clean Image Using Deep Diffusion Prior", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19402", "id": "6ALuy19mPa", "author_site": "Jie Xiao, Ruili Feng, Zhiheng Liu, Zhantao Yang, Han Zhang, Yurui Zhu, Xueyang Fu, Kai Zhu, Yu Liu, Zheng-Jun Zha", "tldr": "", "abstract": "Image restoration poses a garners substantial interest due to the exponential surge in demands for recovering high-quality images from diverse mobile camera devices, adverse lighting conditions, suboptimal shooting environments, and frequent image compression for efficient transmission purposes. Yet this problem gathers significant challenges as people are blind to the type of restoration the images suffer, which, is usually the case in real-day scenarios and is most urgent to solve for this field. Current research, however, heavily relies on prior knowledge of the restoration type, either explicitly through rules or implicitly through the availability of degraded-clean image pairs to define the restoration process, and consumes considerable effort to collect image pairs of vast degradation types. This paper introduces DreamClean, a training-free method that needs no degradation prior knowledge but yields high-fidelity and generality towards various types of image degradation. DreamClean embeds the degraded image back to the latent of pre-trained diffusion models and re-sample it through a carefully designed diffusion process that mimics those generating clean images. Thanks to the rich image prior in diffusion models and our novel Variance Preservation Sampling (VPS) technique, DreamClean manages to handle various different degradation types at one time and reaches far more satisfied final quality than previous competitors. 
DreamClean relies on elegant theoretical supports to assure its convergence to clean image when VPS has appropriate parameters, and also enjoys superior experimental performance over various challenging tasks that could be overwhelming for previous methods when degradation prior is unavailable.", "keywords": "Image Restoration;Diffusion Models;Image Prior;Blind Restoration;Super-Resolution;Image Denoising;Colorization;JPEG Artifacts Correction", "primary_area": "generative models", "supplementary_material": "/attachment/090bf70903cc485c4c66bf265ac0de64a6c05823.pdf", "author": "Jie Xiao;Ruili Feng;Han Zhang;Zhiheng Liu;Zhantao Yang;Yurui Zhu;Xueyang Fu;Kai Zhu;Yu Liu;Zheng-Jun Zha", "authorids": "~Jie_Xiao3;~Ruili_Feng1;~Han_Zhang16;~Zhiheng_Liu1;~Zhantao_Yang1;~Yurui_Zhu1;~Xueyang_Fu1;~Kai_Zhu4;~Yu_Liu23;~Zheng-Jun_Zha2", "gender": "M;;M;M;M;M;;M;M;M", "homepage": "https://jiexiaou.github.io/;https://github.com/RuiLiFeng;https://github.com/bibona;https://Johanan528.github.io;;;;https://github.com/liuyuyuil;;https://xueyangfu.github.io/", "dblp": "15/3437-2;20/9594;26/4189-10;;285/8489.html;282/6550;75/4078-4;97/2274-63;23/1818;136/9389", "google_scholar": "https://scholar.google.com/citations?hl=en;;;LT5JwlcAAAAJ;Fz3X5FwAAAAJ;;https://scholar.google.com.hk/citations?hl=zh-CN;8zksQb4AAAAJ;;https://scholar.google.com/citations?hl=zh-CN", "orcid": "0000-0002-5677-270X;;;;0000-0003-2765-295X;;;;;0000-0001-8036-4071", "linkedin": ";;;;;;;;;", "or_profile": "~Jie_Xiao3;~Ruili_Feng1;~Han_Zhang16;~Zhiheng_Liu1;~Zhantao_Yang1;~Yurui_Zhu1;~Kai_Zhu4;~Yu_Liu23;~Zheng-Jun_Zha2;~Xueyang_Fu2", "aff": "University of Science and Technology of China;University of Science and Technology of China;Shanghai Jiaotong University;University of Science and Technology of China;Shanghai Jiaotong University;University of Science and Technology of China;University of Science and Technology of China;Alibaba Group;University of Science and Technology of China;University of Science and Technology of China", "aff_domain": "mail.ustc.edu.cn;mail.ustc.edu.cn;sjtu.edu.cn;ustc.edu.cn;sjtu.edu.cn;ustc.edu.cn;ustc.edu.cn;alibaba-inc.com;ustc.edu.cn;ustc.edu.cn", "position": "PhD student;PhD student;PhD student;MS student;PhD student;PhD student;Postdoc;Researcher;Full Professor;Associate Professor", "bibtex": "@inproceedings{\nxiao2024dreamclean,\ntitle={DreamClean: Restoring Clean Image Using Deep Diffusion Prior},\nauthor={Jie Xiao and Ruili Feng and Han Zhang and Zhiheng Liu and Zhantao Yang and Yurui Zhu and Xueyang Fu and Kai Zhu and Yu Liu and Zheng-Jun Zha},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=6ALuy19mPa}\n}", "github": "", "project": "", "reviewers": "HBur;aVXX;6gxh;NQCS", "pdf_size": 25702068, "rating": "6;6;8;8", "confidence": "4;5;3;5", "soundness": "2;3;3;4", "contribution": "3;3;4;4", "presentation": "3;3;3;3", "wc_summary": "91;41;193;101", "wc_strengths": "67;15;130;187", "wc_weaknesses": "137;55;115;76", "wc_questions": "101;3;55;22", "wc_review": "396;114;493;386", "wc_reply_reviewers": "78;0;11;0", "wc_reply_authors": "1532;267;421;257", "reply_reviewers": "1;0;1;0", "reply_authors": "4;2;1;2", "rating_avg": [ 7.0, 1.0 ], "confidence_avg": [ 4.25, 0.82915619758885 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 3.5, 0.5 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 106.5, 54.87030162118666 ], "wc_strengths_avg": [ 99.75, 64.77412677913921 ], "wc_weaknesses_avg": [ 95.75, 
32.104322138927024 ], "wc_questions_avg": [ 45.25, 37.1777823437601 ], "wc_review_avg": [ 347.25, 141.0024379221863 ], "wc_reply_reviewers_avg": [ 22.25, 32.4990384473141 ], "wc_reply_authors_avg": [ 619.25, 530.9709855538248 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 2.25, 1.0897247358851685 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 10, 0 ], "corr_rating_confidence": -0.30151134457776363, "gs_citation": 9, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=3194860137127022818&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 2, "openreview": "https://openreview.net/forum?id=6ALuy19mPa", "pdf": "https://openreview.net/pdf?id=6ALuy19mPa", "email": "mail.ustc.edu.cn;mail.ustc.edu.cn;sjtu.edu.cn;ustc.edu.cn;sjtu.edu.cn;ustc.edu.cn;ustc.edu.cn;alibaba-inc.com;ustc.edu.cn;ustc.edu.cn", "author_num": 10, "aff_unique_index": "0;0;1;0;1;0;0;2;0;0", "aff_unique_norm": "University of Science and Technology of China;Shanghai Jiao Tong University;Alibaba Group", "aff_unique_dep": ";;", "aff_unique_url": "http://www.ustc.edu.cn;https://www.sjtu.edu.cn;https://www.alibaba.com", "aff_unique_abbr": "USTC;SJTU;Alibaba", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0;0;0;0;0", "aff_country_unique": "China" }, { "title": "Enhancing Tail Performance in Extreme Classifiers by Label Variance Reduction", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19401", "id": "6ARlSgun7J", "author_site": "Anirudh Buvanesh, Rahul Chand, Jatin Prakash, Bhawna Paliwal, Mudit Dhawan, Neelabh Madan, Deepesh Hada, Vidit Jain, Sonu Mehta, Yashoteja Prabhu, Manish Gupta, Ramachandran Ramjee, Manik Varma", "tldr": "", "abstract": "Extreme Classification (XC) architectures, which utilize a massive One-vs-All (OvA) classifier layer at the output, have demonstrated remarkable performance on problems with large label sets. Nonetheless, these architectures falter on tail labels with few representative samples. This phenomenon has been attributed to factors such as classifier over-fitting and missing label bias, and solutions involving regularization and loss re-calibration have been developed. This paper explores the impact of label variance - a previously unexamined factor - on the tail performance in extreme classifiers. It also develops a method to systematically reduce label variance in XC by transferring the knowledge from a specialized tail-robust teacher model to the OvA classifiers. For this purpose, it proposes a principled knowledge distillation framework, LEVER, which enhances the tail performance in extreme classifiers with formal guarantees on generalization. Comprehensive experiments are conducted on a diverse set of XC datasets, demonstrating that LEVER can enhance tail performance by around 5\\% and 6\\% points in PSP and coverage metrics, respectively, when integrated with leading extreme classifiers. Moreover, it establishes a new state-of-the-art when added to the top-performing Renee classifier. Extensive ablations and analyses substantiate the efficacy of our design choices. Another significant contribution is the release of two new XC datasets that are different from and more challenging than the available benchmark datasets, thereby encouraging more rigorous algorithmic evaluation in the future. 
Code for LEVER is available at: aka.ms/lever.", "keywords": "Extreme Classification;Extreme Multi-Label Learning", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/d1abe5a93a22abd8a77bcd20c51efe61b261e95f.zip", "author": "Anirudh Buvanesh;Rahul Chand;Jatin Prakash;Bhawna Paliwal;Mudit Dhawan;Neelabh Madan;Deepesh Hada;Vidit Jain;SONU MEHTA;Yashoteja Prabhu;Manish Gupta;Ramachandran Ramjee;Manik Varma", "authorids": "~Anirudh_Buvanesh2;~Rahul_Chand1;~Jatin_Prakash2;~Bhawna_Paliwal1;~Mudit_Dhawan2;~Neelabh_Madan2;~Deepesh_Hada1;~Vidit_Jain2;~SONU_MEHTA1;~Yashoteja_Prabhu1;~Manish_Gupta4;~Ramachandran_Ramjee1;~Manik_Varma1", "gender": ";M;M;F;M;M;M;;F;;;;M", "homepage": ";https://rahulschand.github.io;https://github.com/bicycleman15;;https://mudit-dhawan.github.io/;https://github.com/neelabh17;https://www.microsoft.com/en-us/research/people/deepeshhada/;;https://sonumehta.github.io/;;;https://www.microsoft.com/en-us/research/people/ramjee/;http://manikvarma.org", "dblp": ";;294/5983;302/2497;;317/5192;;68/5650;246/5368;;;97/117.html;07/918.html", "google_scholar": ";;NeBK8VMAAAAJ;7BxDLWcAAAAJ;XmqUp9cAAAAJ;;PHYW-PAAAAAJ;;NcstulUAAAAJ;;;https://scholar.google.co.in/citations?user=0P35aLUAAAAJ;https://scholar.google.gr/citations?user=2efybZkAAAAJ", "orcid": ";;0009-0003-5474-6529;;;;;0000-0002-7911-1074;0000-0003-1654-3766;;;0000-0003-0007-6040;0000-0003-4516-6613", "linkedin": ";;;;;;deepesh-hada/;jvidit/;sonumehta2403/;;;;", "or_profile": "~Anirudh_Buvanesh2;~Rahul_Chand1;~Jatin_Prakash2;~Bhawna_Paliwal1;~Mudit_Dhawan2;~Neelabh_Madan2;~Deepesh_Hada1;~Vidit_Jain2;~SONU_MEHTA1;~Yashoteja_Prabhu1;~Manish_Gupta4;~Ramachandran_Ramjee1;~Manik_Varma1", "aff": ";;Microsoft Research;Microsoft Research;Microsoft;Microsoft;Microsoft;Microsoft Research, India;Indian Institute of Technology Delhi;;;Microsoft;Microsoft Research", "aff_domain": ";;microsoft.com;microsoft.com;microsoft.com;microsoft.com;microsoft.com;microsoft.com;cs.iitd.ac.in;;;microsoft.com;research.microsoft.com", "position": ";;Intern;Research Engineer;Intern;Intern;Researcher;Research SDE;PhD student;;;Researcher;Principal Researcher", "bibtex": "@inproceedings{\nbuvanesh2024enhancing,\ntitle={Enhancing Tail Performance in Extreme Classifiers by Label Variance Reduction},\nauthor={Anirudh Buvanesh and Rahul Chand and Jatin Prakash and Bhawna Paliwal and Mudit Dhawan and Neelabh Madan and Deepesh Hada and Vidit Jain and SONU MEHTA and Yashoteja Prabhu and Manish Gupta and Ramachandran Ramjee and Manik Varma},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=6ARlSgun7J}\n}", "github": "", "project": "", "reviewers": "UBHy;Cq1J;Uo9h;Kx6v", "pdf_size": 655392, "rating": "5;6;6;8", "confidence": "2;4;3;5", "soundness": "3;3;2;2", "contribution": "2;3;2;3", "presentation": "1;3;2;3", "wc_summary": "66;146;203;89", "wc_strengths": "54;66;84;13", "wc_weaknesses": "171;251;461;39", "wc_questions": "47;87;7;362", "wc_review": "338;550;755;503", "wc_reply_reviewers": "13;180;245;20", "wc_reply_authors": "584;841;896;1069", "reply_reviewers": "1;1;1;1", "reply_authors": "1;3;3;3", "rating_avg": [ 6.25, 1.0897247358851685 ], "confidence_avg": [ 3.5, 1.118033988749895 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.25, 0.82915619758885 ], "wc_summary_avg": [ 126.0, 53.146025251188824 ], "wc_strengths_avg": [ 54.25, 
26.099568961957974 ], "wc_weaknesses_avg": [ 230.5, 153.1037230115584 ], "wc_questions_avg": [ 125.75, 139.3007088998473 ], "wc_review_avg": [ 536.5, 148.70188297395563 ], "wc_reply_reviewers_avg": [ 114.5, 100.68887724073598 ], "wc_reply_authors_avg": [ 847.5, 173.8454773642386 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 2.5, 0.8660254037844386 ], "replies_avg": [ 22, 0 ], "authors#_avg": [ 13, 0 ], "corr_rating_confidence": 0.9233805168766388, "gs_citation": 7, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14304141305725231718&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=6ARlSgun7J", "pdf": "https://openreview.net/pdf?id=6ARlSgun7J", "email": ";;microsoft.com;microsoft.com;microsoft.com;microsoft.com;microsoft.com;microsoft.com;cs.iitd.ac.in;;;microsoft.com;research.microsoft.com", "author_num": 13, "aff_unique_index": "0;0;0;0;0;0;1;0;0", "aff_unique_norm": "Microsoft;Indian Institute of Technology Delhi", "aff_unique_dep": "Microsoft Research;", "aff_unique_url": "https://www.microsoft.com/en-us/research;https://www.iitd.ac.in", "aff_unique_abbr": "MSR;IIT Delhi", "aff_campus_unique_index": "1", "aff_campus_unique": ";Delhi", "aff_country_unique_index": "0;0;0;0;0;1;1;0;0", "aff_country_unique": "United States;India" }, { "id": "6AtXCnHCFy", "title": "FSN: Feature Shift Network for Load-Domain Domain Generalization", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Conventional deep learning methods for fault detection often assume that the training and the testing sets share the same fault pattern spaces and domain spaces. However, some fault patterns are rare, and many real-world faults have not appeared in the training set. As a result, it\u2019s hard for the trained model to achieve desirable performance on the testing set. \nIn this paper, we introduce a novel domain generalization, Load-Domain (LD) domain generalization, which is based on the analysis of the CWRU bearing dataset and its domain division method. For this scenario, we propose a feature shift model called FSN (Feature Shift Network). In the bearing dataset, domains are divided based on different operating conditions which have specific loads, so it\u2019s equivalent to load-based domain division. Moreover, the domain label corresponds to the actual load magnitude, making it unique as it contains physical information, which can boost detection accuracy on unknown domain beyond the training set. According to the knowledge above , FSN is trained for feature shift on adjacent source domains, and finally shifts target domain features into adjacent source domain feature space to achieve the purpose of domain generalization.\nExtensive experiments on CWRU demonstrate that FSN is better than the existed models in the LD domain generalization case. 
Furthermore, we have another test on MNIST, which also shows FSN can achieve the best performance.", "keywords": "Fault diagnosis;Deep learning;CNN;Domain Generalization;Load-domain Domain Generalization", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "", "author": "Heng Chen;Erkang Zhao;Lei Shi;Yuhui Zhou", "authorids": "~Heng_Chen1;~Erkang_Zhao1;~Lei_Shi17;~Yuhui_Zhou1", "gender": "M;M;M;M", "homepage": "https://gr.xjtu.edu.cn/web/hengchen;http://github.com/EkZzz;;https://zhou-yuhui.github.io/", "dblp": ";;;", "google_scholar": ";;;", "orcid": ";;0000-0003-0225-0460;", "linkedin": ";;;", "or_profile": "~Heng_Chen1;~Erkang_Zhao1;~Lei_Shi17;~Yuhui_Zhou1", "aff": "Xi'an Jiaotong University;Xi'an Jiaotong University;;Xi'an Jiaotong University", "aff_domain": "xjtu.edu.cn;xjtu.edu.cn;;xjtu.edu.cn", "position": "Associate Professor;MS student;;MS student", "bibtex": "@misc{\nchen2024fsn,\ntitle={{FSN}: Feature Shift Network for Load-Domain Domain Generalization},\nauthor={Heng Chen and Erkang Zhao and Lei Shi and Yuhui Zhou},\nyear={2024},\nurl={https://openreview.net/forum?id=6AtXCnHCFy}\n}", "github": "", "project": "", "reviewers": "gaFV;nQ8N;u8DP;xHmt;NDUe;2Hv6;4bLC;hzsf", "site": "https://openreview.net/forum?id=6AtXCnHCFy", "pdf_size": 490579, "rating": "3;3;3;3;3;3;5;6", "confidence": "5;3;4;4;4;3;3;4", "soundness": "1;2;2;2;2;2;2;2", "contribution": "1;2;2;2;2;1;2;2", "presentation": "2;2;2;1;2;1;2;4", "wc_summary": "59;65;104;51;55;52;82;142", "wc_strengths": "13;49;57;24;36;35;36;120", "wc_weaknesses": "39;280;140;91;161;88;80;58", "wc_questions": "73;36;16;2;21;48;29;50", "wc_review": "184;430;317;168;273;223;227;370", "wc_reply_reviewers": "0;0;0;0;0;0;0;0", "wc_reply_authors": "0;0;0;0;0;0;0;0", "reply_reviewers": "0;0;0;0;0;0;0;0", "reply_authors": "0;0;0;0;0;0;0;0", "rating_avg": [ 3.625, 1.1110243021644486 ], "confidence_avg": [ 3.75, 0.6614378277661477 ], "soundness_avg": [ 1.875, 0.33071891388307384 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 2.0, 0.8660254037844386 ], "wc_summary_avg": [ 76.25, 30.05723706530592 ], "wc_strengths_avg": [ 46.25, 30.617601147052653 ], "wc_weaknesses_avg": [ 117.125, 72.01117534799721 ], "wc_questions_avg": [ 34.375, 20.969844420023723 ], "wc_review_avg": [ 274.0, 86.27572080255256 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 8, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.12757297666876868, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:vJ8oK8uqn9gJ:scholar.google.com/&scioq=FSN:+Feature+Shift+Network+for+Load-Domain+Domain+Generalization&hl=en&as_sdt=0,5", "gs_version_total": 3, "aff_unique_index": "0;0;0", "aff_unique_norm": "Xi'an Jiao Tong University", "aff_unique_dep": "", "aff_unique_url": "https://www.xjtu.edu.cn", "aff_unique_abbr": "XJTU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "China" }, { "id": "6CGBfHtFRM", "title": "Mean Field Langevin Actor-Critic: Faster Convergence and Global Optimality beyond Lazy Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "We study how deep reinforcement learning algorithms learn meaningful features when optimized for finding the optimal policy. 
\nIn particular, we focus on a version of the neural actor-critic algorithm where both the actor and critic are represented by over-parameterized neural networks in the mean-field regime, and are updated via temporal-difference (TD) and policy gradient respectively. \nSpecifically, for the critic neural network to perform policy evaluation, \nwe propose $\\textit{mean-field Langevin TD learning}$ method (MFLTD), an extension of the mean-field Langevin dynamics with proximal TD updates, and compare its effectiveness against existing methods through numerical experiments. \nIn addition, for the actor neural network to perform policy updates, \nwe propose $\\textit{mean-field Langevin policy gradient}$ (MFLPG), which implements policy gradient in the policy space through a version of Wasserstein gradient flow in the space of network parameters. \nWe prove that MFLTD finds the correct value function, and the sequence of actors created by MFLPG created by the algorithm converges linearly to the globally optimal policy of the Kullback Leibler divergence regularized objective. To our best knowledge, \nwe provide the first linear convergence guarantee for neural actor-critic algorithms with $\\textit{global optimality}$ and $\\textit{feature learning}$.", "keywords": "policy gradient method;temporal-difference learning;actor-critic;global optimality;linear convergence;neural network;mean field;feature learning", "primary_area": "learning theory", "supplementary_material": "/attachment/da8e31443087f67c5dd4dd3151c2a27965b2760d.pdf", "author": "Kakei Yamamoto;Kazusato Oko;Zhuoran Yang;Taiji Suzuki", "authorids": "~Kakei_Yamamoto1;~Kazusato_Oko1;~Zhuoran_Yang1;~Taiji_Suzuki1", "gender": "M;M;M;M", "homepage": ";;https://zhuoranyang.github.io/;http://ibis.t.u-tokyo.ac.jp/suzuki/", "dblp": "334/7773;;;08/312", "google_scholar": "https://scholar.google.com/citations?hl=ja;;;x8osrBsAAAAJ", "orcid": "0000-0002-6231-2750;;;", "linkedin": "kakei-yamamoto-bb37461a0/;kazusatooko/;;", "or_profile": "~Kakei_Yamamoto1;~Kazusato_Oko1;~Zhuoran_Yang1;~Taiji_Suzuki1", "aff": "Massachusetts Institute of Technology;The University of Tokyo;Yale University;The University of Tokyo", "aff_domain": "mit.edu;u-tokyo.ac.jp;yale.edu;tokyo.ac.jp", "position": "PhD student;MS student;Assistant Professor;Associate Professor", "bibtex": "@misc{\nyamamoto2024mean,\ntitle={Mean Field Langevin Actor-Critic: Faster Convergence and Global Optimality beyond Lazy Learning},\nauthor={Kakei Yamamoto and Kazusato Oko and Zhuoran Yang and Taiji Suzuki},\nyear={2024},\nurl={https://openreview.net/forum?id=6CGBfHtFRM}\n}", "github": "", "project": "", "reviewers": "1VQp;fWZz;GTpe;XKHS;Xd7S", "site": "https://openreview.net/forum?id=6CGBfHtFRM", "pdf_size": 489793, "rating": "5;5;5;5;6", "confidence": "2;5;3;3;3", "soundness": "2;3;3;3;2", "contribution": "2;2;2;2;3", "presentation": "3;3;2;3;2", "wc_summary": "73;118;160;116;128", "wc_strengths": "17;50;82;29;64", "wc_weaknesses": "37;151;579;56;155", "wc_questions": "74;378;2;23;209", "wc_review": "201;697;823;224;556", "wc_reply_reviewers": "38;48;0;0;0", "wc_reply_authors": "889;703;1171;686;908", "reply_reviewers": "1;1;0;0;0", "reply_authors": "2;2;2;1;2", "rating_avg": [ 5.2, 0.39999999999999997 ], "confidence_avg": [ 3.2, 0.9797958971132712 ], "soundness_avg": [ 2.6, 0.4898979485566356 ], "contribution_avg": [ 2.2, 0.39999999999999997 ], "presentation_avg": [ 2.6, 0.4898979485566356 ], "wc_summary_avg": [ 119.0, 27.885480092693403 ], "wc_strengths_avg": [ 48.4, 23.397435756937128 ], 
"wc_weaknesses_avg": [ 195.6, 197.6234803863144 ], "wc_questions_avg": [ 137.2, 140.32448111430878 ], "wc_review_avg": [ 500.2, 249.7401849923236 ], "wc_reply_reviewers_avg": [ 17.2, 21.301643129110957 ], "wc_reply_authors_avg": [ 871.4, 175.5797254810475 ], "reply_reviewers_avg": [ 0.4, 0.48989794855663565 ], "reply_authors_avg": [ 1.8, 0.4 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.10206207261596577, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=9644032660721430589&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "aff_unique_index": "0;1;2;1", "aff_unique_norm": "Massachusetts Institute of Technology;University of Tokyo;Yale University", "aff_unique_dep": ";;", "aff_unique_url": "https://web.mit.edu;https://www.u-tokyo.ac.jp;https://www.yale.edu", "aff_unique_abbr": "MIT;UTokyo;Yale", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;0;1", "aff_country_unique": "United States;Japan" }, { "title": "Two-timescale Extragradient for Finding Local Minimax Points", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19400", "id": "6CIGhcJYJH", "author_site": "Jiseok Chae, Kyuwon Kim, Donghwan Kim", "tldr": "", "abstract": "Minimax problems are notoriously challenging to optimize. However, we present that the two-timescale extragradient method can be a viable solution. By utilizing dynamical systems theory, we show that it converges to points that satisfy the second-order necessary condition of local minimax points, under mild conditions that the two-timescale gradient descent ascent fails to work. This work provably improves upon all previous results on finding local minimax points, by eliminating a crucial assumption that the Hessian with respect to the maximization variable is nondegenerate.", "keywords": "Minimax optimization;Nonconvex-nonconcave optimization;Extragradient method;Dynamical systems", "primary_area": "optimization", "supplementary_material": "", "author": "Jiseok Chae;Kyuwon Kim;Donghwan Kim", "authorids": "~Jiseok_Chae1;~Kyuwon_Kim1;~Donghwan_Kim2", "gender": "M;M;M", "homepage": "https://jsch8q.github.io/;https://kaist-kyuwonkim.github.io/;http://mathsci.kaist.ac.kr/~donghwankim/", "dblp": "348/5478;119/9250;05/1032", "google_scholar": ";;https://scholar.google.com/citations?hl=en", "orcid": "0009-0009-0672-3422;0009-0002-6967-9907;", "linkedin": ";;", "or_profile": "~Jiseok_Chae1;~Kyuwon_Kim1;~Donghwan_Kim2", "aff": "Korea Advanced Institute of Science & Technology;Korea Advanced Institute of Science & Technology;Korea Advanced Institute of Science & Technology", "aff_domain": "kaist.edu;kaist.edu;kaist.ac.kr", "position": "PhD student;PhD student;Assistant Professor", "bibtex": "@inproceedings{\nchae2024twotimescale,\ntitle={Two-timescale Extragradient for Finding Local Minimax Points},\nauthor={Jiseok Chae and Kyuwon Kim and Donghwan Kim},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=6CIGhcJYJH}\n}", "github": "", "project": "", "reviewers": "8GfH;aBEe;dqsM;yB9R", "pdf_size": 627451, "rating": "6;6;8;8", "confidence": "3;2;3;3", "soundness": "3;3;4;3", "contribution": "3;2;4;3", "presentation": "2;3;2;3", "wc_summary": "82;89;119;78", "wc_strengths": "71;67;125;21", "wc_weaknesses": "216;68;273;234", "wc_questions": "2;60;46;58", "wc_review": "371;284;563;391", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "631;337;703;420", 
"reply_reviewers": "0;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 7.0, 1.0 ], "confidence_avg": [ 2.75, 0.4330127018922193 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 3.0, 0.7071067811865476 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 92.0, 16.077935190813527 ], "wc_strengths_avg": [ 71.0, 36.851051545376556 ], "wc_weaknesses_avg": [ 197.75, 77.6929050814809 ], "wc_questions_avg": [ 41.5, 23.425413550244958 ], "wc_review_avg": [ 402.25, 101.15180423502093 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 522.75, 149.38938215281567 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.5773502691896257, "gs_citation": 6, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12522265416593365909&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=6CIGhcJYJH", "pdf": "https://openreview.net/pdf?id=6CIGhcJYJH", "email": "kaist.edu;kaist.edu;kaist.ac.kr", "author_num": 3, "aff_unique_index": "0;0;0", "aff_unique_norm": "Korea Advanced Institute of Science and Technology", "aff_unique_dep": "", "aff_unique_url": "https://www.kaist.ac.kr", "aff_unique_abbr": "KAIST", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "South Korea" }, { "title": "DrS: Learning Reusable Dense Rewards for Multi-Stage Tasks", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19399", "id": "6CZ50WgfCG", "author_site": "Tongzhou Mu, Minghua Liu, Hao Su", "tldr": "", "abstract": "The success of many RL techniques heavily relies on human-engineered dense rewards, which typically demands substantial domain expertise and extensive trial and error. In our work, we propose **DrS** (**D**ense **r**eward learning from **S**tages), a novel approach for learning *reusable* dense rewards for multi-stage tasks in a data-driven manner. By leveraging the stage structures of the task, DrS learns a high-quality dense reward from sparse rewards and demonstrations if given. The learned rewards can be *reused* in unseen tasks, thus reducing the human effort for reward engineering. Extensive experiments on three physical robot manipulation task families with 1000+ task variants demonstrate that our learned rewards can be reused in unseen tasks, resulting in improved performance and sample efficiency of RL algorithms. The learned rewards even achieve comparable performance to human-engineered rewards on some tasks. 
See our [project page](https://sites.google.com/view/iclr24drs) for more details.", "keywords": "Reward Learning;Multi-stage Task", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/74e755c3aef53c3a0d8fbe89b8266993518bc85e.pdf", "author": "Tongzhou Mu;Minghua Liu;Hao Su", "authorids": "~Tongzhou_Mu1;~Minghua_Liu1;~Hao_Su1", "gender": "M;M;M", "homepage": "http://cseweb.ucsd.edu/~t3mu/;https://cseweb.ucsd.edu//~mil070/;http://ai.ucsd.edu/~haosu", "dblp": "183/0943;28/8907;09/4945-1", "google_scholar": "uVsZydYAAAAJ;6U3IGtEAAAAJ;1P8Zu04AAAAJ", "orcid": ";;", "linkedin": ";;", "or_profile": "~Tongzhou_Mu1;~Minghua_Liu1;~Hao_Su1", "aff": "University of California, San Diego;University of California, San Diego;University of California, San Diego", "aff_domain": "ucsd.edu;ucsd.edu;ucsd.edu", "position": "PhD student;PhD student;Associate Professor", "bibtex": "@inproceedings{\nmu2024drs,\ntitle={DrS: Learning Reusable Dense Rewards for Multi-Stage Tasks},\nauthor={Tongzhou Mu and Minghua Liu and Hao Su},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=6CZ50WgfCG}\n}", "github": "", "project": "", "reviewers": "oxbF;35ZH;GMmw;ck68", "pdf_size": 1634213, "rating": "3;6;8;8", "confidence": "4;4;3;3", "soundness": "2;2;4;4", "contribution": "1;2;4;3", "presentation": "2;3;4;4", "wc_summary": "89;62;131;126", "wc_strengths": "61;41;92;130", "wc_weaknesses": "175;165;20;104", "wc_questions": "39;235;89;14", "wc_review": "364;503;332;374", "wc_reply_reviewers": "814;401;0;25", "wc_reply_authors": "3046;2491;735;672", "reply_reviewers": "3;2;0;1", "reply_authors": "6;7;1;1", "rating_avg": [ 6.25, 2.0463381929681126 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 3.0, 1.0 ], "contribution_avg": [ 2.5, 1.118033988749895 ], "presentation_avg": [ 3.25, 0.82915619758885 ], "wc_summary_avg": [ 102.0, 28.222331583340168 ], "wc_strengths_avg": [ 81.0, 33.62290885690886 ], "wc_weaknesses_avg": [ 116.0, 61.72924752497798 ], "wc_questions_avg": [ 94.25, 85.63111292048002 ], "wc_review_avg": [ 393.25, 65.23563060168883 ], "wc_reply_reviewers_avg": [ 310.0, 331.51998431467143 ], "wc_reply_authors_avg": [ 1736.0, 1051.2162004078893 ], "reply_reviewers_avg": [ 1.5, 1.118033988749895 ], "reply_authors_avg": [ 3.75, 2.7726341266023544 ], "replies_avg": [ 29, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.8551861104941366, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=13580116662997845792&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=6CZ50WgfCG", "pdf": "https://openreview.net/pdf?id=6CZ50WgfCG", "email": "ucsd.edu;ucsd.edu;ucsd.edu", "author_num": 3, "aff_unique_index": "0;0;0", "aff_unique_norm": "University of California, San Diego", "aff_unique_dep": "", "aff_unique_url": "https://www.ucsd.edu", "aff_unique_abbr": "UCSD", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "San Diego", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "6CetUU9FSt", "title": "Visual Encoders for Data-Efficient Imitation Learning in Modern Video Games", "track": "main", "status": "Reject", "tldr": "", "abstract": "Video games have served as useful benchmarks for the decision making community, but going beyond Atari games towards training agents in modern games has been prohibitively expensive for the vast majority of the research community. 
Recent progress in the research, development and open release of large vision models has the potential to amortize some of these costs across the community. However, it is currently unclear which of these models have learnt representations that retain information critical for sequential decision making. Towards enabling wider participation in the research of gameplaying agents in modern games, we present a systematic study of imitation learning with publicly available visual encoders compared to the typical, task-specific, end-to-end training approach in Minecraft, Minecraft Dungeons and Counter-Strike: Global Offensive.", "keywords": "Imitation Learning;Visual Encoders", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Lukas Sch\u00e4fer;Logan Jones;Anssi Kanervisto;Yuhan Cao;Tabish Rashid;Raluca Georgescu;David Bignell;Siddhartha Sen;Andrea Trevi\u00f1o Gavito;Sam Devlin", "authorids": "~Lukas_Sch\u00e4fer1;~Logan_Jones1;~Anssi_Kanervisto1;~Yuhan_Cao1;~Tabish_Rashid1;~Raluca_Georgescu1;~David_Bignell1;~Siddhartha_Sen1;~Andrea_Trevi\u00f1o_Gavito1;~Sam_Devlin2", "gender": "M;M;M;;M;F;M;;F;M", "homepage": "https://lukaschaefer.com/;;;https://yyyuhan.github.io/;;http://aka.ms/raluca;;http://sidsen.org;;", "dblp": ";;186/7786;;196/5069;;183/0963;;;64/7502", "google_scholar": "-yp0O_IAAAAJ;;https://scholar.google.fi/citations?user=iPimqbwAAAAJ;;d4BeWwcAAAAJ;;;;;https://scholar.google.com/citations?hl=en", "orcid": ";;0000-0002-7479-4574;;;;;;0000-0002-8032-5600;0000-0002-7769-3090", "linkedin": "lukas-schaefer/;loganbjones16/;;yuhan-cao-859633129/;;;;;andrea-trevino-gavito/;https://www.linkedin.com/pub/sam-devlin/83/810/b23", "or_profile": "~Lukas_Sch\u00e4fer1;~Logan_Jones1;~Anssi_Kanervisto1;~Yuhan_Cao1;~Tabish_Rashid1;~Raluca_Georgescu1;~David_Bignell1;~Siddhartha_Sen1;~Andrea_Trevi\u00f1o_Gavito1;~Sam_Devlin2", "aff": "University of Edinburgh;;Microsoft;;Microsoft;Microsoft;Microsoft Research;Microsoft Research;Microsoft;Microsoft Research", "aff_domain": "ed.ac.uk;;microsoft.com;;microsoft.com;microsoft.com;research.microsoft.com;research.microsoft.com;microsoft.com;microsoft.com", "position": "PhD student;;Researcher;;Researcher;Researcher;Researcher;Principal Researcher;Researcher;Principal Researcher", "bibtex": "@misc{\nsch{\\\"a}fer2024visual,\ntitle={Visual Encoders for Data-Efficient Imitation Learning in Modern Video Games},\nauthor={Lukas Sch{\\\"a}fer and Logan Jones and Anssi Kanervisto and Yuhan Cao and Tabish Rashid and Raluca Georgescu and David Bignell and Siddhartha Sen and Andrea Trevi{\\~n}o Gavito and Sam Devlin},\nyear={2024},\nurl={https://openreview.net/forum?id=6CetUU9FSt}\n}", "github": "", "project": "", "reviewers": "sq4s;bAy4;JgYZ;yJPq", "site": "https://openreview.net/forum?id=6CetUU9FSt", "pdf_size": 6610292, "rating": "1;3;3;3", "confidence": "5;5;5;4", "soundness": "2;2;2;2", "contribution": "1;2;2;2", "presentation": "3;3;3;2", "wc_summary": "147;73;55;232", "wc_strengths": "24;66;58;105", "wc_weaknesses": "64;523;310;291", "wc_questions": "104;67;21;3", "wc_review": "339;729;444;631", "wc_reply_reviewers": "0;295;183;77", "wc_reply_authors": "980;1221;990;1313", "reply_reviewers": "0;1;1;1", "reply_authors": "2;2;3;3", "rating_avg": [ 2.5, 0.8660254037844386 ], "confidence_avg": [ 4.75, 0.4330127018922193 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 126.75, 69.86549577581197 ], "wc_strengths_avg": [ 63.25, 
28.80429655450728 ], "wc_weaknesses_avg": [ 297.0, 162.4576867987477 ], "wc_questions_avg": [ 48.75, 39.52451770736741 ], "wc_review_avg": [ 535.75, 152.92706594975266 ], "wc_reply_reviewers_avg": [ 138.75, 111.17188268622601 ], "wc_reply_authors_avg": [ 1126.0, 144.74632983257297 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 2.5, 0.5 ], "replies_avg": [ 22, 0 ], "authors#_avg": [ 10, 0 ], "corr_rating_confidence": -0.3333333333333333, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=8913380107900966404&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "aff_unique_index": "0;1;1;1;1;1;1;1", "aff_unique_norm": "University of Edinburgh;Microsoft", "aff_unique_dep": ";Microsoft Corporation", "aff_unique_url": "https://www.ed.ac.uk;https://www.microsoft.com", "aff_unique_abbr": "Edinburgh;Microsoft", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;1;1;1;1;1;1", "aff_country_unique": "United Kingdom;United States" }, { "id": "6CfJp9NG6Q", "title": "STUDY: Socially Aware Temporally Causal Decoder Recommender Systems", "track": "main", "status": "Reject", "tldr": "", "abstract": "Recommender systems are widely used to help people find items that are tailored to their interests. These interests are often influenced by social networks, making it important to use social network information effectively in recommender systems, especially for demographic groups with interests that differ from the majority. This paper introduces STUDY, a Socially-aware Temporally caUsal Decoder recommender sYstem. The STUDY architecture is significantly more efficient to learn and train than existing methods and performs joint inference over socially-connected groups in a single forward pass of a modified transformer decoder network. We demonstrate the benefits of STUDY in the recommendation of books for students who have dyslexia or are struggling readers. Students with dyslexia often have difficulty engaging with reading material, making it critical to recommend books that are tailored to their interests. We worked with our non-profit partner Learning Ally to evaluate STUDY on a dataset of struggling readers. 
STUDY was able to generate recommendations that more accurately predicted student engagement, when compared with existing methods.", "keywords": "Recommender Systems; Transformers; Social Recommendations; Education", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/4719c6fd638fdabc3b1e3512120869a526db8e4b.pdf", "author": "Eltayeb Ahmed;Diana Mincu;Lauren Harrell;Katherine A Heller;Subhrajit Roy", "authorids": "~Eltayeb_Ahmed1;~Diana_Mincu1;~Lauren_Harrell1;~Katherine_A_Heller1;~Subhrajit_Roy1", "gender": "F;;F;M;M", "homepage": ";;;;https://uniquecreed.co.uk", "dblp": ";;32/4403;73/8829;", "google_scholar": "1Fg7f78AAAAJ;G2scKbkAAAAJ;;;4PAd9qgAAAAJ", "orcid": ";;;;", "linkedin": ";lauren-harrell-00829315;;subhrajit-roy-7aa18123/;", "or_profile": "~Diana_Mincu1;~Lauren_Harrell1;~Katherine_A_Heller1;~Subhrajit_Roy1;~Eltayeb_Khalid_Eltayeb_Ahmed1", "aff": "Google;Google;Google;Google;University of Oxford", "aff_domain": "google.com;google.com;google.com;google.com;eng.ox.ac.uk", "position": "Software Engineer;Data Scientist ;Researcher;Researcher;PhD student", "bibtex": "@misc{\nahmed2024study,\ntitle={{STUDY}: Socially Aware Temporally Causal Decoder Recommender Systems},\nauthor={Eltayeb Ahmed and Diana Mincu and Lauren Harrell and Katherine A Heller and Subhrajit Roy},\nyear={2024},\nurl={https://openreview.net/forum?id=6CfJp9NG6Q}\n}", "github": "", "project": "", "reviewers": "Trnv;5grQ;54vF;fvs5;GC3n", "site": "https://openreview.net/forum?id=6CfJp9NG6Q", "pdf_size": 319426, "rating": "1;3;5;5;5", "confidence": "5;3;5;4;3", "soundness": "3;2;3;3;3", "contribution": "2;2;2;3;2", "presentation": "2;2;2;2;2", "wc_summary": "64;34;24;84;73", "wc_strengths": "23;54;40;138;66", "wc_weaknesses": "227;88;105;267;86", "wc_questions": "139;198;39;78;4", "wc_review": "453;374;208;567;229", "wc_reply_reviewers": "0;0;0;0;0", "wc_reply_authors": "0;0;0;0;0", "reply_reviewers": "0;0;0;0;0", "reply_authors": "0;0;0;0;0", "rating_avg": [ 3.8, 1.6 ], "confidence_avg": [ 4.0, 0.8944271909999159 ], "soundness_avg": [ 2.8, 0.39999999999999997 ], "contribution_avg": [ 2.2, 0.39999999999999997 ], "presentation_avg": [ 2.0, 0.0 ], "wc_summary_avg": [ 55.8, 22.999130418344084 ], "wc_strengths_avg": [ 64.2, 39.58989770130759 ], "wc_weaknesses_avg": [ 154.6, 76.78176866939182 ], "wc_questions_avg": [ 91.6, 69.56033352421478 ], "wc_review_avg": [ 366.2, 135.4745732600771 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 7, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.2795084971874737, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:4owZXOfIqdwJ:scholar.google.com/&scioq=STUDY:+Socially+Aware+Temporally+Causal+Decoder+Recommender+Systems&hl=en&as_sdt=0,33", "gs_version_total": 4, "aff_unique_index": "0;0;0;0;1", "aff_unique_norm": "Google;University of Oxford", "aff_unique_dep": "Google;", "aff_unique_url": "https://www.google.com;https://www.ox.ac.uk", "aff_unique_abbr": "Google;Oxford", "aff_campus_unique_index": "0;0;0;0", "aff_campus_unique": "Mountain View;", "aff_country_unique_index": "0;0;0;0;1", "aff_country_unique": "United States;United Kingdom" }, { "id": "6EQbYM0CIX", "title": "Conditional Generative Modeling for High-dimensional Marked Temporal Point Processes", "track": "main", "status": "Reject", "tldr": "", "abstract": "Point processes offer a versatile framework for sequential event 
modeling. However, the computational challenges and constrained representational power of the existing point process models have impeded their potential for wider applications. This limitation becomes especially pronounced when dealing with event data that is associated with multi-dimensional or high-dimensional marks such as texts or images. To address this challenge, this study proposes a novel event generative framework for modeling point processes with high-dimensional marks. We aim to capture the distribution of events without explicitly specifying the conditional intensity or probability density function. Instead, we use a conditional generator that takes the history of events as input and generates the high-quality subsequent event that is likely to occur given the prior observations. The proposed framework offers a host of benefits, including considerable representational power to capture intricate dynamics in multi- or even high-dimensional event space, as well as exceptional efficiency in learning the model and generating samples. Our numerical results demonstrate superior performance compared to other state-of-the-art baselines.", "keywords": "marked temporal point processes;conditional generative models", "primary_area": "generative models", "supplementary_material": "/attachment/d6acd13ff20d361216f4d5ab426a8e922304e740.pdf", "author": "Zheng Dong;Zekai Fan;Shixiang Zhu", "authorids": "~Zheng_Dong3;~Zekai_Fan1;~Shixiang_Zhu1", "gender": "M;;M", "homepage": "https://sites.google.com/view/zheng-dong/home;;https://sites.google.com/view/woodyzhu", "dblp": ";;133/3853", "google_scholar": "iqZN-q4AAAAJ;;v6_Gv6IAAAAJ", "orcid": "0000-0002-1505-8569;;0000-0002-2241-6096", "linkedin": "zheng-dong-23a264222/;;shixiang-zhu-26b956a0/", "or_profile": "~Zheng_Dong3;~Zekai_Fan1;~Shixiang_Zhu1", "aff": "Georgia Institute of Technology;;Carnegie Mellon University", "aff_domain": "gatech.edu;;cmu.edu", "position": "PhD student;;Assistant Professor", "bibtex": "@misc{\ndong2024conditional,\ntitle={Conditional Generative Modeling for High-dimensional Marked Temporal Point Processes},\nauthor={Zheng Dong and Zekai Fan and Shixiang Zhu},\nyear={2024},\nurl={https://openreview.net/forum?id=6EQbYM0CIX}\n}", "github": "", "project": "", "reviewers": "LQDX;GHUR;AoCo", "site": "https://openreview.net/forum?id=6EQbYM0CIX", "pdf_size": 6032456, "rating": "3;3;5", "confidence": "3;3;5", "soundness": "2;3;2", "contribution": "2;2;3", "presentation": "3;2;3", "wc_summary": "72;50;80", "wc_strengths": "168;107;71", "wc_weaknesses": "286;480;223", "wc_questions": "58;2;4", "wc_review": "584;639;378", "wc_reply_reviewers": "107;377;0", "wc_reply_authors": "1591;2190;1014", "reply_reviewers": "2;2;0", "reply_authors": "4;4;2", "rating_avg": [ 3.6666666666666665, 0.9428090415820634 ], "confidence_avg": [ 3.6666666666666665, 0.9428090415820634 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 67.33333333333333, 12.684198393626966 ], "wc_strengths_avg": [ 115.33333333333333, 40.036094825655624 ], "wc_weaknesses_avg": [ 329.6666666666667, 109.36889665510738 ], "wc_questions_avg": [ 21.333333333333332, 25.940101944458295 ], "wc_review_avg": [ 533.6666666666666, 112.33976242730007 ], "wc_reply_reviewers_avg": [ 161.33333333333334, 158.63234922997964 ], "wc_reply_authors_avg": [ 1598.3333333333333, 480.127992194674 ], "reply_reviewers_avg": [ 
1.3333333333333333, 0.9428090415820634 ], "reply_authors_avg": [ 3.3333333333333335, 0.9428090415820634 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 1.0, "gs_citation": 4, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=875969137132098907&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "aff_unique_index": "0;1", "aff_unique_norm": "Georgia Institute of Technology;Carnegie Mellon University", "aff_unique_dep": ";", "aff_unique_url": "https://www.gatech.edu;https://www.cmu.edu", "aff_unique_abbr": "Georgia Tech;CMU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "id": "6Ey8mAuLiw", "title": "On the Power of Multitask Representation Learning with Gradient Descent", "track": "main", "status": "Reject", "tldr": "", "abstract": "Representation learning, particularly multi-task representation learning, has gained widespread popularity in various deep learning applications, ranging from computer vision to natural language processing, due to its remarkable generalization performance. Despite its growing use, our understanding of the underlying mechanisms remains limited. In this paper, we provide a theoretical analysis elucidating why multi-task representation learning outperforms its single-task counterpart in scenarios involving over-parameterized two-layer convolutional neural networks trained by gradient descent. Our analysis is based on a data model that encompasses both task-shared and task-specific features, a setting commonly encountered in real-world applications. We also present experiments on synthetic and real-world data to illustrate and validate our theoretical findings.", "keywords": "representation learning;multi-task learning;gradient descent;generalization", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Qiaobo Li;Zixiang Chen;Yihe Deng;Yiwen Kou;Yuan Cao;Quanquan Gu", "authorids": "~Qiaobo_Li1;~Zixiang_Chen1;~Yihe_Deng1;~Yiwen_Kou1;~Yuan_Cao1;~Quanquan_Gu1", "gender": "M;M;F;F;M;M", "homepage": ";https://sites.google.com/view/zxchen;;https://evankou.github.io/;https://yuancaohku.github.io/;http://web.cs.ucla.edu/~qgu/", "dblp": ";137/3624;230/8011;323/9058;;50/4597", "google_scholar": ";6nrCHr0AAAAJ;7Lix1poAAAAJ;https://scholar.google.com/citations?hl=en;-VGnHI4AAAAJ;GU9HgNAAAAAJ", "orcid": ";;;;;", "linkedin": "qiaobo-li-581815251/;;;yiwen-kou-5a444916b/;;", "or_profile": "~Qiaobo_Li1;~Zixiang_Chen1;~Yihe_Deng1;~Yiwen_Kou1;~Yuan_Cao1;~Quanquan_Gu1", "aff": "Department of Computer Science, University of Illinois at Urbana-Champaign; University of California, Los Angeles;University of California, Los Angeles;University of California, Los Angeles;University of Hong Kong;University of California, Los Angeles", "aff_domain": "cs.illinois.edu;cs.ucla.edu;ucla.edu;ucla.edu;hku.hk;cs.ucla.edu", "position": "PhD student;PhD student;PhD student;PhD student;Assistant Professor;Associate Professor", "bibtex": "@misc{\nli2024on,\ntitle={On the Power of Multitask Representation Learning with Gradient Descent},\nauthor={Qiaobo Li and Zixiang Chen and Yihe Deng and Yiwen Kou and Yuan Cao and Quanquan Gu},\nyear={2024},\nurl={https://openreview.net/forum?id=6Ey8mAuLiw}\n}", "github": "", "project": "", "reviewers": "vmJ4;yKNZ;rtpX;tYKP", "site": "https://openreview.net/forum?id=6Ey8mAuLiw", "pdf_size": 2129620, "rating": "3;6;6;6", "confidence": 
"3;3;2;4", "soundness": "2;3;3;3", "contribution": "2;3;2;3", "presentation": "2;3;3;3", "wc_summary": "48;71;73;67", "wc_strengths": "29;139;130;39", "wc_weaknesses": "149;161;269;79", "wc_questions": "19;103;192;156", "wc_review": "245;474;664;341", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "670;1616;1598;1211", "reply_reviewers": "0;0;0;0", "reply_authors": "2;3;3;2", "rating_avg": [ 5.25, 1.299038105676658 ], "confidence_avg": [ 3.0, 0.7071067811865476 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 64.75, 9.908960591303208 ], "wc_strengths_avg": [ 84.25, 50.47462233637811 ], "wc_weaknesses_avg": [ 164.5, 67.9760987406603 ], "wc_questions_avg": [ 117.5, 65.08648093114269 ], "wc_review_avg": [ 431.0, 157.18937623134713 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 1273.75, 384.2931010309709 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 2.5, 0.5 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:jnMKiirk250J:scholar.google.com/&scioq=On+the+Power+of+Multitask+Representation+Learning+with+Gradient+Descent&hl=en&as_sdt=0,47", "gs_version_total": 2, "aff_unique_index": "0;1;1;1;2;1", "aff_unique_norm": "University of Illinois Urbana-Champaign;University of California, Los Angeles;University of Hong Kong", "aff_unique_dep": "Department of Computer Science;;", "aff_unique_url": "https://illinois.edu;https://www.ucla.edu;https://www.hku.hk", "aff_unique_abbr": "UIUC;UCLA;HKU", "aff_campus_unique_index": "0;1;1;1;2;1", "aff_campus_unique": "Urbana-Champaign;Los Angeles;Hong Kong SAR", "aff_country_unique_index": "0;0;0;0;1;0", "aff_country_unique": "United States;China" }, { "id": "6FAH0SgQzO", "title": "FedRC: Tackling Diverse Distribution Shifts Challenge in Federated Learning by Robust Clustering", "track": "main", "status": "Reject", "tldr": "", "abstract": "Federated Learning (FL) is a machine learning paradigm that safeguards privacy by retaining client data on edge devices. However, optimizing FL in practice can be challenging due to the diverse and heterogeneous nature of the learning system. Though recent research has focused on improving the optimization of FL when distribution shifts occur among clients, ensuring global performance when multiple types of distribution shifts occur simultaneously among clients---such as feature distribution shift, label distribution shift, and concept shift---remain under-explored.\n\nIn this paper, we identify the learning challenges posed by the simultaneous occurrence of diverse distribution shifts and propose a clustering principle to overcome these challenges. Through our research, we find that existing methods fail to address the clustering principle. Therefore, we propose a novel clustering algorithm framework, dubbed as FedRC, which adheres to our proposed clustering principle by incorporating a bi-level optimization problem and a novel objective function. 
Extensive experiments demonstrate that FedRC significantly outperforms other SOTA cluster-based FL methods.\n Our code will be publicly available.", "keywords": "Deep Learning;Distribution Shifts;Generalization;Federated Learning", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/ad3c1cf78d293f8a6ab0728857203c21e2c32267.zip", "author": "Yongxin Guo;Xiaoying Tang;Tao Lin", "authorids": "~Yongxin_Guo1;~Xiaoying_Tang2;~Tao_Lin1", "gender": "M;F;M", "homepage": "https://gyxxyg.github.io/yongxinguo/;https://sse.cuhk.edu.cn/en/faculty/tangxiaoying;https://lins-lab.github.io/", "dblp": ";134/9714-2;64/4492-4.html", "google_scholar": "5Cl1GZwAAAAJ;https://scholar.google.com/citations?hl=zh-TW;QE9pa_cAAAAJ", "orcid": "0009-0001-8652-0722;0000-0003-3955-1195;0000-0002-3246-6935", "linkedin": ";;", "or_profile": "~Yongxin_Guo1;~Xiaoying_Tang2;~Tao_Lin1", "aff": "Tencent;The Chinese University of Hong Kong, Shenzhen;Westlake University", "aff_domain": "tencent.com;cuhk.edu.cn;westlake.edu", "position": "Intern;Assistant Professor;Assistant Professor", "bibtex": "@misc{\nguo2024fedrc,\ntitle={Fed{RC}: Tackling Diverse Distribution Shifts Challenge in Federated Learning by Robust Clustering},\nauthor={Yongxin Guo and Xiaoying Tang and Tao Lin},\nyear={2024},\nurl={https://openreview.net/forum?id=6FAH0SgQzO}\n}", "github": "", "project": "", "reviewers": "gsbU;kcSi;xiXR", "site": "https://openreview.net/forum?id=6FAH0SgQzO", "pdf_size": 3506410, "rating": "5;8;8", "confidence": "4;4;4", "soundness": "2;4;4", "contribution": "3;3;3", "presentation": "3;3;4", "wc_summary": "79;71;125", "wc_strengths": "229;65;62", "wc_weaknesses": "188;74;101", "wc_questions": "171;1;185", "wc_review": "667;211;473", "wc_reply_reviewers": "399;0;0", "wc_reply_authors": "3257;510;1515", "reply_reviewers": "2;0;0", "reply_authors": "7;1;3", "rating_avg": [ 7.0, 1.4142135623730951 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 3.3333333333333335, 0.9428090415820634 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 3.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 91.66666666666667, 23.79542439676633 ], "wc_strengths_avg": [ 118.66666666666667, 78.02706083290734 ], "wc_weaknesses_avg": [ 121.0, 48.641546028061235 ], "wc_questions_avg": [ 119.0, 83.63412381717565 ], "wc_review_avg": [ 450.3333333333333, 186.84991005855179 ], "wc_reply_reviewers_avg": [ 133.0, 188.09040379562165 ], "wc_reply_authors_avg": [ 1760.6666666666667, 1134.8322440881832 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.9428090415820634 ], "reply_authors_avg": [ 3.6666666666666665, 2.494438257849294 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 10, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=15939733531129246781&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 7, "aff_unique_index": "0;1;2", "aff_unique_norm": "Tencent;Chinese University of Hong Kong;Westlake University", "aff_unique_dep": "Tencent Holdings Limited;;", "aff_unique_url": "https://www.tencent.com;https://www.cuhk.edu.cn;https://www.westlake.edu.cn", "aff_unique_abbr": "Tencent;CUHK;WU", "aff_campus_unique_index": "1", "aff_campus_unique": ";Shenzhen", "aff_country_unique_index": "0;0;0", "aff_country_unique": "China" }, { "id": "6FvBXs8t8K", "title": "Learn from the Past: A Proxy based Adversarial Defense Framework to Boost Robustness", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "In light of the vulnerability 
of deep learning models to adversarial samples and the ensuing security issues, a range of methods, including Adversarial Training (AT) as a prominent representative, aimed at enhancing model robustness against various adversarial attacks, have seen rapid development. However, existing methods essentially assist the current state of target model to defend against parameter-oriented adversarial attacks with explicit or implicit computation burdens, which also suffers from unstable convergence behavior due to inconsistency of optimization trajectories. Diverging from previous work, this paper reconsiders the update rule of target model and corresponding deficiency to defend based on its current state. By introducing the historical state of the target model as a proxy, which is endowed with much prior information for defense, we formulate a two-stage update rule, resulting in a general adversarial defense framework, which we refer to as 'LAST' ($\\textbf{L}$earn from the P$\\textbf{ast}$). Besides, we devise a Self Distillation (SD) based defense objective to constrain the update process of the proxy model without the introduction of larger teacher models. Experimentally, we demonstrate consistent and significant performance enhancements by refining a series of single-step and multi-step AT methods (e.g., up to $\\bf 9.2$% and $\\bf 20.5$% improvement of Robust Accuracy (RA) on CIFAR10 and CIFAR100 datasets, respectively) across various datasets, backbones and attack modalities, and validate its ability to enhance training stability and ameliorate catastrophic overfitting issues meanwhile.", "keywords": "Adversarial training;adversarial defense framework;two-stage;proxy model;self distillation", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/415f2064094e2b00e3dd91de7e900bd34e3ed5c8.zip", "author": "Yaohua Liu;Jiaxin Gao;Zhu Liu;Xianghao Jiao;Xin Fan;Risheng Liu", "authorids": "~Yaohua_Liu1;~Jiaxin_Gao1;~Zhu_Liu3;~Xianghao_Jiao1;~Xin_Fan1;~Risheng_Liu1", "gender": "M;;M;M;M;", "homepage": ";;https://scholar.google.com/citations?user=WDjOXbIAAAAJ&hl=zh-CN;;http://dutmedia.org;https://rsliu.tech/", "dblp": "180/2847;;14/191-4.html;348/5634;87/3021-1;82/8066", "google_scholar": "6l4tf4kAAAAJ;;WDjOXbIAAAAJ;vMJatVIAAAAJ;ZJXY-LYAAAAJ;DzuhImQAAAAJ", "orcid": "0000-0002-9057-1645;;0000-0003-0975-2711;0009-0004-1032-169X;;", "linkedin": "%E8%80%80%E5%8D%8E-%E5%88%98-5786b2211/;;;;xin-fan-ab78464/;", "or_profile": "~Yaohua_Liu1;~Jiaxin_Gao1;~Zhu_Liu3;~Xianghao_Jiao1;~Xin_Fan1;~Risheng_Liu1", "aff": "Dalian University of Technology;;Dalian University of Technology;Dalian University of Technology;Dalian University of Technology;Dalian University of Technology", "aff_domain": "dlut.edu.cn;;dlut.edu.cn;dlut.edu.cn;dlut.edu.cn;dlut.edu.cn", "position": "PhD student;;PhD student;MS student;Full Professor;Full Professor", "bibtex": "@misc{\nliu2024learn,\ntitle={Learn from the Past: A Proxy based Adversarial Defense Framework to Boost Robustness},\nauthor={Yaohua Liu and Jiaxin Gao and Zhu Liu and Xianghao Jiao and Xin Fan and Risheng Liu},\nyear={2024},\nurl={https://openreview.net/forum?id=6FvBXs8t8K}\n}", "github": "", "project": "", "reviewers": "MeBp;9nzt;atuW;EcMM", "site": "https://openreview.net/forum?id=6FvBXs8t8K", "pdf_size": 4521833, "rating": "3;3;6;6", "confidence": "5;4;4;4", "soundness": "2;2;3;3", "contribution": "2;1;3;3", "presentation": "2;3;3;3", "wc_summary": "98;48;75;17", "wc_strengths": "34;26;63;30", "wc_weaknesses": 
"263;456;35;10", "wc_questions": "73;4;2;3", "wc_review": "468;534;175;60", "wc_reply_reviewers": "190;0;0;0", "wc_reply_authors": "1909;3025;531;471", "reply_reviewers": "1;0;0;0", "reply_authors": "4;6;2;2", "rating_avg": [ 4.5, 1.5 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.25, 0.82915619758885 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 59.5, 30.25309901481169 ], "wc_strengths_avg": [ 38.25, 14.566657131957214 ], "wc_weaknesses_avg": [ 191.0, 182.00686800228172 ], "wc_questions_avg": [ 20.5, 30.319135871591065 ], "wc_review_avg": [ 309.25, 197.39728341595787 ], "wc_reply_reviewers_avg": [ 47.5, 82.27241335952168 ], "wc_reply_authors_avg": [ 1484.0, 1059.443721959784 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 3.5, 1.6583123951777 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.5773502691896258, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:_6lK14kmeHMJ:scholar.google.com/&scioq=Learn+from+the+Past:+A+Proxy+based+Adversarial+Defense+Framework+to+Boost+Robustness&hl=en&as_sdt=0,5", "gs_version_total": 2, "aff_unique_index": "0;0;0;0;0", "aff_unique_norm": "Dalian University of Technology", "aff_unique_dep": "", "aff_unique_url": "http://www.dlut.edu.cn/", "aff_unique_abbr": "DUT", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "China" }, { "id": "6GySuKTJcd", "title": "Energy-Guided Continuous Entropic Barycenter Estimation for General Costs", "track": "main", "status": "Reject", "tldr": "", "abstract": "Optimal transport (OT) barycenters are a mathematically grounded way of averaging probability distributions while capturing their geometric properties. In a nutshell, the task is to take the average of a collection of probability distributions w.r.t. given OT discrepancies. We propose a novel algorithm for approximating the continuous Entropic OT (EOT) barycenter for arbitrary OT cost functions. Our approach builds upon the dual reformulation of the EOT problem based on weak OT, which has recently gained the attention of the ML community. Beyond its novelty, our method enjoys several advantageous properties: (i) we establish quality bounds for the recovered solution; (ii) this approach seemlessly interconnects with the Energy-Based Models (EBMs) learning procedure, enabling the use of well-tuned algorithms for the problem of interest; (iii) it provides an intuitive optimization scheme avoiding min-max, reinforce and other intricate technical tricks. For validation, we consider several low-dimensional scenarios and image-space setups, including *non-Euclidean* cost functions. 
Furthermore, we investigate the practical task of learning the barycenter on an image manifold generated by a pretrained generative model, opening up new directions for real-world applications.", "keywords": "energy-based model;generative model;optimal transport;entropic optimal transport barycenters;general optimal transport cost", "primary_area": "generative models", "supplementary_material": "/attachment/5c767d87daa2d7525106cf5a8715918e94d2abd9.zip", "author": "Alexander Kolesov;Petr Mokrov;Igor Udovichenko;Milena Gazdieva;Gudmund Pammer;Evgeny Burnaev;Alexander Korotin", "authorids": "~Alexander_Kolesov1;~Petr_Mokrov1;~Igor_Udovichenko1;~Milena_Gazdieva1;~Gudmund_Pammer1;~Evgeny_Burnaev1;~Alexander_Korotin2", "gender": "M;M;;F;M;M;", "homepage": "https://github.com/Kolessov;https://github.com/PetrMokrov;;;https://people.math.ethz.ch/~gpammer/;http://faculty.skoltech.ru/people/evgenyburnaev;", "dblp": "287/4380;;;309/6585;;144/7845;", "google_scholar": "WyAI_wUAAAAJ;CRsi4IkAAAAJ;;h52_Zx8AAAAJ;ipItetYAAAAJ;https://scholar.google.ru/citations?user=pCRdcOwAAAAJ;", "orcid": ";;;0000-0003-0047-1577;0000-0003-2494-8739;0000-0001-8424-0690;", "linkedin": ";;;;;;", "or_profile": "~Alexander_Kolesov1;~Petr_Mokrov1;~Igor_Udovichenko1;~Milena_Gazdieva1;~Gudmund_Pammer1;~Evgeny_Burnaev1;~Alexander_Korotin2", "aff": "The Skolkovo Institute of Science and Technology;Skolkovo Institute of Science and Technology;;Skolkovo Institute of Science and Technology;ETHZ - ETH Zurich;Skolkovo Institute of Science and Technology;", "aff_domain": "skoltech.ru;skolkovotech.ru;;skoltech.ru;ethz.ch;skoltech.ru;", "position": "PhD student;PhD student;;PhD student;Postdoc;Full Professor;", "bibtex": "@misc{\nkolesov2024energyguided,\ntitle={Energy-Guided Continuous Entropic Barycenter Estimation for General Costs},\nauthor={Alexander Kolesov and Petr Mokrov and Igor Udovichenko and Milena Gazdieva and Gudmund Pammer and Evgeny Burnaev and Alexander Korotin},\nyear={2024},\nurl={https://openreview.net/forum?id=6GySuKTJcd}\n}", "github": "", "project": "", "reviewers": "BAkA;97mW;16og;7U49", "site": "https://openreview.net/forum?id=6GySuKTJcd", "pdf_size": 10770669, "rating": "5;6;6;8", "confidence": "3;4;3;3", "soundness": "3;3;3;4", "contribution": "2;2;3;3", "presentation": "3;3;3;4", "wc_summary": "79;94;64;70", "wc_strengths": "91;123;24;81", "wc_weaknesses": "110;307;74;42", "wc_questions": "264;49;134;3", "wc_review": "544;573;296;196", "wc_reply_reviewers": "148;29;64;14", "wc_reply_authors": "1355;1534;1248;176", "reply_reviewers": "1;1;1;1", "reply_authors": "3;3;2;1", "rating_avg": [ 6.25, 1.0897247358851685 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 76.75, 11.299889379989523 ], "wc_strengths_avg": [ 79.75, 35.73076405564258 ], "wc_weaknesses_avg": [ 133.25, 103.15855514691934 ], "wc_questions_avg": [ 112.5, 99.29375609775269 ], "wc_review_avg": [ 402.25, 160.52784026454725 ], "wc_reply_reviewers_avg": [ 63.75, 51.91519527074901 ], "wc_reply_authors_avg": [ 1078.25, 530.8410190443086 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 2.25, 0.82915619758885 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.13245323570650439, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=16650540745146647880&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 6, "aff_unique_index": "0;0;0;1;0", 
"aff_unique_norm": "Skolkovo Institute of Science and Technology;ETH Zurich", "aff_unique_dep": ";", "aff_unique_url": "https://www.skoltech.ru;https://www.ethz.ch", "aff_unique_abbr": "Skoltech;ETHZ", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;1;0", "aff_country_unique": "Russian Federation;Switzerland" }, { "title": "Personalize Segment Anything Model with One Shot", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19398", "id": "6Gzkhoc6YS", "author_site": "Renrui Zhang, Zhengkai Jiang, Ziyu Guo, Shilin Yan, Junting Pan, Hao Dong, Yu Qiao, Gao Peng, Hongsheng Li", "tldr": "", "abstract": "Driven by large-data pre-training, Segment Anything Model (SAM) has been demonstrated as a powerful promptable framework, revolutionizing the segmentation field. Despite the generality, customizing SAM for specific visual concepts without man-powered prompting is under-explored, e.g., automatically segmenting your pet dog in numerous images. In this paper, we introduce a training-free Personalization approach for SAM, termed PerSAM. Given only one-shot data, i.e., a single image with a reference mask, we first obtain a positive-negative location prior for the target concept in new images. Then, aided by target visual semantics, we empower SAM for personalized object segmentation via two proposed techniques: target-guided attention and target-semantic prompting. In this way, we can effectively customize the general-purpose SAM for private use without any training. To further alleviate the ambiguity of segmentation scales, we present an efficient one-shot fine-tuning variant, PerSAM-F. Freezing the entire SAM, we introduce a scale-aware fine-tuning to aggregate multi-scale masks, which only tunes 2 parameters within 10 seconds for improved performance. To demonstrate our efficacy, we construct a new dataset, PerSeg, for the evaluation of personalized object segmentation, and also test our methods on various one-shot image and video segmentation benchmarks. Besides, we propose to leverage PerSAM to improve DreamBooth for personalized text-to-image synthesis. By mitigating the disturbance of training-set backgrounds, our approach showcases better target appearance generation and higher fidelity to the input text prompt. 
Code is released at https://github.com/ZrrSkywalker/Personalize-SAM.", "keywords": "Segment Anything Model (SAM);one-shot learning;text-to-image generation", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "/attachment/9aa69c2ce9ae5d1634a5b7c812006ea90b1c64f0.pdf", "author": "Renrui Zhang;Zhengkai Jiang;Ziyu Guo;Shilin Yan;Junting Pan;Hao Dong;Yu Qiao;Peng Gao;Hongsheng Li", "authorids": "~Renrui_Zhang1;~Zhengkai_Jiang1;~Ziyu_Guo2;~Shilin_Yan1;~Junting_Pan2;~Hao_Dong3;~Yu_Qiao1;~Peng_Gao3;~Hongsheng_Li3", "gender": "M;;F;M;M;M;;;M", "homepage": ";;;https://scholar.google.com/citations?user=2VhjOykAAAAJ&hl=en;https://junting.github.io/;https://zsdonghao.github.io;;;http://www.ee.cuhk.edu.hk/~hsli", "dblp": "244/1748;;;166/3197.html;166/1669;14/1525-3.html;;;27/7402-1", "google_scholar": "YlL3xN4AAAAJ;;S9GLetwAAAAJ;2VhjOykAAAAJ;8Xt3TnAAAAAJ;xLFL4sMAAAAJ;;;BN2Ze-QAAAAJ", "orcid": ";;;;;0000-0003-2261-9122;;;", "linkedin": ";;;;junting-pan/;;;;", "or_profile": "~Renrui_Zhang1;~Zhengkai_Jiang1;~Ziyu_Guo2;~Shilin_Yan1;~Junting_Pan2;~Hao_Dong3;~Yu_Qiao1;~Peng_Gao3;~Hongsheng_Li3", "aff": "MMLab of CUHK & Shanghai AI Laboratory;;Department of Computer Science and Engineering, The Chinese University of Hong Kong;Fudan University;The Chinese University of Hong Kong;Peking University;;;The Chinese University of Hong Kong", "aff_domain": "pjlab.org.cn;;cse.cuhk.edu.hk;fudan.edu.cn;cuhk.edu.hk;pku.edu.cn;;;cuhk.edu.hk", "position": "PhD student;;PhD student;MS student;Postdoc;Assistant Professor;;;Associate Professor", "bibtex": "@inproceedings{\nzhang2024personalize,\ntitle={Personalize Segment Anything Model with One Shot},\nauthor={Renrui Zhang and Zhengkai Jiang and Ziyu Guo and Shilin Yan and Junting Pan and Hao Dong and Yu Qiao and Peng Gao and Hongsheng Li},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=6Gzkhoc6YS}\n}", "github": "", "project": "", "reviewers": "Fp1Y;XA1U;inm4", "pdf_size": 8743264, "rating": "6;6;8", "confidence": "5;4;5", "soundness": "3;3;4", "contribution": "2;3;4", "presentation": "3;3;4", "wc_summary": "74;223;59", "wc_strengths": "62;252;95", "wc_weaknesses": "112;111;64", "wc_questions": "35;58;87", "wc_review": "283;644;305", "wc_reply_reviewers": "24;23;26", "wc_reply_authors": "934;591;616", "reply_reviewers": "1;1;1", "reply_authors": "3;2;2", "rating_avg": [ 6.666666666666667, 0.9428090415820634 ], "confidence_avg": [ 4.666666666666667, 0.4714045207910317 ], "soundness_avg": [ 3.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 3.0, 0.816496580927726 ], "presentation_avg": [ 3.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 118.66666666666667, 74.02852303147904 ], "wc_strengths_avg": [ 136.33333333333334, 82.89082511888085 ], "wc_weaknesses_avg": [ 95.66666666666667, 22.395436042987765 ], "wc_questions_avg": [ 60.0, 21.275964529643932 ], "wc_review_avg": [ 410.6666666666667, 165.2358583627927 ], "wc_reply_reviewers_avg": [ 24.333333333333332, 1.247219128924647 ], "wc_reply_authors_avg": [ 713.6666666666666, 156.13313407331435 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 2.3333333333333335, 0.4714045207910317 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 9, 0 ], "corr_rating_confidence": 0.4999999999999999, "gs_citation": 233, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=3983746222204517152&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": 
"https://openreview.net/forum?id=6Gzkhoc6YS", "pdf": "https://openreview.net/pdf?id=6Gzkhoc6YS", "email": "pjlab.org.cn;;cse.cuhk.edu.hk;fudan.edu.cn;cuhk.edu.hk;pku.edu.cn;;;cuhk.edu.hk", "author_num": 9, "aff_unique_index": "0;0;1;0;2;0", "aff_unique_norm": "Chinese University of Hong Kong;Fudan University;Peking University", "aff_unique_dep": "MMLab;;", "aff_unique_url": "https://www.cuhk.edu.hk;https://www.fudan.edu.cn;http://www.pku.edu.cn", "aff_unique_abbr": "CUHK;Fudan;Peking U", "aff_campus_unique_index": "0;0;0;0", "aff_campus_unique": "Hong Kong SAR;", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "China" }, { "id": "6HABsUI6UF", "title": "Knowledge Accumulation in Continually Learned Representations and the Issue of Feature Forgetting", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "While it is established that neural networks suffer from catastrophic forgetting ``at the output level'', it is debated whether this is also the case at the level of representations. Some studies ascribe a certain level of innate robustness to representations, that they only forget minimally and no critical information, while others claim that representations are also severely affected by forgetting. To settle this debate, we first discuss how this apparent disagreement might stem from the coexistence of two phenomena that affect the quality of continually learned representations: knowledge accumulation and feature forgetting. We then show that, even though it is true that feature forgetting can be small in absolute terms, newly learned information is forgotten just as catastrophically at the level of representations as it is at the output level. Next we show that this feature forgetting is problematic as it substantially slows down knowledge accumulation. We further show that representations that are continually learned through both supervised and self-supervised learning suffer from feature forgetting. 
Finally, we study how feature forgetting and knowledge accumulation are affected by different types of continual learning methods.", "keywords": "continual learning;catastrophic forgetting;knowledge accumulation;conceptual analysis", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "/attachment/4358574358669e6f26ba2c5bdc9c8be3cb00bb89.pdf", "author": "Timm Hess;Eli Verwimp;Gido M van de Ven;Tinne Tuytelaars", "authorids": "~Timm_Hess1;~Eli_Verwimp1;~Gido_M_van_de_Ven1;~Tinne_Tuytelaars1", "gender": "M;M;;", "homepage": ";;;", "dblp": ";290/1282;;", "google_scholar": ";HIh4i18AAAAJ;;", "orcid": ";0000-0001-5469-3103;;", "linkedin": "timm-hess-2b8664137/;;;", "or_profile": "~Timm_Hess1;~Eli_Verwimp1;~Gido_M_van_de_Ven1;~Tinne_Tuytelaars1", "aff": "KU Leuven;Department of Electrical Engineering, KU Leuven, Belgium, KU Leuven;;", "aff_domain": "esat.kuleuven.be;esat.kuleuven.be;;", "position": "PhD student;PhD student;;", "bibtex": "@misc{\nhess2024knowledge,\ntitle={Knowledge Accumulation in Continually Learned Representations and the Issue of Feature Forgetting},\nauthor={Timm Hess and Eli Verwimp and Gido M van de Ven and Tinne Tuytelaars},\nyear={2024},\nurl={https://openreview.net/forum?id=6HABsUI6UF}\n}", "github": "", "project": "", "reviewers": "BtF4;acbx;1Fn7;gcjs", "site": "https://openreview.net/forum?id=6HABsUI6UF", "pdf_size": 425328, "rating": "3;3;3;6", "confidence": "4;5;4;5", "soundness": "2;2;3;3", "contribution": "1;1;2;3", "presentation": "2;1;2;2", "wc_summary": "53;88;52;96", "wc_strengths": "15;21;31;47", "wc_weaknesses": "141;460;198;53", "wc_questions": "1;1;2;92", "wc_review": "210;570;283;288", "wc_reply_reviewers": "27;0;16;0", "wc_reply_authors": "383;593;175;99", "reply_reviewers": "1;0;1;0", "reply_authors": "1;1;1;1", "rating_avg": [ 3.75, 1.299038105676658 ], "confidence_avg": [ 4.5, 0.5 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 1.75, 0.82915619758885 ], "presentation_avg": [ 1.75, 0.4330127018922193 ], "wc_summary_avg": [ 72.25, 19.954636052807377 ], "wc_strengths_avg": [ 28.5, 12.114041439585717 ], "wc_weaknesses_avg": [ 213.0, 151.6723442160765 ], "wc_questions_avg": [ 24.0, 39.26194085880116 ], "wc_review_avg": [ 337.75, 137.59791967904167 ], "wc_reply_reviewers_avg": [ 10.75, 11.431863365173676 ], "wc_reply_authors_avg": [ 312.5, 192.444147741624 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 10, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.5773502691896257, "gs_citation": 9, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=2275169797400754065&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 6, "aff_unique_index": "0;1", "aff_unique_norm": "Katholieke Universiteit Leuven;KU Leuven", "aff_unique_dep": ";Department of Electrical Engineering", "aff_unique_url": "https://www.kuleuven.be;https://www.kuleuven.be", "aff_unique_abbr": "KU Leuven;KU Leuven", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "Belgium" }, { "id": "6Hv6ADDy0L", "title": "Physics-aware Hand Object Interaction Denoising", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "The credibility and practicality of a reconstructed hand-object interaction sequence depend largely on its physical plausibility. However, due to high occlusions during hand-object interaction, physical plausibility remains a challenging criterion for purely vision-based tracking methods. 
To address this issue and enhance the results of existing hand trackers, this paper proposes a novel physically-aware hand motion de-noising method. Specifically, we introduce two learned loss terms that explicitly capture two crucial aspects of physical plausibility: grasp credibility and manipulation feasibility. These terms are used to train a physically-aware de-noising network. Qualitative and quantitative experiments demonstrate that our approach significantly improves both fine-grained physical plausibility and overall pose accuracy, surpassing current state-of-the-art de-noising methods.", "keywords": "physcis-aware neural network;hand motion denoising;hand object interaction", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/1a5f5cff33d6898be83b725ff59bac20fcd8c182.zip", "author": "Haowen Luo;Yunze Liu;Li Yi", "authorids": "~Haowen_Luo1;~Yunze_Liu2;~Li_Yi2", "gender": ";M;M", "homepage": ";https://yunzeliu.github.io;https://ericyi.github.io/", "dblp": ";282/1192;26/4239-1", "google_scholar": ";xYVEg0cAAAAJ;UyZL660AAAAJ", "orcid": ";0009-0002-3148-8822;", "linkedin": ";;", "or_profile": "~Haowen_Luo1;~Yunze_Liu2;~Li_Yi2", "aff": ";IIIS, Tsinghua University;Tsinghua University", "aff_domain": ";mails.tsinghua.edu.cn;tsinghua.edu.cn", "position": ";PhD student;Assistant Professor", "bibtex": "@misc{\nluo2024physicsaware,\ntitle={Physics-aware Hand Object Interaction Denoising},\nauthor={Haowen Luo and Yunze Liu and Li Yi},\nyear={2024},\nurl={https://openreview.net/forum?id=6Hv6ADDy0L}\n}", "github": "", "project": "", "reviewers": "CERf;Xkao;R2Kj;ZPXX", "site": "https://openreview.net/forum?id=6Hv6ADDy0L", "pdf_size": 3367826, "rating": "3;3;6;8", "confidence": "4;4;4;3", "soundness": "2;2;3;3", "contribution": "2;2;2;3", "presentation": "2;2;2;3", "wc_summary": "51;123;57;62", "wc_strengths": "47;26;26;124", "wc_weaknesses": "100;307;117;478", "wc_questions": "15;5;55;9", "wc_review": "213;461;255;673", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 5.0, 2.1213203435596424 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 73.25, 28.98598799420161 ], "wc_strengths_avg": [ 55.75, 40.32601517631019 ], "wc_weaknesses_avg": [ 250.5, 154.45144868210204 ], "wc_questions_avg": [ 21.0, 19.949937343260004 ], "wc_review_avg": [ 400.5, 183.1959333609783 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 7, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.8164965809277261, "gs_citation": 4, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=2704536020240165749&as_sdt=40005&sciodt=0,10&hl=en", "gs_version_total": 6, "aff_unique_index": "0;0", "aff_unique_norm": "Tsinghua University", "aff_unique_dep": "Institute for Interdisciplinary Information Sciences", "aff_unique_url": "https://www.tsinghua.edu.cn", "aff_unique_abbr": "THU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "China" }, { "id": "6HwamHLDa6", "title": "A Multi-In-Single-Out Network for Video Frame Interpolation without optical flow", "track": "main", "status": "Reject", "tldr": "", "abstract": "In general, deep 
learning-based video frame interpolation (VFI) methods have predominantly focused on estimating motion vectors between two input frames and warping them to the target time. While this approach has shown impressive performance for linear motion between two input frames, it exhibits limitations when dealing with occlusions and nonlinear movements. Recently, generative models have been applied to VFI to address these issues. However, as VFI is not a task focused on generating plausible images, but rather on predicting accurate intermediate frames between two given frames, performance limitations still persist. In this paper, we propose a multi-in-single-out (MISO) based VFI method that does not rely on motion vector estimation, allowing it to effectively model occlusions and nonlinear motion. Additionally, we introduce a novel motion perceptual loss that enables MISO-VFI to better capture the spatio-temporal correlations within the video frames. Our MISO-VFI method achieves state-of-the-art results on VFI benchmarks Vimeo90K, Middlebury, and UCF101, with a significant performance gap compared to existing approaches.", "keywords": "Video Frame Interpolation;Video Synthesis", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/e5c88df169fad3ee2b360b46dbdfd5138a18ddfd.zip", "author": "Jaemin Lee;Minseok Seo;Sangwoo Lee;Hyobin Park;Dong-Geol Choi", "authorids": "~Jaemin_Lee2;~Minseok_Seo1;~Sangwoo_Lee2;~Hyobin_Park1;~Dong-Geol_Choi2", "gender": "M;M;M;;F", "homepage": "https://sites.google.com/view/j911/home;https://sites.google.com/view/minseokcv/%ED%99%88;;;https://github.com/hbp001", "dblp": "45/3500;;31/5983;62/6155.html;", "google_scholar": "h1R6SZMAAAAJ;https://scholar.google.co.kr/citations?user=pOygDIIAAAAJ;PLgXBtEAAAAJ;;https://scholar.google.com/citations?view_op=list_works", "orcid": "0000-0002-2154-300X;;0000-0001-5432-4770;;", "linkedin": ";;;;", "or_profile": "~Jaemin_Lee2;~Minseok_Seo1;~Sangwoo_Lee2;~Dong-Geol_Choi2;~Hyobin_Park2", "aff": "Testworks Inc.;SI Analytics;ANTLAB;Hanbat National University;Hanbat National University", "aff_domain": "testworks.co.kr;si-analytics.ai;antlab.co.kr;hanbat.ac.kr;hanbat.ac.kr", "position": "Researcher;Researcher;Researcher;Full Professor;MS student", "bibtex": "@misc{\nlee2024a,\ntitle={A Multi-In-Single-Out Network for Video Frame Interpolation without optical flow},\nauthor={Jaemin Lee and Minseok Seo and Sangwoo Lee and Hyobin Park and Dong-Geol Choi},\nyear={2024},\nurl={https://openreview.net/forum?id=6HwamHLDa6}\n}", "github": "", "project": "", "reviewers": "a9Au;CFmx;rS3w;WQaG", "site": "https://openreview.net/forum?id=6HwamHLDa6", "pdf_size": 2566335, "rating": "5;5;5;5", "confidence": "3;3;5;5", "soundness": "2;3;2;2", "contribution": "2;2;1;1", "presentation": "2;3;3;2", "wc_summary": "72;74;54;94", "wc_strengths": "32;12;18;38", "wc_weaknesses": "113;131;121;110", "wc_questions": "35;211;10;3", "wc_review": "252;428;203;245", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "469;591;422;363", "reply_reviewers": "0;0;0;0", "reply_authors": "2;2;2;2", "rating_avg": [ 5.0, 0.0 ], "confidence_avg": [ 4.0, 1.0 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 1.5, 0.5 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 73.5, 14.168627315304754 ], "wc_strengths_avg": [ 25.0, 10.44030650891055 ], "wc_weaknesses_avg": [ 118.75, 8.13557004763649 ], "wc_questions_avg": [ 64.75, 85.27125834652611 ], "wc_review_avg": [ 
282.0, 86.35102778774552 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 461.25, 83.79849342321137 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 2.0, 0.0 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:AIUSxowBXEMJ:scholar.google.com/&scioq=A+Multi-In-Single-Out+Network+for+Video+Frame+Interpolation+without+optical+flow&hl=en&as_sdt=0,5", "gs_version_total": 3, "aff_unique_index": "0;1;2;3;3", "aff_unique_norm": "Testworks Inc.;SI Analytics;ANTLAB;Hanbat National University", "aff_unique_dep": ";;;", "aff_unique_url": ";;;https://www.hanbat.ac.kr", "aff_unique_abbr": ";;;HNU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;2;2", "aff_country_unique": "United States;;South Korea" }, { "id": "6I7UsvlDPj", "title": "LaMPP: Language Models as Probabilistic Priors for Perception and Action", "track": "main", "status": "Reject", "tldr": "", "abstract": "Language models trained on large text corpora encode rich distributional information about real-world environments and action sequences. This information plays a crucial role in current approaches to language processing tasks like question answering and instruction generation. We describe how to leverage language models for *non-linguistic* perception and control tasks. Our approach casts labeling and decision-making as inference in probabilistic graphical models in which language models parameterize prior distributions over labels, decisions and parameters, making it possible to integrate uncertain observations and incomplete background knowledge in a principled way. Applied to semantic segmentation, household navigation, and activity recognition tasks, this approach improves predictions on rare, out-of-distribution, and structurally novel inputs.", "keywords": "Machine Learning;Natural Language Processing;Language Models;Priors", "primary_area": "neurosymbolic & hybrid AI systems (physics-informed, logic & formal reasoning, etc.)", "supplementary_material": "/attachment/f9fbed4f5968a730146faac010dc312e3d283f5d.zip", "author": "Belinda Z. Li;William Chen;Pratyusha Sharma;Jacob Andreas", "authorids": "~Belinda_Z._Li1;~William_Chen1;~Pratyusha_Sharma1;~Jacob_Andreas1", "gender": "M;F;M;F", "homepage": ";https://pratyushasharma.github.io/;http://web.mit.edu/jda/www;https://belindal.github.io/", "dblp": ";228/7904;97/8154;263/9914", "google_scholar": "xUeq5EAAAAAJ;RGiCLUgAAAAJ;dnZ8udEAAAAJ;700fyvEAAAAJ", "orcid": ";;;", "linkedin": "william-chen-a3956516b/;;;", "or_profile": "~William_Chen1;~Pratyusha_Sharma1;~Jacob_Andreas1;~Belinda_Zou_Li1", "aff": "University of California, Berkeley;Massachusetts Institute of Technology;Microsoft;Massachusetts Institute of Technology", "aff_domain": "berkeley.edu;mit.edu;microsoft.com;mit.edu", "position": "PhD student;PhD student;Researcher;PhD student", "bibtex": "@misc{\nli2024lampp,\ntitle={La{MPP}: Language Models as Probabilistic Priors for Perception and Action},\nauthor={Belinda Z. 
Li and William Chen and Pratyusha Sharma and Jacob Andreas},\nyear={2024},\nurl={https://openreview.net/forum?id=6I7UsvlDPj}\n}", "github": "", "project": "", "reviewers": "C44C;xpjw;WR1X", "site": "https://openreview.net/forum?id=6I7UsvlDPj", "pdf_size": 39725166, "rating": "5;6;6", "confidence": "4;3;3", "soundness": "3;2;3", "contribution": "2;2;3", "presentation": "3;3;3", "wc_summary": "48;148;89", "wc_strengths": "9;46;45", "wc_weaknesses": "176;116;81", "wc_questions": "4;99;15", "wc_review": "237;409;230", "wc_reply_reviewers": "0;38;0", "wc_reply_authors": "809;1501;495", "reply_reviewers": "0;1;0", "reply_authors": "2;3;2", "rating_avg": [ 5.666666666666667, 0.4714045207910317 ], "confidence_avg": [ 3.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 95.0, 41.04469108991645 ], "wc_strengths_avg": [ 33.333333333333336, 17.21110752456745 ], "wc_weaknesses_avg": [ 124.33333333333333, 39.228674319799396 ], "wc_questions_avg": [ 39.333333333333336, 42.42902570437156 ], "wc_review_avg": [ 292.0, 82.7808351411525 ], "wc_reply_reviewers_avg": [ 12.666666666666666, 17.913371790059205 ], "wc_reply_authors_avg": [ 935.0, 420.250718817549 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 2.3333333333333335, 0.4714045207910317 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.9999999999999997, "gs_citation": 8, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=4920872563659380315&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "aff_unique_index": "0;1;2;1", "aff_unique_norm": "University of California, Berkeley;Massachusetts Institute of Technology;Microsoft", "aff_unique_dep": ";;Microsoft Corporation", "aff_unique_url": "https://www.berkeley.edu;https://web.mit.edu;https://www.microsoft.com", "aff_unique_abbr": "UC Berkeley;MIT;Microsoft", "aff_campus_unique_index": "0", "aff_campus_unique": "Berkeley;", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "id": "6INCxtPVXd", "title": "Mode-Aware Continual Learning for Conditional Generative Adversarial Networks", "track": "main", "status": "Reject", "tldr": "", "abstract": "The main challenge in continual learning for generative models is to effectively learn new target modes with limited samples while preserving previously learned ones. To this end, we introduce a new continual learning approach for generative modeling in conjunction with a mode-affinity score specifically designed for conditional generative adversarial networks. First, the generator produces samples of existing modes for subsequent replay. The discriminator is then used to compute the mode similarity measure, which identifies a set of closest existing modes to the target. Subsequently, a label for the target mode is generated and given as a weighted average of the labels within this set. We extend the continual learning model by training it on the target data with the newly-generated label, while performing memory replay to mitigate the risk of catastrophic forgetting. 
Experimental results on benchmark datasets demonstrate the gains of our approach over the state-of-the-art methods, even when using fewer training samples.", "keywords": "continual learning;generative model;mode affinity", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "", "author": "Cat Phuoc Le;Juncheng Dong;Ahmed Aloui;Vahid Tarokh", "authorids": "~Cat_Phuoc_Le1;~Juncheng_Dong1;~Ahmed_Aloui1;~Vahid_Tarokh1", "gender": "M;;M;", "homepage": "https://scholars.duke.edu/person/cat.le;;;", "dblp": "251/5583;;116/6738;", "google_scholar": "gSzKGdQAAAAJ;;;", "orcid": "0000-0002-9121-9395;;;", "linkedin": "catphuocle/;;ahmed-aloui-b06547153/;", "or_profile": "~Cat_Phuoc_Le1;~Juncheng_Dong1;~Ahmed_Aloui1;~Vahid_Tarokh1", "aff": "Duke University;;Duke University, Duke University;", "aff_domain": "duke.edu;;ece.duke.edu;", "position": "Postdoc;;PhD student;", "bibtex": "@misc{\nle2024modeaware,\ntitle={Mode-Aware Continual Learning for Conditional Generative Adversarial Networks},\nauthor={Cat Phuoc Le and Juncheng Dong and Ahmed Aloui and Vahid Tarokh},\nyear={2024},\nurl={https://openreview.net/forum?id=6INCxtPVXd}\n}", "github": "", "project": "", "reviewers": "M2Vt;DKw7;cors;y3EF", "site": "https://openreview.net/forum?id=6INCxtPVXd", "pdf_size": 9176444, "rating": "3;3;5;5", "confidence": "5;4;4;5", "soundness": "2;2;3;2", "contribution": "1;1;3;2", "presentation": "1;1;3;2", "wc_summary": "53;73;93;108", "wc_strengths": "16;30;63;46", "wc_weaknesses": "294;273;167;169", "wc_questions": "5;1;82;20", "wc_review": "368;377;405;343", "wc_reply_reviewers": "0;0;137;0", "wc_reply_authors": "447;432;462;317", "reply_reviewers": "0;0;1;0", "reply_authors": "1;1;2;1", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 4.5, 0.5 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 1.75, 0.82915619758885 ], "presentation_avg": [ 1.75, 0.82915619758885 ], "wc_summary_avg": [ 81.75, 20.72890493972125 ], "wc_strengths_avg": [ 38.75, 17.5695048308141 ], "wc_weaknesses_avg": [ 225.75, 58.22961016527588 ], "wc_questions_avg": [ 27.0, 32.53459696999488 ], "wc_review_avg": [ 373.25, 22.16275028059469 ], "wc_reply_reviewers_avg": [ 34.25, 59.322740159234044 ], "wc_reply_authors_avg": [ 414.5, 57.282196186948 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=2098866224242859711&as_sdt=80000005&sciodt=0,23&hl=en", "gs_version_total": 3, "aff_unique_index": "0;0", "aff_unique_norm": "Duke University", "aff_unique_dep": "", "aff_unique_url": "https://www.duke.edu", "aff_unique_abbr": "Duke", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "title": "Conserve-Update-Revise to Cure Generalization and Robustness Trade-off in Adversarial Training", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19397", "id": "6IjN7oxjXt", "author_site": "Shruthi Gowda, Bahram Zonooz, Elahe Arani", "tldr": "", "abstract": "Adversarial training improves the robustness of neural networks against adversarial attacks, albeit at the expense of the trade-off between standard and robust generalization. 
To unveil the underlying factors driving this phenomenon, we examine the layer-wise learning capabilities of neural networks during the transition from a standard to an adversarial setting. Our empirical findings demonstrate that selectively updating specific layers while preserving others can substantially enhance the network's learning capacity. We, therefore, propose CURE, a novel training framework that leverages a gradient prominence criterion to perform selective conservation, updating, and revision of weights. Importantly, CURE is designed to be dataset- and architecture-agnostic, ensuring its applicability across various scenarios. It effectively tackles both memorization and overfitting issues, thus enhancing the trade-off between robustness and generalization and additionally, this training approach also aids in mitigating \"robust overfitting\". Furthermore, our study provides valuable insights into the mechanisms of selective adversarial training and offers a promising avenue for future research.", "keywords": "Adversarial training;Adversarial Robustness;Generalization;Robustness;Robust overfitting;Selective training", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Shruthi Gowda;Bahram Zonooz;Elahe Arani", "authorids": "~Shruthi_Gowda1;~Bahram_Zonooz1;~Elahe_Arani1", "gender": "F;M;F", "homepage": ";https://sites.google.com/view/bahramzonooz;https://sites.google.com/view/elahe-arani", "dblp": ";250/9573;", "google_scholar": "e9CgwRgAAAAJ;;e_I_v6cAAAAJ", "orcid": ";;0000-0002-0952-7007", "linkedin": "shruthi-gowda-19811b15/;;elahe-arani-630870b2/", "or_profile": "~Shruthi_Gowda1;~Bahram_Zonooz1;~Elahe_Arani1", "aff": "Eindhoven University of Technology;Eindhoven University of Technology;Wayve Technologies Ltd", "aff_domain": "tue.nl;tue.nl;wayve.ai", "position": "PhD student;Assistant Professor;Head of AI Research", "bibtex": "@inproceedings{\ngowda2024conserveupdaterevise,\ntitle={Conserve-Update-Revise to Cure Generalization and Robustness Trade-off in Adversarial Training},\nauthor={Shruthi Gowda and Bahram Zonooz and Elahe Arani},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=6IjN7oxjXt}\n}", "github": "", "project": "", "reviewers": "PH92;DhtN;i2U9;HvAu", "pdf_size": 2312333, "rating": "5;5;6;6", "confidence": "3;1;4;3", "soundness": "2;2;3;3", "contribution": "2;2;2;4", "presentation": "3;3;3;4", "wc_summary": "119;41;105;75", "wc_strengths": "107;8;42;52", "wc_weaknesses": "399;176;19;286", "wc_questions": "101;36;42;78", "wc_review": "726;261;208;491", "wc_reply_reviewers": "507;0;11;173", "wc_reply_authors": "3007;1129;873;2034", "reply_reviewers": "1;0;1;1", "reply_authors": "5;3;2;4", "rating_avg": [ 5.5, 0.5 ], "confidence_avg": [ 2.75, 1.0897247358851685 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.5, 0.8660254037844386 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 85.0, 29.966648127543394 ], "wc_strengths_avg": [ 52.25, 35.56947427219019 ], "wc_weaknesses_avg": [ 220.0, 140.29789734703795 ], "wc_questions_avg": [ 64.25, 26.61179249881526 ], "wc_review_avg": [ 421.5, 205.48296766398911 ], "wc_reply_reviewers_avg": [ 172.75, 204.77350292457274 ], "wc_reply_authors_avg": [ 1760.75, 838.8999865895814 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 3.5, 1.118033988749895 ], "replies_avg": [ 24, 0 ], "authors#_avg": [ 
3, 0 ], "corr_rating_confidence": 0.6882472016116854, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=1547884356502405058&as_sdt=5,47&sciodt=0,47&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=6IjN7oxjXt", "pdf": "https://openreview.net/pdf?id=6IjN7oxjXt", "email": "tue.nl;tue.nl;wayve.ai", "author_num": 3, "aff_unique_index": "0;0;1", "aff_unique_norm": "Eindhoven University of Technology;Wayve Technologies", "aff_unique_dep": ";", "aff_unique_url": "https://www.tue.nl;https://www.wayvetechnologies.com", "aff_unique_abbr": "TU/e;Wayve", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;1", "aff_country_unique": "Netherlands;United Kingdom" }, { "title": "Principled Federated Domain Adaptation: Gradient Projection and Auto-Weighting", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19396", "id": "6J3ehSUrMU", "author_site": "Enyi Jiang, Yibo Jacky Zhang, Sanmi Koyejo", "tldr": "", "abstract": "Federated Domain Adaptation (FDA) describes the federated learning (FL) setting where source clients and a server work collaboratively to improve the performance of a target client where limited data is available. The domain shift between the source and target domains, coupled with limited data of the target client, makes FDA a challenging problem, e.g., common techniques such as federated averaging and fine-tuning fail due to domain shift and data scarcity. \nTo theoretically understand the problem, we introduce new metrics that characterize the FDA setting and a theoretical framework with novel theorems for analyzing the performance of server aggregation rules. Further, we propose a novel lightweight aggregation rule, Federated Gradient Projection ($\\texttt{FedGP}$), which significantly improves the target performance with domain shift and data scarcity. Moreover, our theory suggests an $\\textit{auto-weighting scheme}$ that finds the optimal combinations of the source and target gradients. This scheme improves both $\\texttt{FedGP}$ and a simpler heuristic aggregation rule. 
Extensive experiments verify the theoretical insights and illustrate the effectiveness of the proposed methods in practice.", "keywords": "federated domain adaptation;federated learning;domain adaptation;machine learning", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/16734c7844700ed71efbac5551d4b1fcf363e141.pdf", "author": "Enyi Jiang;Yibo Jacky Zhang;Sanmi Koyejo", "authorids": "~Enyi_Jiang1;~Yibo_Jacky_Zhang1;~Sanmi_Koyejo1", "gender": "F;M;", "homepage": "https://enyijiang.github.io/;https://cs.stanford.edu/~sanmi/;https://yiboz.me/", "dblp": "268/2122;14/8885;251/9129.html", "google_scholar": "h6YC9nwAAAAJ;EaaOeJwAAAAJ;", "orcid": ";0000-0002-4023-419X;", "linkedin": "enyi-jiang-16a561171/;sanmi-koyejo-984754/;", "or_profile": "~Enyi_Jiang1;~Oluwasanmi_O_Koyejo1;~Jacky_Yibo_Zhang1", "aff": "University of Illinois, Urbana Champaign;Google;University of Illinois, Urbana Champaign", "aff_domain": "uiuc.edu;google.com;illinois.edu", "position": "PhD student;Research Scientist;PhD student", "bibtex": "@inproceedings{\njiang2024principled,\ntitle={Principled Federated Domain Adaptation: Gradient Projection and Auto-Weighting},\nauthor={Enyi Jiang and Yibo Jacky Zhang and Sanmi Koyejo},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=6J3ehSUrMU}\n}", "github": "", "project": "", "reviewers": "nVHX;d97G;tJ7A;28v7", "pdf_size": 975660, "rating": "5;6;6;6", "confidence": "5;3;4;3", "soundness": "3;3;3;3", "contribution": "2;3;3;3", "presentation": "3;3;3;3", "wc_summary": "50;59;101;154", "wc_strengths": "22;34;92;67", "wc_weaknesses": "54;68;197;334", "wc_questions": "22;106;32;24", "wc_review": "148;267;422;579", "wc_reply_reviewers": "0;72;0;30", "wc_reply_authors": "582;932;466;1080", "reply_reviewers": "0;2;0;1", "reply_authors": "1;3;1;2", "rating_avg": [ 5.75, 0.4330127018922193 ], "confidence_avg": [ 3.75, 0.82915619758885 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 91.0, 41.15215668710451 ], "wc_strengths_avg": [ 53.75, 27.55335732719336 ], "wc_weaknesses_avg": [ 163.25, 113.25055187503503 ], "wc_questions_avg": [ 46.0, 34.84250278036869 ], "wc_review_avg": [ 354.0, 162.21436434545492 ], "wc_reply_reviewers_avg": [ 25.5, 29.508473359359 ], "wc_reply_authors_avg": [ 765.0, 250.00199999200007 ], "reply_reviewers_avg": [ 0.75, 0.82915619758885 ], "reply_authors_avg": [ 1.75, 0.82915619758885 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.8703882797784891, "gs_citation": 9, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=4689861876947239151&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=6J3ehSUrMU", "pdf": "https://openreview.net/pdf?id=6J3ehSUrMU", "email": "uiuc.edu;google.com;illinois.edu", "author_num": 3, "aff_unique_index": "0;1;0", "aff_unique_norm": "University of Illinois Urbana-Champaign;Google", "aff_unique_dep": ";Google", "aff_unique_url": "https://illinois.edu;https://www.google.com", "aff_unique_abbr": "UIUC;Google", "aff_campus_unique_index": "0;1;0", "aff_campus_unique": "Urbana-Champaign;Mountain View", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "6J7WG1jyog", "title": "AceGPT, Localizing Large Language Models in Arabic", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "This 
paper underscores the critical necessity and methodology for developing a localized Large Language Model (LLM) specifically for Arabic, a language imbued with unique cultural characteristics inadequately addressed by current mainstream models like ChatGPT. Significant concerns emerge when addressing cultural sensitivity and local values. To address this, the paper proposes a comprehensive solution that includes further pre-training with Arabic texts, Supervised Fine-Tuning (SFT) utilizing native Arabic instructions, and GPT-4 responses in Arabic, alongside Reinforcement Learning with AI Feedback (RLAIF) employing a reward model attuned to local culture and values. The goal is to cultivate culturally cognizant and value-aligned Arabic LLMs capable of accommodating the diverse, application-specific needs of Arabic-speaking communities.\n Comprehensive evaluations reveal that the resulting model, dubbed AceGPT, sets the state-of-the-art standard for open Arabic LLMs across various benchmarks, including the instruction-following benchmark (i.e., Arabic Vicuna-80 and Arabic AlpacaEval), knowledge benchmark (i.e., Arabic MMLU and EXAMs), and the newly introduced Arabic cultural \\& value alignment benchmark. Notably, AceGPT outperforms ChatGPT in the popular Vicuna-80 benchmark when evaluated with GPT-4, despite the benchmark's limited scale.", "keywords": "AceGPT;Arabic;Large Language Model;Localization", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Huang Huang;Fei Yu;Jianqing Zhu;Xuening Sun;Hao Cheng;Song Dingjie;Zhihong Chen;Mosen Alharthi;Bang An;Ziche Liu;Zhang Zhiyi;Junying Chen;Jianquan Li;Benyou Wang;Lian Zhang;Ruoyu Sun;Xiang Wan;Haizhou Li;Jinchao Xu", "authorids": "~Huang_Huang2;~Fei_Yu3;~Jianqing_Zhu2;~Xuening_Sun2;~Hao_Cheng18;~Song_Dingjie1;~Zhihong_Chen2;~Mosen_Alharthi1;~Bang_An3;~Ziche_Liu1;~Zhang_Zhiyi2;~Junying_Chen2;~Jianquan_Li1;~Benyou_Wang2;~Lian_Zhang2;~Ruoyu_Sun1;~Xiang_Wan1;~Haizhou_Li3;~Jinchao_Xu1", "gender": "M;F;M;M;M;M;M;M;;M;M;M;M;M;;M;M;M;M", "homepage": ";;https://github.com/614479467;https://markch00.github.io/;https://bbsngg.github.io/;;https://scholar.google.com/citations?hl=en&user=eMfvcJ4AAAAJ;https://cemse.kaust.edu.sa/amcs/people/person/bang;https://zicheliu.com/;https://github.com/zhangzhiyi23;;;https://wabyking.github.io/old.html;;https://ruoyus.github.io/;http://www.sribd.cn/teacher/28;https://colips.org/~eleliha/;https://www.personal.psu.edu/jxx1/;", "dblp": ";;;;262/3284;78/3726;;;;;;;169/1793;;30/9879-1;;36/4118;;", "google_scholar": "0JhMor8AAAAJ;EsCgPkQAAAAJ;;;YLQ8DCsAAAAJ;y55sF8cAAAAJ;;;cQ0xpOkAAAAJ;;https://scholar.google.com.hk/citations?user=I0raPTYAAAAJ;https://scholar.google.com/citations?hl=en;Jk4vJU8AAAAJ;;PsfzbCMAAAAJ;;https://scholar.google.com.sg/citations?user=z8_x7C8AAAAJ;pBHiYxcAAAAJ;https://scholar.google.com/citations?hl=en", "orcid": ";;;;;;;;;;;;0000-0002-1501-9914;;;;0000-0001-9158-9401;;", "linkedin": ";;;;;;;;;;;;;lian-zhang-47027a187/;;;haizhou-li-4ba74b6/;;", "or_profile": "~Huang_Huang2;~Fei_Yu3;~Xuening_Sun2;~Hao_Cheng18;~Song_Dingjie1;~Zhihong_Chen2;~Mosen_Alharthi1;~Bang_An3;~Ziche_Liu1;~Zhang_Zhiyi2;~Junying_Chen2;~Jianquan_Li1;~Benyou_Wang2;~Lian_Zhang2;~Ruoyu_Sun1;~Xiang_Wan1;~Haizhou_Li3;~Jinchao_Xu1;~Zhu_Jianqing2", "aff": "Shenzhen Research Institute of Big Data;The Chinese University of Hong Kong, Shenzhen;Bupt;The Chinese University of Hong Kong, Shenzhen;The Chinese University of Hong Kong, Shenzhen;The Chinese 
University of Hong Kong, Shenzhen;King Abdullah University of Science and Technology;;The Chinese University of Hong Kong, Shenzhen;;Chinese University of Hong Kong, Shenzhen;;The Chinese University of Hong Kong, Shenzhen;Shenzhen Research Institute of Big Data;The Chinese University of Hong Kong;Shenzhen Research Institute of Big Data;National University of Singapore;Pennsylvania State University;King Abdullah University of Science and Technology", "aff_domain": "sribd.cn;link.cuhk.edu.cn;cs.umass.edu;cuhk.edu.cn;cuhk.edu.cn;cuhk.edu.cn;kaust.edu.sa;;cuhk.edu.cn;;cuhk.hk;;cuhk.edu.cn;sribd.cn;cuhk.edu.cn;sribd.cn;nus.edu.sg;psu.edu;kaust.edu.sa", "position": "Researcher;PhD student;MS student;MS student;Researcher;PhD student;PhD student;;Undergrad student;;PhD student;;Assistant Professor;Researcher;Associate Professor;Principal Researcher;Full Professor;Full Professor;Postdoc", "bibtex": "@misc{\nhuang2024acegpt,\ntitle={Ace{GPT}, Localizing Large Language Models in Arabic},\nauthor={Huang Huang and Fei Yu and Jianqing Zhu and Xuening Sun and Hao Cheng and Song Dingjie and Zhihong Chen and Mosen Alharthi and Bang An and Ziche Liu and Zhang Zhiyi and Junying Chen and Jianquan Li and Benyou Wang and Lian Zhang and Ruoyu Sun and Xiang Wan and Haizhou Li and Jinchao Xu},\nyear={2024},\nurl={https://openreview.net/forum?id=6J7WG1jyog}\n}", "github": "", "project": "", "reviewers": "P1tY;CfmQ;vrrL", "site": "https://openreview.net/forum?id=6J7WG1jyog", "pdf_size": 636383, "rating": "3;3;5", "confidence": "4;4;3", "soundness": "3;3;3", "contribution": "2;2;2", "presentation": "3;3;3", "wc_summary": "96;98;38", "wc_strengths": "38;81;36", "wc_weaknesses": "169;158;39", "wc_questions": "52;229;21", "wc_review": "355;566;134", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 3.6666666666666665, 0.9428090415820634 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 77.33333333333333, 27.824849006278942 ], "wc_strengths_avg": [ 51.666666666666664, 20.75786330258702 ], "wc_weaknesses_avg": [ 122.0, 58.86141916966211 ], "wc_questions_avg": [ 100.66666666666667, 91.62362625921813 ], "wc_review_avg": [ 351.6666666666667, 176.37901109699973 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 3, 0 ], "authors#_avg": [ 19, 0 ], "corr_rating_confidence": -1.0, "gs_citation": 24, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=8712652082820375035&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 7, "aff_unique_index": "0;1;2;1;1;1;3;1;1;1;0;1;0;4;5;3", "aff_unique_norm": "Shenzhen Research Institute of Big Data;Chinese University of Hong Kong;Beijing University of Posts and Telecommunications;King Abdullah University of Science and Technology;National University of Singapore;Pennsylvania State University", "aff_unique_dep": ";;;;;", "aff_unique_url": "http://www.sribd.cn;https://www.cuhk.edu.cn;http://www.bupt.edu.cn/;https://www.kast.kau.edu.sa;https://www.nus.edu.sg;https://www.psu.edu", "aff_unique_abbr": ";CUHK;BUPT;KAUST;NUS;PSU", "aff_campus_unique_index": "1;1;1;1;1;1;1;2", "aff_campus_unique": ";Shenzhen;Hong Kong SAR", "aff_country_unique_index": "0;0;0;0;0;0;1;0;0;0;0;0;0;2;3;1", "aff_country_unique": "China;Saudi Arabia;Singapore;United States" }, { "id": "6JcbNMEFPw", 
"title": "Large Language Models Can Be Good Privacy Protection Learners", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "The proliferation of Large Language Models (LLMs) has driven considerable interest in fine-tuning them with domain-specific data to create specialized language models. \nNevertheless, such domain-specific fine-tuning data often contains sensitive personally identifiable information (PII). Direct fine-tuning LLMs on this data without privacy protection poses a risk of leakage. \nTo address this challenge, we introduce Privacy Protection Language Models (PPLM), a novel paradigm for fine-tuning LLMs that effectively injects domain-specific knowledge while safeguarding data privacy. \nOur work offers a theoretical analysis for model design and delves into various techniques such as corpus curation, penalty-based unlikelihood in training loss, and instruction-based tuning, etc. Extensive experiments across diverse datasets and scenarios demonstrate the effectiveness of our approaches. In particular, instruction tuning with both positive and negative examples, stands out as a promising method, effectively protecting private data while enhancing the model's knowledge. Our work underscores the potential for Large Language Models as robust privacy protection learners.", "keywords": "Large language model;Privacy protection", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "Yijia Xiao;Yiqiao Jin;Yushi Bai;Yue Wu;Xianjun Yang;Xiao Luo;Wenchao Yu;Xujiang Zhao;Yanchi Liu;Haifeng Chen;Wei Wang;Wei Cheng", "authorids": "~Yijia_Xiao1;~Yiqiao_Jin1;~Yushi_Bai1;~Yue_Wu12;~Xianjun_Yang1;~Xiao_Luo3;~Wenchao_Yu1;~Xujiang_Zhao1;~Yanchi_Liu1;~Haifeng_Chen1;~Wei_Wang13;~Wei_Cheng1", "gender": "M;M;M;M;M;M;;M;M;;F;M", "homepage": "https://yijia-xiao.com;https://ahren09.github.io/;https://bys0318.github.io/;https://yuewu.us/;;http://luoxiao12.github.io;;https://zxj32.github.io/;;https://haifengchen.gitlab.io/intro/;http://www.cs.ucla.edu/~weiwang;https://chengw07.github.io/", "dblp": "238/7281.html;207/6631.html;302/4421;41/5979-11;37/10237;50/1585-1;07/8491;221/5767;62/8146;08/57-1.html;w/WeiWang.html;89/2506-2.html", "google_scholar": "xLwcZvYAAAAJ;eY85qm4AAAAJ;https://scholar.google.com/citations?hl=zh-CN;kSQ1mLYAAAAJ;Tunh15sAAAAJ;https://scholar.google.com.hk/citations?;;k2-JcFAAAAAJ;faLmr-YAAAAJ;QzakB68AAAAJ;UedS9LQAAAAJ;PRrGVmoAAAAJ", "orcid": ";0000-0002-6974-5970;;;0000-0003-3318-8444;;;;;;0000-0002-8180-2886;", "linkedin": "yijia-xiao/;ahren-jin/;;;xianjun-yang-0062aa1a6/;%E9%9C%84-%E7%BD%97-303548214/;;zxj32/;;;wei-wang-8800845/;wei-cheng-ml/", "or_profile": "~Yijia_Xiao1;~Yiqiao_Jin1;~Yushi_Bai1;~Yue_Wu12;~Xianjun_Yang1;~Xiao_Luo3;~Wenchao_Yu1;~Xujiang_Zhao1;~Yanchi_Liu1;~Haifeng_Chen1;~Wei_Wang13;~Wei_Cheng1", "aff": "University of California, Los Angeles;Georgia Institute of Technology;Tsinghua University;University of California, Los Angeles;University of California, Santa Barbara;University of California, Los Angeles;University of California, Los Angeles;NEC Labs America;NEC-Labs;NEC-Labs;University of California, Los Angeles;NEC-Labs", "aff_domain": "ucla.edu;gatech.edu;tsinghua.edu.cn;ucla.edu;ucsb.edu;cs.ucla.edu;ucla.edu;nec-labs.com;nec-labs.com;nec-labs.com;ucla.edu;nec-labs.com", "position": "PhD student;PhD student;PhD student;PhD student;PhD student;Postdoc;PhD student;Researcher;Researcher;Researcher;Full Professor;Principal Researcher", "bibtex": "@misc{\nxiao2024large,\ntitle={Large 
Language Models Can Be Good Privacy Protection Learners},\nauthor={Yijia Xiao and Yiqiao Jin and Yushi Bai and Yue Wu and Xianjun Yang and Xiao Luo and Wenchao Yu and Xujiang Zhao and Yanchi Liu and Haifeng Chen and Wei Wang and Wei Cheng},\nyear={2024},\nurl={https://openreview.net/forum?id=6JcbNMEFPw}\n}", "github": "", "project": "", "reviewers": "wbo6;UJs9;qBeM;8QZB", "site": "https://openreview.net/forum?id=6JcbNMEFPw", "pdf_size": 1268612, "rating": "5;5;5;6", "confidence": "4;3;4;4", "soundness": "3;2;2;3", "contribution": "2;2;2;2", "presentation": "3;1;3;3", "wc_summary": "144;28;85;72", "wc_strengths": "70;40;41;48", "wc_weaknesses": "281;32;76;73", "wc_questions": "369;297;96;1", "wc_review": "864;397;298;194", "wc_reply_reviewers": "0;142;57;0", "wc_reply_authors": "1744;492;727;1005", "reply_reviewers": "0;2;1;0", "reply_authors": "7;6;6;3", "rating_avg": [ 5.25, 0.4330127018922193 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.5, 0.8660254037844386 ], "wc_summary_avg": [ 82.25, 41.43896113562694 ], "wc_strengths_avg": [ 49.75, 12.090802289343747 ], "wc_weaknesses_avg": [ 115.5, 97.11977141653496 ], "wc_questions_avg": [ 190.75, 148.36167800345208 ], "wc_review_avg": [ 438.25, 256.0726215353762 ], "wc_reply_reviewers_avg": [ 49.75, 58.12217735081851 ], "wc_reply_authors_avg": [ 992.0, 470.6107733573468 ], "reply_reviewers_avg": [ 0.75, 0.82915619758885 ], "reply_authors_avg": [ 5.5, 1.5 ], "replies_avg": [ 29, 0 ], "authors#_avg": [ 12, 0 ], "corr_rating_confidence": 0.3333333333333333, "gs_citation": -1, "gs_cited_by_link": "", "gs_version_total": -1, "aff_unique_index": "0;1;2;0;3;0;0;4;5;5;0;5", "aff_unique_norm": "University of California, Los Angeles;Georgia Institute of Technology;Tsinghua University;University of California, Santa Barbara;NEC Labs America;NEC Laboratories", "aff_unique_dep": ";;;;;", "aff_unique_url": "https://www.ucla.edu;https://www.gatech.edu;https://www.tsinghua.edu.cn;https://www.ucsb.edu;https://www.nec-labs.com;https://www.nec-labs.com", "aff_unique_abbr": "UCLA;Georgia Tech;THU;UCSB;NEC LA;NEC-Labs", "aff_campus_unique_index": "0;0;2;0;0;0", "aff_campus_unique": "Los Angeles;;Santa Barbara", "aff_country_unique_index": "0;0;1;0;0;0;0;0;0;0;0;0", "aff_country_unique": "United States;China" }, { "id": "6K81ILDnuv", "title": "Learning from Integral Losses in Physics Informed Neural Networks", "track": "main", "status": "Reject", "tldr": "", "abstract": "This work proposes a solution for the problem of training physics-informed networks under partial integro-differential equations. These equations require an infinite or a large number of neural evaluations to construct a single residual for training. As a result, accurate evaluation may be impractical, and we show that naive approximations at replacing these integrals with unbiased estimates lead to biased loss functions and solutions. To overcome this bias, we investigate three types of potential solutions: the deterministic sampling approach, the double-sampling trick, and the delayed target method. We consider three classes of PDEs for benchmarking; one defining Poisson problems with singular charges and weak solutions of up to 10 dimensions, another involving weak solutions on electro-magnetic fields and a Maxwell equation, and a third one defining a Smoluchowski coagulation problem. 
Our numerical results confirm the existence of the aforementioned bias in practice, and also show that our proposed delayed target approach can lead to accurate solutions with comparable quality to ones estimated with a large number of samples. Our implementation is open-source and available at https://anonymous.4open.science/r/btspinn.", "keywords": "Integral Losses;Partial Integro-Differential Equations;Physics Informed Neural Networks; Delayed Target Method", "primary_area": "neurosymbolic & hybrid AI systems (physics-informed, logic & formal reasoning, etc.)", "supplementary_material": "", "author": "Ehsan Saleh;Saba Ghaffari;Tim Bretl;Luke Olson;Matthew West", "authorids": "~Ehsan_Saleh1;~Saba_Ghaffari1;~Tim_Bretl1;~Luke_Olson1;~Matthew_West1", "gender": ";F;M;M;", "homepage": ";;http://bretl.csl.illinois.edu/;http://lukeo.cs.illinois.edu/;http://lagrange.mechse.illinois.edu", "dblp": ";;29/2834;06/8561.html;", "google_scholar": ";https://scholar.google.com/citations?hl=en;https://scholar.google.com.tw/citations?user=ab_0lGcAAAAJ;o43oc6AAAAAJ;", "orcid": ";;;0000-0002-5283-6104;0000-0002-7605-0050", "linkedin": ";saba-ghaffari-171a3356/;;;", "or_profile": "~Ehsan_Saleh1;~Saba_Ghaffari1;~Tim_Bretl1;~Luke_Olson1;~Matthew_West1", "aff": ";University of Illinois, Urbana Champaign;University of Illinois, Urbana Champaign;University of Illinois, Urbana Champaign;University of Illinois, Urbana Champaign", "aff_domain": ";illinois.edu;illinois.edu;illinois.edu;illinois.edu", "position": ";PhD student;Full Professor;Full Professor;Full Professor", "bibtex": "@misc{\nsaleh2024learning,\ntitle={Learning from Integral Losses in Physics Informed Neural Networks},\nauthor={Ehsan Saleh and Saba Ghaffari and Tim Bretl and Luke Olson and Matthew West},\nyear={2024},\nurl={https://openreview.net/forum?id=6K81ILDnuv}\n}", "github": "", "project": "", "reviewers": "LK81;izgt;jJr8;WnMU", "site": "https://openreview.net/forum?id=6K81ILDnuv", "pdf_size": 1776918, "rating": "5;5;5;6", "confidence": "3;4;4;1", "soundness": "2;2;4;3", "contribution": "2;3;3;3", "presentation": "1;2;3;3", "wc_summary": "55;117;81;103", "wc_strengths": "29;23;73;41", "wc_weaknesses": "54;75;484;61", "wc_questions": "305;41;104;5", "wc_review": "443;256;742;210", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 5.25, 0.4330127018922193 ], "confidence_avg": [ 3.0, 1.224744871391589 ], "soundness_avg": [ 2.75, 0.82915619758885 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 2.25, 0.82915619758885 ], "wc_summary_avg": [ 89.0, 23.45207879911715 ], "wc_strengths_avg": [ 41.5, 19.30673457630782 ], "wc_weaknesses_avg": [ 168.5, 182.31086089424295 ], "wc_questions_avg": [ 113.75, 115.9641647234179 ], "wc_review_avg": [ 412.75, 209.1642596143041 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 6, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.9428090415820632, "gs_citation": 5, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=8952720426583083926&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 8, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "University of Illinois Urbana-Champaign", "aff_unique_dep": "", "aff_unique_url": "https://illinois.edu", "aff_unique_abbr": "UIUC", "aff_campus_unique_index": "0;0;0;0", "aff_campus_unique": "Urbana-Champaign", "aff_country_unique_index": "0;0;0;0", 
"aff_country_unique": "United States" }, { "title": "UniTabE: A Universal Pretraining Protocol for Tabular Foundation Model in Data Science", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19395", "id": "6LLho5X6xV", "author_site": "Yazheng Yang, Yuqi Wang, Guang Liu, Ledell Wu, Qi Liu", "tldr": "", "abstract": "Recent advancements in Natural Language Processing (NLP) have witnessed the groundbreaking impact of pretrained models, yielding impressive outcomes across various tasks. This study seeks to extend the power of pretraining methodologies to facilitating the prediction over tables in data science, a domain traditionally overlooked, yet inherently challenging due to the plethora of table schemas intrinsic to different tasks. The primary research questions underpinning this work revolve around the establishment of a universal pretraining protocol for tables with varied structures, the generalizability and transferability of learned knowledge across tasks, the adaptation to diverse downstream applications, and the incorporation of incremental columns over time. In response to these challenges, we introduce UniTabE, a straightforward yet effective method designed to process tables in a uniform manner, devoid of constraints imposed by specific table structures. UniTabE's core concept relies on representing each basic table element with a module, termed TabUnit. This is subsequently followed by a Transformer encoder to refine the representation. Moreover, our model is designed to facilitate pretraining and finetuning through the utilization of free-form prompts. In order to implement the pretraining phase, we curated an expansive tabular dataset comprising approximately 13 billion samples, meticulously gathered from the Kaggle platform. This research primarily centers on classification and regression tasks involving tabular data, and conducts rigorous experimental testing and analyses to validate the effectiveness of our methodology. The experimental results demonstrate UniTabE's superior performance against several baseline models across a multitude of benchmark datasets. 
This, therefore, underscores UniTabE's potential to significantly enhance the semantic representation of tabular data, thereby marking a significant stride for tabular data analysis.", "keywords": "Pre-training Tabular Encoder;Pre-training;Heterogeneous Tabular Data;Classification and Regression;Deep Learning", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Yazheng Yang;Yuqi Wang;Guang Liu;Ledell Wu;Qi Liu", "authorids": "~Yazheng_Yang2;~Yuqi_Wang5;~Guang_Liu2;~Ledell_Wu1;~Qi_Liu5", "gender": ";M;F;M;M", "homepage": "https://www.linkedin.com/in/yazheng-yang-zju-cs/;https://bugggggggg.github.io/;;http://leuchine.github.io/;", "dblp": "222/9478;20/1168-3.html;206/6528;;193/2510-6", "google_scholar": "SAeMbW4AAAAJ;1fazBgUAAAAJ;-eJHVt8AAAAJ;Y-OeKMwAAAAJ;PqsOPSwAAAAJ", "orcid": "0000-0003-1627-8341;0009-0000-2930-0654;;0000-0003-4608-5778;", "linkedin": "yazheng-yang-zju-cs/;yuqi-wang-2746a8258/;;;", "or_profile": "~Yazheng_Yang2;~Yuqi_Wang5;~Ledell_Wu1;~Qi_Liu5;~Peter_Guang1", "aff": "The University of Hong Kong;University of Hong Kong;Creatify AI;University of Hong Kong;Beijing Academy of Artificial Intelligence", "aff_domain": "hku.hk;hku.hk;creatify.ai;hku.hk;baai.ac.cn", "position": "PhD student;MS student;Researcher;Assistant Professor;Researcher", "bibtex": "@inproceedings{\nyang2024unitabe,\ntitle={UniTabE: A Universal Pretraining Protocol for Tabular Foundation Model in Data Science},\nauthor={Yazheng Yang and Yuqi Wang and Guang Liu and Ledell Wu and Qi Liu},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=6LLho5X6xV}\n}", "github": "", "project": "", "reviewers": "3wag;KBNh;es5d", "pdf_size": 2155377, "rating": "5;6;8", "confidence": "3;5;3", "soundness": "2;4;3", "contribution": "2;3;3", "presentation": "3;3;3", "wc_summary": "202;105;109", "wc_strengths": "157;147;114", "wc_weaknesses": "252;164;163", "wc_questions": "56;112;99", "wc_review": "667;528;485", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "649;739;739", "reply_reviewers": "0;0;0", "reply_authors": "2;2;2", "rating_avg": [ 6.333333333333333, 1.247219128924647 ], "confidence_avg": [ 3.6666666666666665, 0.9428090415820634 ], "soundness_avg": [ 3.0, 0.816496580927726 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 138.66666666666666, 44.81319250201019 ], "wc_strengths_avg": [ 139.33333333333334, 18.372685039360892 ], "wc_weaknesses_avg": [ 193.0, 41.72129751897305 ], "wc_questions_avg": [ 89.0, 23.930454794396756 ], "wc_review_avg": [ 560.0, 77.67024312223225 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 709.0, 42.42640687119285 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 2.0, 0.0 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.18898223650461365, "gs_citation": 16, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10684779965231187666&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=6LLho5X6xV", "pdf": "https://openreview.net/pdf?id=6LLho5X6xV", "email": "hku.hk;hku.hk;creatify.ai;hku.hk;baai.ac.cn", "author_num": 5, "aff_unique_index": "0;0;1;0;2", "aff_unique_norm": "University of Hong Kong;Creatify AI;Beijing Academy of Artificial Intelligence", "aff_unique_dep": ";;", "aff_unique_url": "https://www.hku.hk;;https://www.baaic.cn", 
"aff_unique_abbr": "HKU;;BAAI", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Hong Kong SAR;", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "China;" }, { "id": "6LNTSrJjBe", "title": "Language Agent Tree Search Unifies Reasoning Acting and Planning in Language Models", "track": "main", "status": "Reject", "tldr": "", "abstract": "While large language models (LLMs) have demonstrated impressive performance on a range of decision-making tasks, they rely on simple acting processes and fall short of broad deployment as autonomous agents. We introduce LATS (Language Agent Tree Search), a general framework that synergizes the capabilities of LLMs in planning, acting, and reasoning. Drawing inspiration from Monte Carlo tree search in model-based reinforcement learning, LATS employs LLMs as agents, value functions, and optimizers, repurposing their latent strengths for enhanced decision-making. What is crucial in this method is the use of an environment for external feedback, which offers a more deliberate and adaptive problem-solving mechanism that moves beyond the limitations of existing methods. Our experimental evaluation across diverse domains, such as programming, HotPotQA, and WebShop, demonstrates the superiority and versatility of LATS for both reasoning and acting. In particular, LATS achieves 94.4\\% for programming on HumanEval with GPT-4 and an average score of 75.9 for web browsing on WebShop, demonstrating the effectiveness and generality of our method.", "keywords": "large language models;agent;reasoning;decision-making", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Andy Zhou;Kai Yan;Michal Shlapentokh-Rothman;Haohan Wang;Yu-Xiong Wang", "authorids": "~Andy_Zhou2;~Kai_Yan1;~Michal_Shlapentokh-Rothman1;~Haohan_Wang1;~Yu-Xiong_Wang1", "gender": "M;M;M;;F", "homepage": "https://www.andyzhou.ai;https://kaiyan289.github.io/;http://cs.cmu.edu/~haohanw;https://yxw.cs.illinois.edu/;https://michalmsr.web.illinois.edu/", "dblp": ";;132/4066;35/10700;269/4751", "google_scholar": "https://scholar.google.com/citations?hl=en;KElKfgQAAAAJ;nZxJGeUAAAAJ;T_Q-xDkAAAAJ;x9szIWsAAAAJ", "orcid": ";;;;", "linkedin": "andy-zhou-679376206/;%E5%BC%80-%E9%A2%9C-18b7931b1/;haohanwang/;;michal-shlapentokh-rothman/", "or_profile": "~Andy_Zhou2;~Kai_Yan1;~Haohan_Wang1;~Yu-Xiong_Wang1;~Michal_M_Shlapentokh-Rothman1", "aff": "Department of Computer Science;University of Illinois, Urbana Champaign;University of Illinois, Urbana Champaign;Department of Computer Science, University of Illinois Urbana-Champaign;University of Illinois, Urbana Champaign", "aff_domain": "cs.illinois.edu;cs.illinois.edu;illinois.edu;cs.illinois.edu;illinois.edu", "position": "Undergrad student;PhD student;Assistant Professor;Assistant Professor;PhD student", "bibtex": "@misc{\nzhou2024language,\ntitle={Language Agent Tree Search Unifies Reasoning Acting and Planning in Language Models},\nauthor={Andy Zhou and Kai Yan and Michal Shlapentokh-Rothman and Haohan Wang and Yu-Xiong Wang},\nyear={2024},\nurl={https://openreview.net/forum?id=6LNTSrJjBe}\n}", "github": "", "project": "", "reviewers": "7QYU;j4Tk;3Lmb;15HT", "site": "https://openreview.net/forum?id=6LNTSrJjBe", "pdf_size": 782168, "rating": "3;5;5;6", "confidence": "4;3;4;4", "soundness": "2;2;3;3", "contribution": "2;2;2;3", "presentation": "3;1;2;3", "wc_summary": "66;27;57;43", "wc_strengths": "29;25;44;55", "wc_weaknesses": "179;241;146;93", "wc_questions": "151;14;208;8", "wc_review": 
"425;307;455;199", "wc_reply_reviewers": "185;412;86;11", "wc_reply_authors": "2649;1526;2304;1340", "reply_reviewers": "1;2;1;1", "reply_authors": "5;3;4;2", "rating_avg": [ 4.75, 1.0897247358851685 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.25, 0.82915619758885 ], "wc_summary_avg": [ 48.25, 14.7542366796795 ], "wc_strengths_avg": [ 38.25, 11.986972094736853 ], "wc_weaknesses_avg": [ 164.75, 53.65806090421084 ], "wc_questions_avg": [ 95.25, 86.6526831667664 ], "wc_review_avg": [ 346.5, 101.5517109653993 ], "wc_reply_reviewers_avg": [ 173.5, 150.89483092538325 ], "wc_reply_authors_avg": [ 1954.75, 539.8385754093533 ], "reply_reviewers_avg": [ 1.25, 0.4330127018922193 ], "reply_authors_avg": [ 3.5, 1.118033988749895 ], "replies_avg": [ 30, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.13245323570650439, "gs_citation": 191, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5570756468692384789&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 10, "aff_unique_index": "0;1;1;1;1", "aff_unique_norm": "Unknown Institution;University of Illinois Urbana-Champaign", "aff_unique_dep": "Department of Computer Science;", "aff_unique_url": ";https://illinois.edu", "aff_unique_abbr": ";UIUC", "aff_campus_unique_index": "1;1;1;1", "aff_campus_unique": ";Urbana-Champaign", "aff_country_unique_index": "1;1;1;1", "aff_country_unique": ";United States" }, { "id": "6LyO8WTVTU", "title": "A Teacher-Guided Framework for Graph Representation Learning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "We consider the problem of unsupervised representation learning for Graph Neural Networks (GNNs). \nSeveral state-of-the-art approaches to this problem are based on Contrastive Learning (CL) principles that generate transferable representations. \nTheir objective function can be posed as a supervised discriminative task using 'hard labels', as they consider each pair of graphs as either 'equally positive' or 'equally negative'.\nHowever, it has been observed that using 'soft labels' in a Bayesian way can reduce the variance of the risk for discriminative tasks in supervised settings. \nMotivated by this, we propose a CL framework for GNNs, called *Teacher-guided Graph Contrastive Learning (TGCL)*, that incorporates `soft labels' to facilitate a more regularized discrimination. \nIn particular, we propose a teacher-student framework where the student network learns the representation by distilling the representations produced by the teacher network trained using unlabelled graphs. 
\nOur proposed approach can be adapted to any existing CL methods and empirically improves the performance across diverse downstream tasks.", "keywords": "graph neural network;representation learning", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Arnab Kumar Mondal;Jay Nandy;Manohar Kaul;Prathosh AP", "authorids": "~Arnab_Kumar_Mondal2;~Jay_Nandy1;~Manohar_Kaul1;~Prathosh_AP1", "gender": "M;M;M;M", "homepage": ";;https://manukaul.github.io/;https://sites.google.com/view/prathosh", "dblp": ";193/4096;29/10735;218/5887", "google_scholar": "MZ8N49AAAAAJ;https://scholar.google.co.in/citations?user=8N_wxz8AAAAJ;https://scholar.google.com.tw/citations?user=jNroyK4AAAAJ;https://scholar.google.co.in/citations?user=OEwV4bsAAAAJ", "orcid": "0000-0001-7297-374X;;;", "linkedin": "arnab-mondal-a4448a18/;jay-nandy-36654b34/;manu-k-72b936287/;prathosh-ap-phd-50ab9511/", "or_profile": "~Arnab_Kumar_Mondal2;~Jay_Nandy1;~Manohar_Kaul1;~Prathosh_AP1", "aff": "Fujitsu Research and Development Center Co. Ltm.;Fujitsu Research and Development Center Co. Ltm.;Fujitsu Research and Development Center Co. Ltm.;Indian Institute of Science, Indian institute of science, Bangalore", "aff_domain": "fujitsu.com;fujitsu.com;fujitsu.com;iisc.ac.in", "position": "Researcher;Researcher;Principal Researcher;Assistant Professor", "bibtex": "@misc{\nmondal2024a,\ntitle={A Teacher-Guided Framework for Graph Representation Learning},\nauthor={Arnab Kumar Mondal and Jay Nandy and Manohar Kaul and Prathosh AP},\nyear={2024},\nurl={https://openreview.net/forum?id=6LyO8WTVTU}\n}", "github": "", "project": "", "reviewers": "RhAx;xgHF;2WDw", "site": "https://openreview.net/forum?id=6LyO8WTVTU", "pdf_size": 1392351, "rating": "3;3;5", "confidence": "4;4;3", "soundness": "2;3;3", "contribution": "2;2;3", "presentation": "3;3;3", "wc_summary": "52;53;101", "wc_strengths": "54;24;30", "wc_weaknesses": "185;67;322", "wc_questions": "3;45;8", "wc_review": "294;189;461", "wc_reply_reviewers": "0;0;1081", "wc_reply_authors": "581;360;1657", "reply_reviewers": "0;0;3", "reply_authors": "1;1;4", "rating_avg": [ 3.6666666666666665, 0.9428090415820634 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 68.66666666666667, 22.866763848189994 ], "wc_strengths_avg": [ 36.0, 12.96148139681572 ], "wc_weaknesses_avg": [ 191.33333333333334, 104.19959479554397 ], "wc_questions_avg": [ 18.666666666666668, 18.732028424302822 ], "wc_review_avg": [ 314.6666666666667, 112.0009920590984 ], "wc_reply_reviewers_avg": [ 360.3333333333333, 509.5882869751053 ], "wc_reply_authors_avg": [ 866.0, 566.5515569360539 ], "reply_reviewers_avg": [ 1.0, 1.4142135623730951 ], "reply_authors_avg": [ 2.0, 1.4142135623730951 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -1.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:V5BOlabZ7fsJ:scholar.google.com/&scioq=A+Teacher-Guided+Framework+for+Graph+Representation+Learning&hl=en&as_sdt=0,44", "gs_version_total": 0, "aff_unique_index": "0;0;0;1", "aff_unique_norm": "Fujitsu Research and Development Center;Indian Institute of Science", "aff_unique_dep": "Research and Development;", "aff_unique_url": "https://www.fujitsu.com/global/;https://www.iisc.ac.in", "aff_unique_abbr": 
"Fujitsu R&D;IISc", "aff_campus_unique_index": "1", "aff_campus_unique": ";Bangalore", "aff_country_unique_index": "0;0;0;1", "aff_country_unique": "Japan;India" }, { "id": "6M5G5hNiAU", "title": "How Abilities in Large Language Models are Affected by Supervised Fine-tuning Data Composition", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Large language models (LLMs) with enormous pre-training tokens and parameter amounts emerge abilities including math reasoning, code generation, and instruction following. These abilities are further enhanced by supervised fine-tuning (SFT). The open-source community has studied on ad-hoc SFT for each ability, while proprietary LLMs are versatile for all abilities. It is important to investigate how to unlock them with multiple abilities via SFT. In this study, we specifically focus on the data composition between mathematical reasoning, code generation, and general human-aligning abilities during SFT. From a scaling perspective, we investigate the relationship between model abilities and various factors including data amounts, data composition ratio, model parameters, and SFT strategies. Our experiments reveal that different abilities exhibit different scaling patterns, and larger models generally show superior performance with the same amount of data. Mathematical reasoning and code generation improve as data amounts increase consistently, while the general ability is enhanced with about a thousand samples and improves slowly. We find data composition results in various abilities improvements with low data amounts, while conflicts of abilities with high data amounts. Our experiments further show that composition data amount impacts performance, while the influence of composition ratio is insignificant. Regarding the SFT strategies, we evaluate sequential learning multiple abilities are prone to catastrophic forgetting. 
Our proposed Dual-stage Mixed Fine-tuning (DMT) strategy learns specialized abilities first and then learns general abilities with a small amount of specialized data to prevent forgetting, offering a promising solution to learn multiple abilities with different scaling patterns.", "keywords": "Data Composition;Large Language Model;Scaling Analysis;Supervised Fine-tuning", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Guanting Dong;Hongyi Yuan;Keming Lu;Chengpeng Li;Mingfeng Xue;Dayiheng Liu;Wei Wang;Zheng Yuan;Chang Zhou;Jingren Zhou", "authorids": "~Guanting_Dong1;~Hongyi_Yuan1;~Keming_Lu1;~Chengpeng_Li1;~Mingfeng_Xue1;~Dayiheng_Liu1;~Wei_Wang41;~Zheng_Yuan2;~Chang_Zhou2;~Jingren_Zhou1", "gender": "M;M;M;M;M;M;M;M;M;M", "homepage": "https://dongguanting.github.io/;;;;;https://dayihengliu.github.io/;;;;", "dblp": ";308/0909;65/6898.html;;;https://dblp.uni-trier.de/pers/hd/l/Liu:Dayiheng;35/7092-225;56/2877-2;;84/2644", "google_scholar": "amozZDkAAAAJ;FG3O4i8AAAAJ;WuD2op4AAAAJ;5pidFF8AAAAJ;;pPLQrX4AAAAJ;0zSeT3oAAAAJ;https://scholar.google.com/citations?hl=zh-CN;QeSoG3sAAAAJ;", "orcid": ";;;;;0000-0002-8755-8941;0000-0002-7028-9845;;;", "linkedin": ";;;;;;;;;", "or_profile": "~Guanting_Dong1;~Hongyi_Yuan1;~Keming_Lu1;~Chengpeng_Li1;~Mingfeng_Xue1;~Dayiheng_Liu1;~Wei_Wang41;~Zheng_Yuan2;~Chang_Zhou2;~Jingren_Zhou1", "aff": "Beijing University of Posts and Telecommunications;Tsinghua University;Alibaba Group;University of Science and Technology of China;Sichuan University;Alibaba Group;Meituan;Alibaba Group;Alibaba Group;Alibaba Group", "aff_domain": "bupt.edu.cn;tsinghua.edu.cn;alibaba-inc.com;ustc.edu.cn;scu.edu.cn;alibaba-inc.com;meituan.com;alibaba-inc.com;alibaba-inc.com;alibaba-inc.com", "position": "MS student;PhD student;Researcher;PhD student;PhD student;Researcher;Principal Researcher;Researcher;Researcher;Researcher", "bibtex": "@misc{\ndong2024how,\ntitle={How Abilities in Large Language Models are Affected by Supervised Fine-tuning Data Composition},\nauthor={Guanting Dong and Hongyi Yuan and Keming Lu and Chengpeng Li and Mingfeng Xue and Dayiheng Liu and Wei Wang and Zheng Yuan and Chang Zhou and Jingren Zhou},\nyear={2024},\nurl={https://openreview.net/forum?id=6M5G5hNiAU}\n}", "github": "", "project": "", "reviewers": "4phB;crg6;C1QY", "site": "https://openreview.net/forum?id=6M5G5hNiAU", "pdf_size": 713131, "rating": "3;5;6", "confidence": "4;3;4", "soundness": "2;2;3", "contribution": "1;2;3", "presentation": "2;3;3", "wc_summary": "46;56;80", "wc_strengths": "28;81;99", "wc_weaknesses": "133;260;113", "wc_questions": "103;94;353", "wc_review": "310;491;645", "wc_reply_reviewers": "0;62;17", "wc_reply_authors": "262;1526;2012", "reply_reviewers": "0;1;1", "reply_authors": "1;4;6", "rating_avg": [ 4.666666666666667, 1.247219128924647 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.816496580927726 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 60.666666666666664, 14.2672897060218 ], "wc_strengths_avg": [ 69.33333333333333, 30.13672547278855 ], "wc_weaknesses_avg": [ 168.66666666666666, 65.09650954971055 ], "wc_questions_avg": [ 183.33333333333334, 120.02870027159707 ], "wc_review_avg": [ 482.0, 136.91116341141313 ], "wc_reply_reviewers_avg": [ 26.333333333333332, 26.157641755751268 ], "wc_reply_authors_avg": [ 1266.6666666666667, 
737.5930826380868 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 3.6666666666666665, 2.0548046676563256 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 10, 0 ], "corr_rating_confidence": -0.18898223650461363, "gs_citation": 119, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12013057803072540290&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 6, "aff_unique_index": "0;1;2;3;4;2;5;2;2;2", "aff_unique_norm": "Beijing University of Posts and Telecommunications;Tsinghua University;Alibaba Group;University of Science and Technology of China;Sichuan University;Meituan", "aff_unique_dep": ";;;;;", "aff_unique_url": "http://www.bupt.edu.cn/;https://www.tsinghua.edu.cn;https://www.alibaba.com;http://www.ustc.edu.cn;https://www.scu.edu.cn;https://www.meituan.com", "aff_unique_abbr": "BUPT;THU;Alibaba;USTC;SCU;Meituan", "aff_campus_unique_index": "0", "aff_campus_unique": "Beijing;", "aff_country_unique_index": "0;0;0;0;0;0;0;0;0;0", "aff_country_unique": "China" }, { "title": "SaProt: Protein Language Modeling with Structure-aware Vocabulary", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19394", "id": "6MRm3G4NiU", "author_site": "Jin Su, Chenchen Han, Yuyang Zhou, Junjie Shan, Xibin Zhou, Fajie Yuan", "tldr": "", "abstract": "Large-scale protein language models (PLMs), such as the ESM family, have achieved remarkable performance in various downstream tasks related to protein structure and function by undergoing unsupervised training on residue sequences. They have become essential tools for researchers and practitioners in biology. However, a limitation of vanilla PLMs is their lack of explicit consideration for protein structure information, which suggests the potential for further improvement. Motivated by this, we introduce the concept of a ``structure-aware vocabulary\" that integrates residue tokens with structure tokens. The structure tokens are derived by encoding the 3D structure of proteins using Foldseek. We then propose SaProt, a large-scale general-purpose PLM trained on an extensive dataset comprising approximately 40 million protein sequences and structures. Through extensive evaluation, our SaProt model surpasses well-established and renowned baselines across 10 significant downstream tasks, demonstrating its exceptional capacity and broad applicability. 
We have made the code, pre-trained model, and all relevant materials available at https://github.com/westlake-repl/SaProt.", "keywords": "Protein Language Models;Universal Representations;Downstream Tasks;Protein Structure Modeling", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Jin Su;Chenchen Han;Yuyang Zhou;Junjie Shan;Xibin Zhou;Fajie Yuan", "authorids": "~Jin_Su1;~Chenchen_Han1;~Yuyang_Zhou1;~Junjie_Shan1;~Xibin_Zhou1;~Fajie_Yuan2", "gender": "M;;Not Specified;M;M;M", "homepage": "https://ltenjoy.github.io/;;;https://scholar.google.com/citations?user=LhaFXOEAAAAJ&hl=en;https://fajieyuan.github.io/;https://github.com/zhoubay", "dblp": ";;;;175/4819;", "google_scholar": "47BkgB8AAAAJ;;;LhaFXOEAAAAJ;yOiBwasAAAAJ;", "orcid": ";0000-0002-3330-5308;;;;", "linkedin": ";;yuyang-zhou-150301222/;;;", "or_profile": "~Jin_Su1;~Chenchen_Han1;~Yuyang_Zhou1;~Junjie_Shan1;~Fajie_Yuan2;~Xibin_Bayes_Zhou1", "aff": "Westlake University;Westlake University;Westlake University;Westlake University;Westlake University;Westlake University", "aff_domain": "westlake.edu.cn;westlake.edu.cn;westlake.edu.cn;westlake.edu;westlake.edu.cn;westlake.edu", "position": "PhD student;PhD student;PhD student;Researcher;Assistant Professor;PhD student", "bibtex": "@inproceedings{\nsu2024saprot,\ntitle={SaProt: Protein Language Modeling with Structure-aware Vocabulary},\nauthor={Jin Su and Chenchen Han and Yuyang Zhou and Junjie Shan and Xibin Zhou and Fajie Yuan},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=6MRm3G4NiU}\n}", "github": "", "project": "", "reviewers": "1519;LEd3;WitX", "pdf_size": 4933295, "rating": "6;8;8", "confidence": "3;5;5", "soundness": "3;4;3", "contribution": "3;3;3", "presentation": "2;4;3", "wc_summary": "93;81;80", "wc_strengths": "81;72;80", "wc_weaknesses": "236;74;45", "wc_questions": "92;70;68", "wc_review": "502;297;273", "wc_reply_reviewers": "118;12;32", "wc_reply_authors": "2053;513;672", "reply_reviewers": "1;1;1", "reply_authors": "3;1;1", "rating_avg": [ 7.333333333333333, 0.9428090415820634 ], "confidence_avg": [ 4.333333333333333, 0.9428090415820634 ], "soundness_avg": [ 3.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 3.0, 0.816496580927726 ], "wc_summary_avg": [ 84.66666666666667, 5.90668171555645 ], "wc_strengths_avg": [ 77.66666666666667, 4.0276819911981905 ], "wc_weaknesses_avg": [ 118.33333333333333, 84.040995287353 ], "wc_questions_avg": [ 76.66666666666667, 10.873004286866728 ], "wc_review_avg": [ 357.3333333333333, 102.76294187216625 ], "wc_reply_reviewers_avg": [ 54.0, 45.985504962614755 ], "wc_reply_authors_avg": [ 1079.3333333333333, 691.5395063833221 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 1.6666666666666667, 0.9428090415820634 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.9999999999999998, "gs_citation": 117, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=18080281709349236734&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=6MRm3G4NiU", "pdf": "https://openreview.net/pdf?id=6MRm3G4NiU", "email": "westlake.edu.cn;westlake.edu.cn;westlake.edu.cn;westlake.edu;westlake.edu.cn;westlake.edu", "author_num": 6, "aff_unique_index": "0;0;0;0;0;0", "aff_unique_norm": "Westlake University", "aff_unique_dep": "", "aff_unique_url": 
"https://www.westlake.edu.cn", "aff_unique_abbr": "WU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "China" }, { "title": "Graphical Multioutput Gaussian Process with Attention", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19393", "id": "6N8TW504aa", "author_site": "Yijue Dai, Wenzhong Yan, Feng Yin", "tldr": "", "abstract": "Integrating information while recognizing dependence from multiple data sources and enhancing the predictive performance of the multi-output regression are challenging tasks. Multioutput Gaussian Process (MOGP) methods offer outstanding solutions with tractable predictions and uncertainty quantification. However, their practical applications are hindered by high computational complexity and storage demand. Additionally, there exist model mismatches in existing MOGP models when dealing with non-Gaussian data. To improve the model representation ability in terms of flexibility, optimality, and scalability, this paper introduces a novel multi-output regression framework, termed Graphical MOGP (GMOGP), which is empowered by: (i) Generating flexible Gaussian process priors consolidated from dentified parents, (ii) providing dependent processes with attention-based graphical representations, and (iii) achieving Pareto optimal solutions of kernel hyperparameters via a distributed learning framework. Numerical results confirm that the proposed GMOGP significantly outperforms state-of-the-art MOGP alternatives in predictive performance, as well as in time and memory efficiency, across various synthetic and real datasets.", "keywords": "Gaussian process regression;Multioutput Gaussian process;Attention mechanism", "primary_area": "probabilistic methods (Bayesian methods, variational inference, sampling, UQ, etc.)", "supplementary_material": "", "author": "Yijue Dai;Wenzhong Yan;Feng Yin", "authorids": "~Yijue_Dai1;~Wenzhong_Yan1;~Feng_Yin1", "gender": "M;M;", "homepage": "https://blsp-group.github.io/people.html;https://sse.cuhk.edu.cn/en/faculty/yinfeng;", "dblp": ";59/6917;", "google_scholar": ";4mW1N5oAAAAJ;upD7ilcAAAAJ", "orcid": ";;", "linkedin": ";;", "or_profile": "~Wenzhong_Yan1;~Feng_Yin1;~Dianna_Dai1", "aff": "School of Science and Engineering, The Chinese University of Hong Kong, Shenzhen;;CUHK(SZ)", "aff_domain": "cuhk.edu;;cuhk.edu.cn", "position": "PhD student;;PhD student", "bibtex": "@inproceedings{\ndai2024graphical,\ntitle={Graphical Multioutput Gaussian Process with Attention},\nauthor={Yijue Dai and Wenzhong Yan and Feng Yin},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=6N8TW504aa}\n}", "github": "", "project": "", "reviewers": "X7C1;pYyL;sgU9;9P5Q", "pdf_size": 1267166, "rating": "6;8;8;8", "confidence": "4;4;4;4", "soundness": "2;3;3;3", "contribution": "2;3;3;3", "presentation": "2;4;4;4", "wc_summary": "77;87;94;62", "wc_strengths": "26;98;203;132", "wc_weaknesses": "510;475;89;62", "wc_questions": "9;8;606;423", "wc_review": "622;668;992;679", "wc_reply_reviewers": "62;44;108;33", "wc_reply_authors": "1690;1039;1296;692", "reply_reviewers": "1;1;2;1", "reply_authors": "4;2;3;1", "rating_avg": [ 7.5, 0.8660254037844386 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.5, 0.8660254037844386 ], "wc_summary_avg": [ 80.0, 12.020815280171307 ], 
"wc_strengths_avg": [ 114.75, 63.72352391385775 ], "wc_weaknesses_avg": [ 284.0, 209.08491098116096 ], "wc_questions_avg": [ 261.5, 261.1422026406303 ], "wc_review_avg": [ 740.25, 146.91217614615883 ], "wc_reply_reviewers_avg": [ 61.75, 28.63891583143468 ], "wc_reply_authors_avg": [ 1179.25, 364.5472363082732 ], "reply_reviewers_avg": [ 1.25, 0.4330127018922193 ], "reply_authors_avg": [ 2.5, 1.118033988749895 ], "replies_avg": [ 23, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:_GNysYaL62kJ:scholar.google.com/&scioq=Graphical+Multioutput+Gaussian+Process+with+Attention&hl=en&as_sdt=0,44", "gs_version_total": 2, "openreview": "https://openreview.net/forum?id=6N8TW504aa", "pdf": "https://openreview.net/pdf?id=6N8TW504aa", "email": "cuhk.edu;;cuhk.edu.cn", "author_num": 3, "aff_unique_index": "0;1", "aff_unique_norm": "Chinese University of Hong Kong;Chinese University of Hong Kong, Shenzhen", "aff_unique_dep": "School of Science and Engineering;", "aff_unique_url": "https://www.cuhk.edu.cn;https://www.cuhk.edu.cn/sz", "aff_unique_abbr": "CUHK;CUHK(SZ)", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Shenzhen", "aff_country_unique_index": "0;0", "aff_country_unique": "China" }, { "id": "6NEJ0ReNzr", "title": "Learning to Plan and Generate Text with Citations", "track": "main", "status": "Reject", "tldr": "", "abstract": "The increasing demand for the deployment of LLMs in\ninformation-seeking scenarios has spurred efforts in creating\nverifiable systems, which generate responses to queries along with\nsupporting evidence. In this paper, we explore the attribution\ncapabilities of plan-based models which have been recently shown to\nimprove the faithfulness, grounding, and controllability of generated\ntext. We conceptualize plans as a sequence of questions which serve as\nblueprints of the generated content and its organisation. We\nexperiment with two models that utilize different variants of\nblueprints, an abstractive model where questions are\ngenerated from scratch, and an extractive\nmodel where the decoder is forced to copy questions from the\ninput. Experiments on long-form question-answering show\nthat output quality improves for blueprint models when these learn\nto generate responses with attribution. 
Moreover, the citations generated by blueprint models are more accurate compared to those obtained from \nLLM-based pipelines lacking a planning component.", "keywords": "summarization;text generation;content planning;attribution", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Constanza Fierro;Reinald Kim Amplayo;Fantine Huot;Nicola De Cao;Joshua Maynez;Shashi Narayan;Mirella Lapata", "authorids": "~Constanza_Fierro1;~Reinald_Kim_Amplayo2;~Fantine_Huot1;~Nicola_De_Cao1;~Joshua_Maynez1;~Shashi_Narayan1;~Mirella_Lapata1", "gender": "M;F;M;M;M;F;F", "homepage": "https://rktamplayo.github.io;;https://nicola-decao.github.io;;https://sites.google.com/corp/view/shashinarayan/;https://homepages.inf.ed.ac.uk/mlap/;", "dblp": ";;218/6626;220/3863;74/8458;59/6701;205/9159", "google_scholar": ";79VvQLMAAAAJ;CqTR3sIAAAAJ;ZOYd-0oAAAAJ;prEcE9IAAAAJ;j67B9Q4AAAAJ;uYCIJSEAAAAJ", "orcid": ";;;;;;", "linkedin": ";fantine/;nicoladecao;;;;", "or_profile": "~Reinald_Kim_Amplayo2;~Fantine_Huot1;~Nicola_De_Cao1;~Joshua_Maynez1;~Shashi_Narayan1;~Mirella_Lapata1;~FIERRO_Constanza1", "aff": "Google;Google;Google;Google;Google;Edinburgh University, University of Edinburgh;Copenhagen University", "aff_domain": "google.com;google.com;google.com;google.com;google.com;inf.ed.ac.uk;ku.dk", "position": "Researcher;Researcher;Researcher;Researcher;Research Scientist;Full Professor;PhD student", "bibtex": "@misc{\nfierro2024learning,\ntitle={Learning to Plan and Generate Text with Citations},\nauthor={Constanza Fierro and Reinald Kim Amplayo and Fantine Huot and Nicola De Cao and Joshua Maynez and Shashi Narayan and Mirella Lapata},\nyear={2024},\nurl={https://openreview.net/forum?id=6NEJ0ReNzr}\n}", "github": "", "project": "", "reviewers": "8rJ6;eZwk;vp7e;LX3E", "site": "https://openreview.net/forum?id=6NEJ0ReNzr", "pdf_size": 985007, "rating": "3;6;6;8", "confidence": "4;4;4;4", "soundness": "3;3;3;4", "contribution": "2;3;3;4", "presentation": "2;3;2;4", "wc_summary": "63;74;133;133", "wc_strengths": "50;25;19;55", "wc_weaknesses": "369;145;63;16", "wc_questions": "220;2;10;75", "wc_review": "702;246;225;279", "wc_reply_reviewers": "279;0;0;8", "wc_reply_authors": "2152;476;401;123", "reply_reviewers": "1;0;0;1", "reply_authors": "3;2;2;1", "rating_avg": [ 5.75, 1.7853571071357126 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 3.0, 0.7071067811865476 ], "presentation_avg": [ 2.75, 0.82915619758885 ], "wc_summary_avg": [ 100.75, 32.48364973336586 ], "wc_strengths_avg": [ 37.25, 15.497983739828868 ], "wc_weaknesses_avg": [ 148.25, 135.55326443874378 ], "wc_questions_avg": [ 76.75, 87.41674610736779 ], "wc_review_avg": [ 363.0, 196.6659604507094 ], "wc_reply_reviewers_avg": [ 71.75, 119.70040726747759 ], "wc_reply_authors_avg": [ 788.0, 798.4099824025249 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 2.0, 0.7071067811865476 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 13, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14554465176635499021&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 6, "aff_unique_index": "0;0;0;0;0;1;2", "aff_unique_norm": "Google;University of Edinburgh;University of Copenhagen", "aff_unique_dep": "Google;;", "aff_unique_url": "https://www.google.com;https://www.ed.ac.uk;https://www.ku.dk", "aff_unique_abbr": "Google;Edinburgh;UCPH", "aff_campus_unique_index": "0;0;0;0;0", "aff_campus_unique": 
"Mountain View;", "aff_country_unique_index": "0;0;0;0;0;1;2", "aff_country_unique": "United States;United Kingdom;Denmark" }, { "id": "6NO5UVWvo6", "title": "Annotation by Clicks: A Point-Supervised Contrastive Variance Method for Medical Semantic Segmentation", "track": "main", "status": "Reject", "tldr": "", "abstract": "Medical image segmentation methods typically rely on numerous dense annotated images for model training, which are notoriously expensive and time-consuming to collect. To alleviate this burden, weakly supervised techniques have been exploited to train segmentation models with less expensive annotations. In this paper, we propose a novel point-supervised contrastive variance method (PSCV) for medical image semantic segmentation, which only requires one pixel-point from each organ category to be annotated. The proposed method trains the base segmentation network by using a novel contrastive variance (CV) loss to exploit the unlabeled pixels and a partial cross-entropy loss on the labeled pixels. The CV loss function is designed to exploit the statistical spatial distribution properties of organs in medical images and their variance distribution map representations to enforce discriminative predictions over the unlabeled pixels. Experimental results on two standard medical image datasets demonstrate that the proposed method outperforms the state-of-the-art weakly supervised methods on point-supervised medical image semantic segmentation tasks.", "keywords": "medical image segmentation", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/2cec34e201fefce2f43fe52a658cc51eb6dfb67b.pdf", "author": "Qing En;Yuhong Guo", "authorids": "~Qing_En2;~Yuhong_Guo1", "gender": "M;", "homepage": ";", "dblp": "189/4347;", "google_scholar": "4tNrFv8AAAAJ;", "orcid": "0000-0003-0173-7437;", "linkedin": "qingen;", "or_profile": "~Qing_En2;~Yuhong_Guo1", "aff": "Carleton University;", "aff_domain": "cunet.carleton.ca;", "position": "Postdoc;", "bibtex": "@misc{\nen2024annotation,\ntitle={Annotation by Clicks: A Point-Supervised Contrastive Variance Method for Medical Semantic Segmentation},\nauthor={Qing En and Yuhong Guo},\nyear={2024},\nurl={https://openreview.net/forum?id=6NO5UVWvo6}\n}", "github": "", "project": "", "reviewers": "WEjx;jaNJ;2T67;JEHB", "site": "https://openreview.net/forum?id=6NO5UVWvo6", "pdf_size": 2172041, "rating": "3;5;5;5", "confidence": "5;4;4;4", "soundness": "2;3;3;2", "contribution": "2;2;3;2", "presentation": "3;3;3;2", "wc_summary": "58;54;72;142", "wc_strengths": "31;73;61;58", "wc_weaknesses": "150;358;111;171", "wc_questions": "79;14;156;22", "wc_review": "318;499;400;393", "wc_reply_reviewers": "0;0;0;23", "wc_reply_authors": "537;523;431;504", "reply_reviewers": "0;0;0;1", "reply_authors": "1;1;1;1", "rating_avg": [ 4.5, 0.8660254037844386 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 81.5, 35.563323804166565 ], "wc_strengths_avg": [ 55.75, 15.35211711784404 ], "wc_weaknesses_avg": [ 197.5, 95.13280191395604 ], "wc_questions_avg": [ 67.75, 56.78192934376217 ], "wc_review_avg": [ 402.5, 64.32145831680124 ], "wc_reply_reviewers_avg": [ 5.75, 9.959292143521045 ], "wc_reply_authors_avg": [ 498.75, 40.831207427652686 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 2, 
0 ], "corr_rating_confidence": -1.0, "gs_citation": 4, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=3282580224938276696&as_sdt=5,34&sciodt=0,34&hl=en", "gs_version_total": 5, "aff_unique_index": "0", "aff_unique_norm": "Carleton University", "aff_unique_dep": "", "aff_unique_url": "https://carleton.ca", "aff_unique_abbr": "Carleton", "aff_country_unique_index": "0", "aff_country_unique": "Canada" }, { "id": "6NaiZHL3l1", "title": "A Novel Evaluation Framework for Image Inpainting via Multi-Pass Self-Consistency", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Image inpainting aims to restore missing regions of corrupted images by utilizing the available unmasked content while ensuring consistency and fidelity. In scenarios where limited information is available, determining a unique optimal solution for a given inpainting case becomes challenging. However, existing assessment approaches predominantly rely on the availability of corresponding unmasked images, which introduces potential biases toward specific inpainting solutions. To address this disparity, we propose a novel evaluation framework that leverages the power of aggregated multi-pass image inpainting. Our self-supervised metric offers exceptional performance in scenarios with or without unmasked images. Rather than solely relying on similarity to the original images in terms of pixel space or feature space, our method prioritizes intrinsic self-consistency. This allows us to explore diverse and viable inpainting solutions while mitigating biases. Through extensive experimentation on multiple baselines, we demonstrate the strong alignment of our method with human perception, which is further supported by a comprehensive user study.", "keywords": "Image Inpainting", "primary_area": "datasets and benchmarks", "supplementary_material": "/attachment/3b7090fa99ac74876d1ae24b46dcb3c750d7b316.zip", "author": "Tianyi Chen;Jianfu Zhang;Yan Hong;Liqing Zhang", "authorids": "~Tianyi_Chen7;~Jianfu_Zhang2;~Yan_Hong1;~Liqing_Zhang2", "gender": "M;M;F;M", "homepage": "https://github.com/control-cyber;https://matt-sjtu.github.io/;https://github.com/hy-zpg;http://bcmi.sjtu.edu.cn/~zhangliqing/", "dblp": "93/4437-1;78/3993-3;68/974-2.html;20/4627-1.html", "google_scholar": ";https://scholar.google.com/citations?hl=en;https://scholar.google.com.hk/citations?user=ztq5-xcAAAAJ;1smFmxAAAAAJ", "orcid": "0009-0000-1203-6746;0000-0002-2673-5860;0000-0001-6401-0812;", "linkedin": ";;;", "or_profile": "~Tianyi_Chen7;~Jianfu_Zhang2;~Yan_Hong1;~Liqing_Zhang2", "aff": "Shanghai Jiaotong University;Shanghai Jiaotong University;Alibaba Group;Shanghai Jiaotong University", "aff_domain": "sjtu.edu.cn;sjtu.edu.cn;antgroup.com;sjtu.edu.cn", "position": "Undergrad student;Assistant Professor;Researcher;Full Professor", "bibtex": "@misc{\nchen2024a,\ntitle={A Novel Evaluation Framework for Image Inpainting via Multi-Pass Self-Consistency},\nauthor={Tianyi Chen and Jianfu Zhang and Yan Hong and Liqing Zhang},\nyear={2024},\nurl={https://openreview.net/forum?id=6NaiZHL3l1}\n}", "github": "", "project": "", "reviewers": "R8hK;ZP4Y;rSjt;yYxo", "site": "https://openreview.net/forum?id=6NaiZHL3l1", "pdf_size": 23052601, "rating": "1;3;3;5", "confidence": "4;5;4;3", "soundness": "1;1;2;2", "contribution": "1;1;2;3", "presentation": "2;2;3;2", "wc_summary": "48;56;87;51", "wc_strengths": "26;36;25;15", "wc_weaknesses": "162;168;224;35", "wc_questions": "31;6;23;404", "wc_review": "267;266;359;505", "wc_reply_reviewers": "0;0;0;0", 
"wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 3.0, 1.4142135623730951 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 1.5, 0.5 ], "contribution_avg": [ 1.75, 0.82915619758885 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 60.5, 15.56438241627338 ], "wc_strengths_avg": [ 25.5, 7.433034373659253 ], "wc_weaknesses_avg": [ 147.25, 69.17143557856812 ], "wc_questions_avg": [ 116.0, 166.52177034850428 ], "wc_review_avg": [ 349.25, 97.5304439649487 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.5, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:unpA5IYKZE4J:scholar.google.com/&scioq=A+Novel+Evaluation+Framework+for+Image+Inpainting+via+Multi-Pass+Self-Consistency&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;1;0", "aff_unique_norm": "Shanghai Jiao Tong University;Alibaba Group", "aff_unique_dep": ";", "aff_unique_url": "https://www.sjtu.edu.cn;https://www.alibaba.com", "aff_unique_abbr": "SJTU;Alibaba", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "China" }, { "title": "NoiseDiffusion: Correcting Noise for Image Interpolation with Diffusion Models beyond Spherical Linear Interpolation", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19392", "id": "6O3Q6AFUTu", "author_site": "Pengfei Zheng, Yonggang Zhang, Zhen Fang, Tongliang Liu, Defu Lian, Bo Han", "tldr": "", "abstract": "Image interpolation based on diffusion models is promising in creating fresh and interesting images. \nAdvanced interpolation methods mainly focus on spherical linear interpolation, where images are encoded into the noise space and then interpolated for denoising to images. \nHowever, existing methods face challenges in effectively interpolating natural images (not generated by diffusion models), thereby restricting their practical applicability. \nOur experimental investigations reveal that these challenges stem from the invalidity of the encoding noise, which may no longer obey the expected noise distribution, e.g., a normal distribution. \nTo address these challenges, we propose a novel approach to correct noise for image interpolation, NoiseDiffusion. Specifically, NoiseDiffusion approaches the invalid noise to the expected distribution by introducing subtle Gaussian noise and introduces a constraint to suppress noise with extreme values. In this context, promoting noise validity contributes to mitigating image artifacts, but the constraint and introduced exogenous noise typically lead to a reduction in signal-to-noise ratio, i.e., loss of original image information. Hence, NoiseDiffusion performs interpolation within the noisy image space and injects raw images into these noisy counterparts to address the challenge of information loss. 
Consequently, NoiseDiffusion enables us to interpolate natural images without causing artifacts or information loss, thus achieving the best interpolation results.", "keywords": "Image Interpolation; Diffusion Models", "primary_area": "generative models", "supplementary_material": "", "author": "PengFei Zheng;Yonggang Zhang;Zhen Fang;Tongliang Liu;Defu Lian;Bo Han", "authorids": "~PengFei_Zheng2;~Yonggang_Zhang1;~Zhen_Fang2;~Tongliang_Liu1;~Defu_Lian1;~Bo_Han1", "gender": "M;M;M;M;M;M", "homepage": "https://github.com/zheng-peng-fei;https://yonggangzhangben.github.io/index.html;https://fang-zhen.github.io/index.html;https://tongliang-liu.github.io/;https://faculty.ustc.edu.cn/liandefu/en/index.htm;https://bhanml.github.io/", "dblp": ";27/6859-3;;150/6667;87/10734;241/0472-3", "google_scholar": ";XSbEr98AAAAJ;OzD6WJcAAAAJ;https://scholar.google.com.au/citations?user=EiLdZ_YAAAAJ;QW0ad4sAAAAJ;nTNjqHwAAAAJ", "orcid": ";0000-0002-4080-7592;0000-0003-0602-6255;;0000-0002-3507-9607;", "linkedin": ";;;;;", "or_profile": "~PengFei_Zheng2;~Yonggang_Zhang1;~Zhen_Fang2;~Tongliang_Liu1;~Defu_Lian1;~bo_han2", "aff": "University of Science and Technology of China;Hong Kong Baptist University;University of Technology Sydney;Mohamed bin Zayed University of Artificial Intelligence;University of Science and Technology of China;MBZUAI", "aff_domain": "ustc.edu.cn;hkbu.edu.hk;uts.edu.au;mbzuai.ac.ae;ustc.edu.cn;mbzuai.ac.ae", "position": "MS student;Postdoc;Assistant Professor;Affiliated Associate Professor;Full Professor;Researcher", "bibtex": "@inproceedings{\nzheng2024noisediffusion,\ntitle={NoiseDiffusion: Correcting Noise for Image Interpolation with Diffusion Models beyond Spherical Linear Interpolation},\nauthor={PengFei Zheng and Yonggang Zhang and Zhen Fang and Tongliang Liu and Defu Lian and Bo Han},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=6O3Q6AFUTu}\n}", "github": "", "project": "", "reviewers": "A19z;YU98;h8PS", "pdf_size": 51159343, "rating": "8;8;8", "confidence": "4;3;3", "soundness": "4;3;3", "contribution": "4;3;3", "presentation": "4;3;2", "wc_summary": "133;148;86", "wc_strengths": "243;63;82", "wc_weaknesses": "224;170;75", "wc_questions": "60;114;13", "wc_review": "660;495;256", "wc_reply_reviewers": "14;64;35", "wc_reply_authors": "809;1456;1110", "reply_reviewers": "1;1;1", "reply_authors": "2;4;3", "rating_avg": [ 8.0, 0.0 ], "confidence_avg": [ 3.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 3.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 3.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 3.0, 0.816496580927726 ], "wc_summary_avg": [ 122.33333333333333, 26.411277052720408 ], "wc_strengths_avg": [ 129.33333333333334, 80.74789298936675 ], "wc_weaknesses_avg": [ 156.33333333333334, 61.5918465022405 ], "wc_questions_avg": [ 62.333333333333336, 41.26607430915726 ], "wc_review_avg": [ 470.3333333333333, 165.85200899865183 ], "wc_reply_reviewers_avg": [ 37.666666666666664, 20.499322482029065 ], "wc_reply_authors_avg": [ 1125.0, 264.3495161082514 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 3.0, 0.816496580927726 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 6, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11457188536986191953&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=6O3Q6AFUTu", "pdf": 
"https://openreview.net/pdf?id=6O3Q6AFUTu", "email": "ustc.edu.cn;hkbu.edu.hk;uts.edu.au;mbzuai.ac.ae;ustc.edu.cn;mbzuai.ac.ae", "author_num": 6, "aff_unique_index": "0;1;2;3;0;3", "aff_unique_norm": "University of Science and Technology of China;Hong Kong Baptist University;University of Technology Sydney;Mohamed bin Zayed University of Artificial Intelligence", "aff_unique_dep": ";;;", "aff_unique_url": "http://www.ustc.edu.cn;https://www.hkbu.edu.hk;https://www.uts.edu.au;https://mbzuai.ac.ae", "aff_unique_abbr": "USTC;HKBU;UTS;MBZUAI", "aff_campus_unique_index": "1", "aff_campus_unique": ";Hong Kong SAR", "aff_country_unique_index": "0;0;1;2;0;2", "aff_country_unique": "China;Australia;United Arab Emirates" }, { "id": "6PVgHZUepm", "title": "Rep-Adapter: Parameter-free Automatic Adaptation of Pre-trained ConvNets via Re-parameterization", "track": "main", "status": "Reject", "tldr": "", "abstract": "Recent advances in visual pre-training have demonstrated the advantage of transferring pre-trained models to target tasks. However, different transfer learning protocols have distinctive advantages regarding target tasks, and are nontrivial to choose without repeated trial and error. This paper presents a parameter-free automatic model adaptation protocol for ConvNets, aiming at automatically balancing between fine-tuning and linear probing, by using adaptive learning rate for each convolution filters on target tasks. First, we propose Rep-Adapter, an adapter module with re-parameterization scheme, which can achieve soft balancing between the pre-trained and fine-tuned filters, and can be equivalently converted to a single weight layer, without introducing additional parameters to the inference phase. We show by theoretical analysis that Rep-Adapter can simulate a ConvNet layer with each filter fine-tuning at different learning rate. We present a simple adapter tuning protocol with Rep-Adapter to achieve automatic adaptation of pretrained models without additional search cost. 
Extensive experiments on various datasets with ResNet and CLIP demonstrate the superiority of our Rep-Adapter on semi-supervised, few-shot and full dataset transfer learning scenarios.", "keywords": "Parameter-free Automatic Adaptation", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "", "author": "Changlin Li;Jiqi Zhang;Hongwei Xie;Kaicheng Yu;Bing Wang;Xiaodan Liang;Xiaojun Chang", "authorids": "~Changlin_Li2;~Jiqi_Zhang1;~Hongwei_Xie1;~Kaicheng_Yu1;~Bing_Wang14;~Xiaodan_Liang2;~Xiaojun_Chang4", "gender": "M;;M;M;F;M;M", "homepage": ";;;https://www.yukaicheng.cn;https://www.sysu-hcp.net/;https://scholar.google.com.sg/citations?hl=en&user=uwTzb6IAAAAJ&view_op=list_works;https://www.xiaojun.ai", "dblp": ";;37/1678;;;;116/8412", "google_scholar": "https://scholar.google.com/citations?hl=en;;kRvS9KAAAAAJ;j9OguiIAAAAJ;voxznZAAAAAJ;https://scholar.google.com.sg/citations?hl=en;https://scholar.google.co.uk/citations?user=8suupocAAAAJ", "orcid": ";;;;;;", "linkedin": ";https://cn.linkedin.com/in/%E5%90%89%E7%A5%BA-%E5%BC%A0-00389112a;;;;;", "or_profile": "~Changlin_Li2;~Jiqi_Zhang1;~Hongwei_Xie1;~Kaicheng_Yu1;~Xiaodan_Liang2;~bing_wang13;~Xiaojun_Chang1", "aff": "University of Technology Sydney;;Xiaomi Corporation;Westlake University;SUN YAT-SEN UNIVERSITY;Xiaomi Corporation;University of Technology Sydney", "aff_domain": "uts.edu.au;;xiaomi.com;westlake.edu;sysu.edu.cn;xiaomi.com;uts.edu.au", "position": "Postdoc;;Researcher;Assistant Professor;Associate Professor;Researcher;Full Professor", "bibtex": "@misc{\nli2024repadapter,\ntitle={Rep-Adapter: Parameter-free Automatic Adaptation of Pre-trained ConvNets via Re-parameterization},\nauthor={Changlin Li and Jiqi Zhang and Hongwei Xie and Kaicheng Yu and Bing Wang and Xiaodan Liang and Xiaojun Chang},\nyear={2024},\nurl={https://openreview.net/forum?id=6PVgHZUepm}\n}", "github": "", "project": "", "reviewers": "xJSa;ZcYB;XwS8", "site": "https://openreview.net/forum?id=6PVgHZUepm", "pdf_size": 664882, "rating": "3;6;8", "confidence": "5;4;5", "soundness": "2;3;3", "contribution": "2;3;3", "presentation": "2;3;3", "wc_summary": "39;108;64", "wc_strengths": "18;40;43", "wc_weaknesses": "132;66;268", "wc_questions": "70;10;72", "wc_review": "259;224;447", "wc_reply_reviewers": "83;0;0", "wc_reply_authors": "1441;481;384", "reply_reviewers": "1;0;0", "reply_authors": "3;1;1", "rating_avg": [ 5.666666666666667, 2.0548046676563256 ], "confidence_avg": [ 4.666666666666667, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 70.33333333333333, 28.522895287041873 ], "wc_strengths_avg": [ 33.666666666666664, 11.14550233153366 ], "wc_weaknesses_avg": [ 155.33333333333334, 84.10046901705654 ], "wc_questions_avg": [ 50.666666666666664, 28.767265347188555 ], "wc_review_avg": [ 310.0, 97.92173745735248 ], "wc_reply_reviewers_avg": [ 27.666666666666668, 39.12657522565563 ], "wc_reply_authors_avg": [ 768.6666666666666, 477.05788141715277 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 1.6666666666666667, 0.9428090415820634 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.11470786693528084, "gs_citation": 0, "gs_cited_by_link": 
"https://scholar.google.com/scholar?q=related:9NPzcIq4CWAJ:scholar.google.com/&scioq=Rep-Adapter:+Parameter-free+Automatic+Adaptation+of+Pre-trained+ConvNets+via+Re-parameterization&hl=en&as_sdt=0,44", "gs_version_total": 0, "aff_unique_index": "0;1;2;3;1;0", "aff_unique_norm": "University of Technology Sydney;Xiaomi Corporation;Westlake University;Sun Yat-sen University", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.uts.edu.au;https://www.xiaomi.com;https://www.westlake.edu.cn;http://www.sysu.edu.cn", "aff_unique_abbr": "UTS;Xiaomi;WU;SYSU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;1;1;1;0", "aff_country_unique": "Australia;China" }, { "title": "Dynamic Discounted Counterfactual Regret Minimization", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19391", "id": "6PbvbLyqT6", "author_site": "Hang Xu, Kai Li, Haobo Fu, QIANG FU, Junliang Xing, Jian Cheng", "tldr": "", "abstract": "Counterfactual regret minimization (CFR) is a family of iterative algorithms showing promising results in solving imperfect-information games. Recent novel CFR variants (e.g., CFR+, DCFR) have significantly improved the convergence rate of the vanilla CFR. The key to these CFR variants\u2019 performance is weighting each iteration non-uniformly, i.e., discounting earlier iterations. However, these algorithms use a fixed, manually-specified scheme to weight each iteration, which enormously limits their potential. In this work, we propose Dynamic Discounted CFR (DDCFR), the first equilibrium-finding framework that discounts prior iterations using a dynamic, automatically-learned scheme. We formalize CFR\u2019s iteration process as a carefully designed Markov decision process and transform the discounting scheme learning problem into a policy optimization problem within it. The learned discounting scheme dynamically weights each iteration on the fly using information available at runtime. Experimental results across multiple games demonstrate that DDCFR\u2019s dynamic discounting scheme has a strong generalization ability and leads to faster convergence with improved performance. 
The code is available at https://github.com/rpSebastian/DDCFR.", "keywords": "imperfect-information games;regret minimization;Nash equilibrium", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/20881043000a5b9be13557160cb756ac7746d388.zip", "author": "Hang Xu;Kai Li;Haobo Fu;QIANG FU;Junliang Xing;Jian Cheng", "authorids": "~Hang_Xu5;~Kai_Li2;~Haobo_Fu2;~QIANG_FU8;~Junliang_Xing1;~Jian_Cheng7", "gender": "M;M;M;M;M;M", "homepage": ";;;http://people.ucas.ac.cn/~jlxing?language=en;https://people.ucas.ac.cn/~chengjian?language=en;https://github.com/rpSebastian", "dblp": "181/2853;85/8571;;43/7659.html;14/6145-1;", "google_scholar": "_cY_PXgAAAAJ;LFdJXNcAAAAJ;gANaxT0AAAAJ;jSwNd3MAAAAJ;ZGCIUJ8AAAAJ;", "orcid": ";;;0000-0001-6801-0510;0000-0003-1289-2758;", "linkedin": ";haobo-fu-382b0784/;;https://www.linkedin.cn/incareer/in/ACoAAAvlU14B40ZWH1pxg5JJDtQ6LlgMYkp0e5s;;", "or_profile": "~Kai_Li2;~Haobo_Fu2;~QIANG_FU8;~Junliang_Xing1;~Jian_Cheng7;~Xu_Hang1", "aff": "Institute of Automation, Chinese Academy of Sciences;Tencent AI Lab;Tencent AI Lab;Tsinghua University;Institute of Automation, Chinese Academy of Sciences;Institute of Automation, Chinese Academy of Sciences", "aff_domain": "ia.ac.cn;tencent.com;tencent.com;tsinghua.edu.cn;ia.ac.cn;ia.ac.cn", "position": "Associate Professor;Principal Researcher;Principal Researcher;Full Professor;Full Professor;PhD student", "bibtex": "@inproceedings{\nxu2024dynamic,\ntitle={Dynamic Discounted Counterfactual Regret Minimization},\nauthor={Hang Xu and Kai Li and Haobo Fu and QIANG FU and Junliang Xing and Jian Cheng},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=6PbvbLyqT6}\n}", "github": "", "project": "", "reviewers": "ESsF;ffQX;u3Qf;f8hB", "pdf_size": 1141279, "rating": "8;8;8;8", "confidence": "3;3;4;5", "soundness": "3;4;3;4", "contribution": "3;3;4;3", "presentation": "3;3;4;4", "wc_summary": "125;66;48;104", "wc_strengths": "125;67;55;69", "wc_weaknesses": "123;352;78;219", "wc_questions": "62;84;97;75", "wc_review": "435;569;278;467", "wc_reply_reviewers": "20;77;19;8", "wc_reply_authors": "593;1109;214;851", "reply_reviewers": "1;1;1;1", "reply_authors": "2;3;2;3", "rating_avg": [ 8.0, 0.0 ], "confidence_avg": [ 3.75, 0.82915619758885 ], "soundness_avg": [ 3.5, 0.5 ], "contribution_avg": [ 3.25, 0.4330127018922193 ], "presentation_avg": [ 3.5, 0.5 ], "wc_summary_avg": [ 85.75, 30.367540236245674 ], "wc_strengths_avg": [ 79.0, 27.09243436828813 ], "wc_weaknesses_avg": [ 193.0, 104.97856924153615 ], "wc_questions_avg": [ 79.5, 12.776932339180638 ], "wc_review_avg": [ 437.25, 104.41354078853949 ], "wc_reply_reviewers_avg": [ 31.0, 26.972207918522354 ], "wc_reply_authors_avg": [ 691.75, 330.7018105484154 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 2.5, 0.5 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 10, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=3622742088901319178&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=6PbvbLyqT6", "pdf": "https://openreview.net/pdf?id=6PbvbLyqT6", "email": "ia.ac.cn;tencent.com;tencent.com;tsinghua.edu.cn;ia.ac.cn;ia.ac.cn", "author_num": 6, "aff_unique_index": "0;1;1;2;0;0", "aff_unique_norm": "Chinese Academy of Sciences;Tencent;Tsinghua University", "aff_unique_dep": "Institute of Automation;Tencent AI Lab;", "aff_unique_url": 
"http://www.ia.cas.cn;https://ai.tencent.com;https://www.tsinghua.edu.cn", "aff_unique_abbr": "CAS;Tencent AI Lab;THU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "China" }, { "id": "6PjS5RnxeK", "title": "On progressive sharpening, flat minima and generalisation", "track": "main", "status": "Reject", "tldr": "", "abstract": "We present a new approach to understanding the relationship between loss curvature and input-output model behaviour in deep learning. Specifically, we use existing empirical analyses of the spectrum of deep network loss Hessians to ground an ansatz tying together the loss Hessian and the input-output Jacobian over training samples during the training of deep neural networks. We then prove a series of theoretical results which quantify the degree to which the input-output Jacobian of a model approximates its Lipschitz norm over a data distribution, and deduce a novel generalisation bound in terms of the empirical Jacobian. We use our ansatz, together with our theoretical results, to give a new account of the recently observed progressive sharpening phenomenon, as well as the generalisation properties of flat minima. Experimental evidence is provided to validate our claims.", "keywords": "progressive sharpening;flat minima;generalisation;generalization", "primary_area": "learning theory", "supplementary_material": "/attachment/c2208f44613f193ef0afa123ec35aa2edfc21b1b.zip", "author": "Lachlan Ewen MacDonald;Jack Valmadre;Simon Lucey", "authorids": "~Lachlan_Ewen_MacDonald1;~Jack_Valmadre1;~Simon_Lucey2", "gender": ";M;M", "homepage": "https://researchers.adelaide.edu.au/profile/lachlan.macdonald;https://jack.valmadre.net/;https://www.adelaide.edu.au/directory/simon.lucey", "dblp": "306/7691;50/8535;01/3542", "google_scholar": "r953DlQAAAAJ;_VSBqL0AAAAJ;vmAe35UAAAAJ", "orcid": ";;", "linkedin": ";;", "or_profile": "~Lachlan_Ewen_MacDonald1;~Jack_Valmadre1;~Simon_Lucey2", "aff": "Johns Hopkins University;University of Adelaide;University of Adelaide", "aff_domain": "jhu.edu;adelaide.edu.au;adelaide.edu.au", "position": "Postdoc;Lecturer;Full Professor", "bibtex": "@misc{\nmacdonald2024on,\ntitle={On progressive sharpening, flat minima and generalisation},\nauthor={Lachlan Ewen MacDonald and Jack Valmadre and Simon Lucey},\nyear={2024},\nurl={https://openreview.net/forum?id=6PjS5RnxeK}\n}", "github": "", "project": "", "reviewers": "L7Vu;LTAo;7LFk;dFnj", "site": "https://openreview.net/forum?id=6PjS5RnxeK", "pdf_size": 650955, "rating": "3;3;6;8", "confidence": "4;4;2;2", "soundness": "3;2;3;3", "contribution": "1;2;2;3", "presentation": "3;2;3;3", "wc_summary": "18;100;72;215", "wc_strengths": "28;100;110;63", "wc_weaknesses": "127;601;245;98", "wc_questions": "40;1;83;73", "wc_review": "213;802;510;449", "wc_reply_reviewers": "0;0;72;0", "wc_reply_authors": "512;794;458;208", "reply_reviewers": "0;0;1;0", "reply_authors": "1;1;1;1", "rating_avg": [ 5.0, 2.1213203435596424 ], "confidence_avg": [ 3.0, 1.0 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 101.25, 71.9839391809034 ], "wc_strengths_avg": [ 75.25, 32.41431011143072 ], "wc_weaknesses_avg": [ 267.75, 200.12418019819594 ], "wc_questions_avg": [ 49.25, 32.080952292598795 ], "wc_review_avg": [ 493.5, 209.82433128691247 ], "wc_reply_reviewers_avg": [ 18.0, 31.176914536239792 ], "wc_reply_authors_avg": [ 493.0, 
208.21383239352758 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.9428090415820635, "gs_citation": 5, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14425807823744012155&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 3, "aff_unique_index": "0;1;1", "aff_unique_norm": "Johns Hopkins University;University of Adelaide", "aff_unique_dep": ";", "aff_unique_url": "https://www.jhu.edu;https://www.adelaide.edu.au", "aff_unique_abbr": "JHU;Adelaide", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;1", "aff_country_unique": "United States;Australia" }, { "title": "LongLoRA: Efficient Fine-tuning of Long-Context Large Language Models", "status": "Oral", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19390", "id": "6PmJoRfdaK", "author_site": "Yukang Chen, Shengju Qian, Haotian Tang, Xin Lai, Zhijian Liu, Song Han, Jiaya Jia", "tldr": "", "abstract": "We present LongLoRA, an efficient fine-tuning approach that extends the context sizes of pre-trained large language models (LLMs), with limited computation cost.\nTypically, training LLMs with long context sizes is computationally expensive, requiring extensive training hours and GPU resources. For example, training on the context length of 8192 needs 16x computational costs in self-attention layers as that of 2048. In this paper, we speed up the context extension of LLMs in two aspects. On the one hand, although dense global attention is needed during inference, fine-tuning the model can be effectively and efficiently done by sparse local attention. The proposed shifted sparse attention effectively enables context extension, leading to non-trivial computation saving with similar performance to fine-tuning with vanilla attention. Particularly, it can be implemented with only two lines of code in training, while being optional in inference. On the other hand, we revisit the parameter-efficient fine-tuning regime for context expansion. Notably, we find that LoRA for context extension works well under the premise of trainable embedding and normalization. LongLoRA combines this improved LoRA with S^2-Attn. LongLoRA demonstrates strong empirical results on various tasks on Llama2 models from 7B/13B to 70B. LongLoRA extends Llama2 7B from 4k context to 100k, or Llama2 70B to 32k on a single 8x A100 machine. LongLoRA extends models' context while retaining their original architectures, and is compatible with most existing techniques, like Flash-Attention2. In addition, we further conduct supervised fine-tuning with LongLoRA and our long instruction-following LongAlpaca dataset. 
All our code, models, dataset, and demo are available at https://github.com/dvlab-research/LongLoRA.", "keywords": "Efficient fine-tuning;Long context;Large language model", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Yukang Chen;Shengju Qian;Haotian Tang;Xin Lai;Zhijian Liu;Song Han;Jiaya Jia", "authorids": "~Yukang_Chen1;~Shengju_Qian1;~Haotian_Tang1;~Xin_Lai1;~Zhijian_Liu1;~Song_Han5;~Jiaya_Jia1", "gender": "M;M;M;M;M;;M", "homepage": "https://yukangchen.com/;http://thesouthfrog.com/about.me/;http://kentang.net;https://x-lai.github.io;https://zhijianliu.com;;https://jiaya.me", "dblp": "225/4601;247/6076;245/0058;;;;31/5649", "google_scholar": "6p0ygKUAAAAJ;QNnWmasAAAAJ;WxL13BAAAAAJ;tqNDPA4AAAAJ;mwzYYPgAAAAJ;;https://scholar.google.com.tw/citations?user=XPAkzTEAAAAJ", "orcid": ";;;;;;", "linkedin": ";;;;zhijianliu/;;", "or_profile": "~Yukang_Chen1;~Shengju_Qian1;~Haotian_Tang1;~Xin_Lai1;~Zhijian_Liu1;~Song_Han5;~Jiaya_Jia1", "aff": "NVIDIA;Tencent;NVIDIA;The Chinese University of Hong Kong;Massachusetts Institute of Technology;;Department of Computer Science and Engineering, Hong Kong University of Science and Technology", "aff_domain": "nvidia.com;tencent.com;nvidia.com;cuhk.edu.hk;mit.edu;;cse.ust.hk", "position": "Researcher;Researcher;Intern;PhD student;PhD student;;Full Professor", "bibtex": "@inproceedings{\nchen2024longlora,\ntitle={LongLo{RA}: Efficient Fine-tuning of Long-Context Large Language Models},\nauthor={Yukang Chen and Shengju Qian and Haotian Tang and Xin Lai and Zhijian Liu and Song Han and Jiaya Jia},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=6PmJoRfdaK}\n}", "github": "", "project": "", "reviewers": "WV76;7K1u;Sw6W;FsJg", "pdf_size": 1168720, "rating": "6;6;8;8", "confidence": "3;4;4;3", "soundness": "3;3;4;3", "contribution": "2;3;4;2", "presentation": "3;2;4;2", "wc_summary": "44;137;66;130", "wc_strengths": "47;18;48;71", "wc_weaknesses": "35;9;3;32", "wc_questions": "9;76;56;208", "wc_review": "135;240;173;441", "wc_reply_reviewers": "0;0;8;40", "wc_reply_authors": "472;569;536;477", "reply_reviewers": "0;0;1;1", "reply_authors": "1;1;1;2", "rating_avg": [ 7.0, 1.0 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.82915619758885 ], "presentation_avg": [ 2.75, 0.82915619758885 ], "wc_summary_avg": [ 94.25, 40.08974307725107 ], "wc_strengths_avg": [ 46.0, 18.801595676963167 ], "wc_weaknesses_avg": [ 19.75, 13.953046262375826 ], "wc_questions_avg": [ 87.25, 73.83554360875256 ], "wc_review_avg": [ 247.25, 118.00926870377597 ], "wc_reply_reviewers_avg": [ 12.0, 16.492422502470642 ], "wc_reply_authors_avg": [ 513.5, 40.74616546375867 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 360, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=15175040643590476650&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=6PmJoRfdaK", "pdf": "https://openreview.net/pdf?id=6PmJoRfdaK", "email": "nvidia.com;tencent.com;nvidia.com;cuhk.edu.hk;mit.edu;;cse.ust.hk", "author_num": 7, "aff_unique_index": "0;1;0;2;3;4", "aff_unique_norm": "NVIDIA;Tencent;Chinese University of Hong Kong;Massachusetts Institute of Technology;Hong Kong University of 
Science and Technology", "aff_unique_dep": "NVIDIA Corporation;Tencent Holdings Limited;;;Department of Computer Science and Engineering", "aff_unique_url": "https://www.nvidia.com;https://www.tencent.com;https://www.cuhk.edu.hk;https://web.mit.edu;https://www.ust.hk", "aff_unique_abbr": "NVIDIA;Tencent;CUHK;MIT;HKUST", "aff_campus_unique_index": "1;1", "aff_campus_unique": ";Hong Kong SAR", "aff_country_unique_index": "0;1;0;1;0;1", "aff_country_unique": "United States;China" }, { "title": "IceFormer: Accelerated Inference with Long-Sequence Transformers on CPUs", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19389", "id": "6RR3wU4mSZ", "author_site": "Yuzhen Mao, Martin Ester, Ke Li", "tldr": "", "abstract": "One limitation of existing Transformer-based models is that they cannot handle very long sequences as input since their self-attention operations exhibit quadratic time and space complexity. This problem becomes especially acute when Transformers are deployed on hardware platforms equipped only with CPUs. To address this issue, we propose a novel method for accelerating self-attention at inference time that works with pretrained Transformer models out-of-the-box without requiring retraining. We experiment using our method to accelerate various long-sequence Transformers, including a leading LLaMA 2-based LLM, on various benchmarks and demonstrate a greater speedup of $2.73\\times$ - $7.63\\times$ while retaining $98.6$% - $99.6$% of the accuracy of the original pretrained models. The code is available on our project website at https://yuzhenmao.github.io/IceFormer/.", "keywords": "Efficient Transformers;Inference-time Efficiency;CPU", "primary_area": "generative models", "supplementary_material": "/attachment/4ffc52aa275005fa3921f695f72131d5e57fa122.zip", "author": "Yuzhen Mao;Martin Ester;Ke Li", "authorids": "~Yuzhen_Mao2;~Martin_Ester1;~Ke_Li1", "gender": "M;M;M", "homepage": "https://github.com/yuzhenmao;https://sites.google.com/view/esterlab;http://www.sfu.ca/~keli/", "dblp": "336/2249;e/MartinEster;75/6627-11", "google_scholar": "9wKn1A0AAAAJ;https://scholar.google.com.tw/citations?user=ZYwC_CQAAAAJ;vQc8tI4AAAAJ", "orcid": ";0000-0001-7732-2815;", "linkedin": ";;", "or_profile": "~Yuzhen_Mao2;~Martin_Ester1;~Ke_Li1", "aff": "Simon Fraser University;Simon Fraser University;Simon Fraser University", "aff_domain": "sfu.ca;sfu.ca;sfu.ca", "position": "Researcher;Full Professor;Assistant Professor", "bibtex": "@inproceedings{\nmao2024iceformer,\ntitle={IceFormer: Accelerated Inference with Long-Sequence Transformers on {CPU}s},\nauthor={Yuzhen Mao and Martin Ester and Ke Li},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=6RR3wU4mSZ}\n}", "github": "", "project": "", "reviewers": "dxGt;nr9P;d3mB;ad3y;5Bmg", "pdf_size": 2372458, "rating": "3;6;6;6;6", "confidence": "3;3;5;4;3", "soundness": "2;3;2;3;3", "contribution": "1;3;3;2;3", "presentation": "1;3;3;2;3", "wc_summary": "109;62;36;41;87", "wc_strengths": "89;40;59;33;59", "wc_weaknesses": "184;39;134;72;93", "wc_questions": "3;46;40;135;92", "wc_review": "385;187;269;281;331", "wc_reply_reviewers": "0;0;0;26;19", "wc_reply_authors": "1008;553;823;1473;723", "reply_reviewers": "0;0;0;1;1", "reply_authors": "2;1;2;3;1", "rating_avg": [ 5.4, 1.2 ], "confidence_avg": [ 3.6, 0.8 ], "soundness_avg": [ 2.6, 0.4898979485566356 ], "contribution_avg": [ 2.4, 0.8 ], "presentation_avg": [ 2.4, 0.8 ], "wc_summary_avg": [ 
67.0, 27.66224864323217 ], "wc_strengths_avg": [ 56.0, 19.452506265260524 ], "wc_weaknesses_avg": [ 104.4, 50.337262539792526 ], "wc_questions_avg": [ 63.2, 45.70076585791534 ], "wc_review_avg": [ 290.6, 66.08358343794622 ], "wc_reply_reviewers_avg": [ 9.0, 11.242775458044157 ], "wc_reply_authors_avg": [ 916.0, 315.08094198158034 ], "reply_reviewers_avg": [ 0.4, 0.48989794855663565 ], "reply_authors_avg": [ 1.8, 0.7483314773547883 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.37499999999999994, "gs_citation": 5, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=8420608667553434018&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=6RR3wU4mSZ", "pdf": "https://openreview.net/pdf?id=6RR3wU4mSZ", "email": "sfu.ca;sfu.ca;sfu.ca", "author_num": 3, "aff_unique_index": "0;0;0", "aff_unique_norm": "Simon Fraser University", "aff_unique_dep": "", "aff_unique_url": "https://www.sfu.ca", "aff_unique_abbr": "SFU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "Canada" }, { "id": "6SNyuiph3F", "title": "Chat Vector: A Simple Approach to Equip LLMs With New Language Chat Capabilities", "track": "main", "status": "Reject", "tldr": "", "abstract": "With the advancements in conversational AI, such as ChatGPT, this paper focuses on exploring developing Large Language Models (LLMs) for non-English languages, especially emphasizing alignment with human preferences. We introduce a computationally efficient method, leveraging \u201cchat vector,\u201d to synergize pre-existing knowledge and behaviors in LLMs, restructuring the conventional training paradigm from continual pretrain $\\rightarrow$ SFT $\\rightarrow$ RLHF to continual pretrain + chat. Our empirical studies, primarily focused on Traditional Chinese, employ LLaMA2 as the base model and acquire the chat vector by subtracting the pre-trained weights, LLaMA2, from the weights of LLaMA2-chat. Evaluating from three distinct facets, which are toxicity, ability of instruction following and multi-turn dialogue demonstrates the chat vector's superior efficacy in \u201cchatting\u201d. To confirm the adaptability of our approach, we extend our experiments to include models pre-trained in both Korean and Simplified Chinese, illustrating the versatility of our methodology. 
Overall, we present a significant solution in aligning LLMs with human preferences efficiently across various languages, accomplished by the chat vector.", "keywords": "RLHF;LLM", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Shih-Cheng Huang;Pin-Zu Li;YU-CHI HSU;Kuang-Ming Chen;Yu Tung Lin;Shih-Kai Hsiao;Richard Tzong-Han Tsai;Hung-yi Lee", "authorids": "~Shih-Cheng_Huang2;~Pin-Zu_Li1;~YU-CHI_HSU1;~Kuang-Ming_Chen1;~Yu_Tung_Lin1;anna.shiker1822@gmail.com;~Richard_Tzong-Han_Tsai1;~Hung-yi_Lee2", "gender": "M;M;M;M;F;;M;Non-Binary", "homepage": ";https://github.com/aqweteddy;https://github.com/ba144220;;;;;https://speech.ee.ntu.edu.tw/~hylee/index.html", "dblp": ";;;37/10484.html;;;t/TzongHanTsai;81/8056", "google_scholar": ";;;;;;;DxLO11IAAAAJ", "orcid": ";;;;;;;", "linkedin": "%E4%B8%96%E4%B8%9E-%E9%BB%83-863b68192/;pin-zu-li-237b57181/;;kuang-ming-chen;judy-lin-3b9771247/;;;", "or_profile": "~Shih-Cheng_Huang2;~Pin-Zu_Li1;~YU-CHI_HSU1;~Kuang-Ming_Chen1;~Yu_Tung_Lin1;anna.shiker1822@gmail.com;~Richard_Tzong-Han_Tsai1;~Hung-yi_Lee2", "aff": "Appier Inc.;National Applied Research Laboratories;National Taiwan University;National Taiwan University;;;National Central University;National Taiwan University", "aff_domain": "appier.com;narlabs.org.tw;ntu.edu.tw;ntu.edu.tw;;;ncu.edu.tw;ntu.edu.tw", "position": "Researcher;Researcher;Undergrad student;Undergrad student;;;Full Professor;Full Professor", "bibtex": "@misc{\nhuang2024chat,\ntitle={Chat Vector: A Simple Approach to Equip {LLM}s With New Language Chat Capabilities},\nauthor={Shih-Cheng Huang and Pin-Zu Li and YU-CHI HSU and Kuang-Ming Chen and Yu Tung Lin and Shih-Kai Hsiao and Richard Tzong-Han Tsai and Hung-yi Lee},\nyear={2024},\nurl={https://openreview.net/forum?id=6SNyuiph3F}\n}", "github": "", "project": "", "reviewers": "uV1v;PhbB;X3rn;ERju", "site": "https://openreview.net/forum?id=6SNyuiph3F", "pdf_size": 707865, "rating": "5;5;5;6", "confidence": "4;4;3;3", "soundness": "2;3;3;3", "contribution": "2;2;3;2", "presentation": "3;2;3;3", "wc_summary": "99;67;71;113", "wc_strengths": "73;41;82;21", "wc_weaknesses": "263;314;288;88", "wc_questions": "28;54;4;13", "wc_review": "463;476;445;235", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "498;274;245;358", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 5.25, 0.4330127018922193 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 87.5, 19.20286436967152 ], "wc_strengths_avg": [ 54.25, 24.508926945094924 ], "wc_weaknesses_avg": [ 238.25, 88.60128385074339 ], "wc_questions_avg": [ 24.75, 18.93904696651867 ], "wc_review_avg": [ 404.75, 98.6214352967954 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 343.75, 98.25063613025617 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 10, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=8869576311636760884&as_sdt=40005&sciodt=0,10&hl=en", "gs_version_total": 0, "aff_unique_index": "0;1;2;2;3;2", "aff_unique_norm": "Appier Inc.;National Applied Research Laboratories;National Taiwan University;National Central University", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.appier.com;https://www.narlabs.org.tw;https://www.ntu.edu.tw;https://www.ncu.edu.tw", 
"aff_unique_abbr": "Appier;NARLabs;NTU;NCU", "aff_campus_unique_index": "0;0;0;0;0;0", "aff_campus_unique": "Taiwan", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "China" }, { "id": "6SmcAt0JmF", "title": "CAT: Collaborative Adversarial Training", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Adversarial training has proven to be effective in enhancing the robustness of neural networks. However, previous methods typically focus on a single adversarial training strategy and do not consider the characteristics of models trained using different strategies. Upon revisiting these methods, we have observed that different adversarial training methods exhibit distinct levels of robustness for different sample instances. For instance, a model trained using AT may correctly classify a sample instance that is misclassified by a model trained using TRADES, and vice versa. Motivated by this observation, we propose a Collaborative Adversarial Training (CAT) framework to enhance the robustness of neural networks. CAT utilizes different adversarial training methods to train robust models and facilitate the interaction of these models to leverage their combined knowledge during the training process.Extensive experiments conducted on various networks and datasets validate the effectiveness of our method.", "keywords": "adversarial training;adversarial robustness", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "xingbin liu", "authorids": "~xingbin_liu1", "gender": "", "homepage": "https://github.com/liuxingbin", "dblp": "", "google_scholar": "CqL88JwAAAAJ", "orcid": "", "linkedin": "", "or_profile": "~xingbin_liu1", "aff": "Megvii Technology Inc.", "aff_domain": "megvii.com", "position": "Researcher", "bibtex": "@misc{\nliu2024cat,\ntitle={{CAT}: Collaborative Adversarial Training},\nauthor={xingbin liu},\nyear={2024},\nurl={https://openreview.net/forum?id=6SmcAt0JmF}\n}", "github": "", "project": "", "reviewers": "aZir;9NK1;VPkg;V2Su", "site": "https://openreview.net/forum?id=6SmcAt0JmF", "pdf_size": 297957, "rating": "3;5;5;5", "confidence": "4;2;4;4", "soundness": "3;2;3;2", "contribution": "2;2;3;3", "presentation": "2;3;2;3", "wc_summary": "42;128;42;81", "wc_strengths": "9;26;45;48", "wc_weaknesses": "189;276;230;127", "wc_questions": "68;69;69;2", "wc_review": "308;499;386;258", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.5, 0.8660254037844386 ], "confidence_avg": [ 3.5, 0.8660254037844386 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 73.25, 35.39332564199075 ], "wc_strengths_avg": [ 32.0, 15.732132722552274 ], "wc_weaknesses_avg": [ 205.5, 54.78366544874485 ], "wc_questions_avg": [ 52.0, 28.8704000665041 ], "wc_review_avg": [ 362.75, 90.93232373584215 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 1, 0 ], "corr_rating_confidence": -0.3333333333333333, "gs_citation": 6, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=2458217275536159128&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 2, "aff_unique_index": "0", "aff_unique_norm": "Megvii Technology", "aff_unique_dep": "", "aff_unique_url": "https://www.megvii.com", "aff_unique_abbr": "Megvii", "aff_country_unique_index": "0", 
"aff_country_unique": "China" }, { "id": "6UQaXJm53B", "title": "DfPO: Degeneration-free Policy Optimization via Action Masking in Natural Language Action Spaces", "track": "main", "status": "Reject", "tldr": "", "abstract": "As the pre-training objectives (e.g., next token prediction) of language models (LMs) are inherently not aligned with task scores, optimizing LMs to achieve higher downstream task scores is essential. One of the promising approaches is to fine-tune LMs by using reinforcement learning (RL). However, conventional RL methods based on PPO and a penalty of KL divergence are vulnerable to the text degeneration problem which LMs do not generate natural texts anymore after RL fine-tuning. To address this problem, we provide Degeneration-free Policy Optimization (DfPO) that can fine-tune LMs to generate texts that achieve improved downstream task scores, while preserving the naturalness of the generated texts. To achieve this, we introduce action-masked policy with which a behavior policy can avoid to select tokens that potentially make policy optimization unexpected. Then, we devise clipped advantage functions to separately perform likelihood maximization and minimization, conditioned on texts sampled from the action-masked policy. Our experiments on the GRUE benchmark demonstrate that DfPO successfully improves the downstream task scores, while preserving the naturalness of the generated texts. Moreover, even DfPO does not perform hyperparameter search, it outperforms PPO and NLPO which require additional hyperparameter search for the penalty ratio of KL divergence.", "keywords": "Reinforcement learning;Natural language processing", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Youngsoo Jang;Geon-Hyeong Kim;Byoungjip Kim;Honglak Lee;Moontae Lee", "authorids": "~Youngsoo_Jang2;~Geon-Hyeong_Kim2;~Byoungjip_Kim1;~Honglak_Lee2;~Moontae_Lee1", "gender": ";M;;;", "homepage": "http://www.ysjang.me;https://sites.google.com/view/ghkim;;;https://moontae.people.uic.edu", "dblp": "195/0471;231/7707;;;132/1761", "google_scholar": "6EoBBggAAAAJ;https://scholar.google.co.kr/citations?user=IJL0uXoAAAAJ;;;BMvYy9cAAAAJ", "orcid": ";;;;0000-0001-5542-3463", "linkedin": ";;;;moontae-lee-975248123/", "or_profile": "~Youngsoo_Jang2;~Geon-Hyeong_Kim2;~Byoungjip_Kim1;~Honglak_Lee2;~Moontae_Lee1", "aff": "LG AI Research;LG AI Research;;;University of Illinois, Chicago", "aff_domain": "lgresearch.ai;lgresearch.ai;;;uic.edu", "position": "Researcher;Researcher;;;Assistant Professor", "bibtex": "@misc{\njang2024dfpo,\ntitle={Df{PO}: Degeneration-free Policy Optimization via Action Masking in Natural Language Action Spaces},\nauthor={Youngsoo Jang and Geon-Hyeong Kim and Byoungjip Kim and Honglak Lee and Moontae Lee},\nyear={2024},\nurl={https://openreview.net/forum?id=6UQaXJm53B}\n}", "github": "", "project": "", "reviewers": "wZxt;6zCc;99mP;hR6e", "site": "https://openreview.net/forum?id=6UQaXJm53B", "pdf_size": 1050988, "rating": "3;5;5;8", "confidence": "3;4;4;3", "soundness": "1;2;2;3", "contribution": "2;3;2;3", "presentation": "1;2;2;3", "wc_summary": "134;70;61;138", "wc_strengths": "94;47;28;219", "wc_weaknesses": "312;126;121;110", "wc_questions": "1134;120;88;1", "wc_review": "1674;363;298;468", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "1357;825;538;230", "reply_reviewers": "0;0;0;0", "reply_authors": "3;2;2;2", "rating_avg": [ 5.25, 1.7853571071357126 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.0, 0.7071067811865476 ], 
"contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.0, 0.7071067811865476 ], "wc_summary_avg": [ 100.75, 35.42156828826189 ], "wc_strengths_avg": [ 97.0, 74.42109915877352 ], "wc_weaknesses_avg": [ 167.25, 83.7716389955455 ], "wc_questions_avg": [ 335.75, 462.9224422081954 ], "wc_review_avg": [ 700.75, 565.1704941873735 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 737.5, 414.96776983279074 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 2.25, 0.4330127018922193 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.14002800840280097, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:EJnsjzBa9W8J:scholar.google.com/&scioq=DfPO:+Degeneration-free+Policy+Optimization+via+Action+Masking+in+Natural+Language+Action+Spaces&hl=en&as_sdt=0,44", "gs_version_total": 0, "aff_unique_index": "0;0;1", "aff_unique_norm": "LG;University of Illinois at Chicago", "aff_unique_dep": "LG AI Research;", "aff_unique_url": "https://www.lgaires.com;https://www.uic.edu", "aff_unique_abbr": "LG AI;UIC", "aff_campus_unique_index": "1", "aff_campus_unique": ";Chicago", "aff_country_unique_index": "0;0;1", "aff_country_unique": "South Korea;United States" }, { "id": "6Uc7Fgwrsm", "title": "OmniMixup: Generalize Mixup with Mixing-Pair Sampling Distribution", "track": "main", "status": "Reject", "tldr": "", "abstract": "Mixup is a widely-adopted data augmentation techniques to mitigates the overfitting issue in empirical risk minimization. Current works of modifying Mixup are modality-specific, thereby limiting the applicability across diverse modalities. Although alternative approaches try circumventing such barrier via mixing-up data from latent features based on sampling distribution, they still require domain knowledge for designing sampling distribution. Moreover, a unified theoretical framework for analyzing the generalization bound for this line of research remains absent. In this paper, we introduce OmniMixup, a generalization of prior works by introducing Mixing-Pair Sampling Distribution (MPSD), accompanied by a holistic theoretical analysis framwork. We find both theoretically and empirically that the Mahalanobis distance (M-Score), derived from the sampling distribution, offers significant insights into OmniMixup's generalization capabilities. Accordingly, we propose OmniEval, an evaluation framework designed to autonomously identify the optimal sampling distribution. The empirical study on both images and molecules demonstrates that 1) OmniEval is adept at determining the appropriate sampling distribution for OmniMixup, and 2) OmniMixup exhibits promising capability for application across various modalities and domains.", "keywords": "Mixup;Machine Learning;molecule property prediction;image classification;data augmentation", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Xingran Chen;Zhangyang Gao;Cheng Tan;Siyuan Li;Stan Z. 
Li", "authorids": "~Xingran_Chen1;~Zhangyang_Gao1;~Cheng_Tan1;~Siyuan_Li6;~Stan_Z._Li2", "gender": "M;M;M;M;M", "homepage": "https://www.chenxingran.com/;;https://chengtan9907.github.io/;https://lupin1998.github.io/;https://en.westlake.edu.cn/academics/School_of_Engineering/About/Our_People/Faculty/201912/t20191206_2497.shtml", "dblp": "203/8349;275/3266;70/1533-12.html;63/9705-2;l/StanZLi", "google_scholar": "X01oTv8AAAAJ;4SclT-QAAAAJ;6kTV6aMAAAAJ;https://scholar.google.com/citations?hl=zh-CN;https://scholar.google.com/citations?hl=zh-CN", "orcid": ";0000-0003-1026-6083;;0000-0001-6806-2468;", "linkedin": ";;;https://www.linkedin.cn/incareer/in/siyuan-li-lupin1998/;stan-z-li-%E6%9D%8E%E5%AD%90%E9%9D%92-55753224/", "or_profile": "~Xingran_Chen1;~Zhangyang_Gao1;~Cheng_Tan1;~Siyuan_Li6;~Stan_Z._Li1", "aff": "University of Michigan - Ann Arbor;Westlake University, China;Zhejiang University & Westlake University;Alibaba Group;Westlake University", "aff_domain": "umich.edu;westlake.edu.cn;westlake.edu.cn;alibaba-inc.com;westlake.edu.cn", "position": "MS student;PhD student;PhD student;Intern;Chair Professor", "bibtex": "@misc{\nchen2024omnimixup,\ntitle={OmniMixup: Generalize Mixup with Mixing-Pair Sampling Distribution},\nauthor={Xingran Chen and Zhangyang Gao and Cheng Tan and Siyuan Li and Stan Z. Li},\nyear={2024},\nurl={https://openreview.net/forum?id=6Uc7Fgwrsm}\n}", "github": "", "project": "", "reviewers": "AcyS;sgeX;39U8;CqYZ;wmTG", "site": "https://openreview.net/forum?id=6Uc7Fgwrsm", "pdf_size": 461374, "rating": "1;3;3;5;5", "confidence": "4;5;3;3;4", "soundness": "2;2;1;2;3", "contribution": "1;2;2;2;2", "presentation": "1;2;1;3;3", "wc_summary": "75;58;121;58;78", "wc_strengths": "19;48;93;85;43", "wc_weaknesses": "296;251;139;54;164", "wc_questions": "57;3;271;194;5", "wc_review": "447;360;624;391;290", "wc_reply_reviewers": "189;0;0;103;0", "wc_reply_authors": "1128;722;897;560;849", "reply_reviewers": "1;0;0;1;0", "reply_authors": "2;1;2;1;2", "rating_avg": [ 3.4, 1.4966629547095767 ], "confidence_avg": [ 3.8, 0.7483314773547882 ], "soundness_avg": [ 2.0, 0.6324555320336759 ], "contribution_avg": [ 1.8, 0.4000000000000001 ], "presentation_avg": [ 2.0, 0.8944271909999159 ], "wc_summary_avg": [ 78.0, 23.05645245912736 ], "wc_strengths_avg": [ 57.6, 27.56519544643208 ], "wc_weaknesses_avg": [ 180.8, 85.21361393580253 ], "wc_questions_avg": [ 106.0, 107.8702924812944 ], "wc_review_avg": [ 422.4, 112.83368291427875 ], "wc_reply_reviewers_avg": [ 58.4, 76.52084683274225 ], "wc_reply_authors_avg": [ 831.2, 188.79131335948696 ], "reply_reviewers_avg": [ 0.4, 0.48989794855663565 ], "reply_authors_avg": [ 1.6, 0.4898979485566356 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.2857142857142857, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:XDHue5wf3VoJ:scholar.google.com/&scioq=OmniMixup:+Generalize+Mixup+with+Mixing-Pair+Sampling+Distribution&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1;2;3;1", "aff_unique_norm": "University of Michigan;Westlake University;Zhejiang University;Alibaba Group", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.umich.edu;https://www.westlake.edu.cn;http://www.zju.edu.cn;https://www.alibaba.com", "aff_unique_abbr": "UM;WU;ZJU;Alibaba", "aff_campus_unique_index": "0", "aff_campus_unique": "Ann Arbor;", "aff_country_unique_index": "0;1;1;1;1", "aff_country_unique": "United States;China" }, { "id": "6W35Wcs077", "title": "Decomposition Ascribed Synergistic 
Learning for Unified Image Restoration", "track": "main", "status": "Reject", "tldr": "", "abstract": "Learning to restore multiple image degradations within a single model is quite beneficial for real-world applications. Nevertheless, existing works typically concentrate on regarding each degradation independently, while their relationship has been less exploited to ensure the synergistic learning. To this end, we revisit the diverse degradations through the lens of singular value decomposition, with the observation that the decomposed singular vectors and singular values naturally undertake the different types of degradation information, dividing various restoration tasks into two groups, \\ie, singular vector dominated and singular value dominated. The above analysis renders a more unified perspective to ascribe the diverse degradations, compared to previous task-level independent learning. The dedicated optimization of degraded singular vectors and singular values inherently utilizes the potential relationship among diverse restoration tasks, attributing to the Decomposition Ascribed Synergistic Learning (DASL). Specifically, DASL comprises two effective operators, namely, Singular VEctor Operator (SVEO) and Singular VAlue Operator (SVAO), to favor the decomposed optimization, which can be lightly integrated into existing convolutional image restoration backbone. Moreover, the congruous decomposition loss has been devised for auxiliary. Extensive experiments on blended five image restoration tasks demonstrate the effectiveness of our method, including image deraining, image dehazing, image denoising, image deblurring, and low-light image enhancement.", "keywords": "Image Restoration;Decomposition;Orthogonality;Signal formation", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "JingHao Zhang;Jie Huang;Man Zhou;Chongyi Li;Feng Zhao", "authorids": "~JingHao_Zhang2;~Jie_Huang4;~Man_Zhou5;~Chongyi_Li1;~Feng_Zhao6", "gender": "M;M;M;;M", "homepage": "https://jinghao99.github.io/;;https://zz.github.io;;https://bivlab123.github.io/", "dblp": ";;;;181/2734-4", "google_scholar": "Lis9e2MAAAAJ;https://scholar.google.com/citations?hl=zh-CN;;;https://scholar.google.co.uk/citations?hl=en", "orcid": "0000-0002-5407-4641;0000-0002-3518-3404;;;0000-0001-6767-8105", "linkedin": ";;;;", "or_profile": "~JingHao_Zhang2;~Jie_Huang4;~Man_Zhou5;~Chongyi_Li1;~Feng_Zhao6", "aff": "University of Science and Technology of China;University of Science and Technology of China;iim;;University of Science and Technology of China", "aff_domain": "ustc.edu.cn;ustc.edu.cn;iim.cn;;ustc.edu.cn", "position": "PhD student;PhD student;PhD student;;Full Professor", "bibtex": "@misc{\nzhang2024decomposition,\ntitle={Decomposition Ascribed Synergistic Learning for Unified Image Restoration},\nauthor={JingHao Zhang and Jie Huang and Man Zhou and Chongyi Li and Feng Zhao},\nyear={2024},\nurl={https://openreview.net/forum?id=6W35Wcs077}\n}", "github": "", "project": "", "reviewers": "5Pyv;4FV9;vj9U;Ym8K", "site": "https://openreview.net/forum?id=6W35Wcs077", "pdf_size": 43862690, "rating": "3;6;8;8", "confidence": "4;5;4;5", "soundness": "1;3;4;3", "contribution": "2;2;4;3", "presentation": "1;3;4;4", "wc_summary": "96;54;77;103", "wc_strengths": "32;18;151;55", "wc_weaknesses": "62;71;55;155", "wc_questions": "361;247;131;7", "wc_review": "551;390;414;320", "wc_reply_reviewers": "0;0;130;0", "wc_reply_authors": "1592;1300;563;672", 
"reply_reviewers": "0;0;1;0", "reply_authors": "3;2;1;1", "rating_avg": [ 6.25, 2.0463381929681126 ], "confidence_avg": [ 4.5, 0.5 ], "soundness_avg": [ 2.75, 1.0897247358851685 ], "contribution_avg": [ 2.75, 0.82915619758885 ], "presentation_avg": [ 3.0, 1.224744871391589 ], "wc_summary_avg": [ 82.5, 19.00657780874821 ], "wc_strengths_avg": [ 64.0, 51.93746239469156 ], "wc_weaknesses_avg": [ 85.75, 40.38177187791541 ], "wc_questions_avg": [ 186.5, 131.72983716683171 ], "wc_review_avg": [ 418.75, 83.80147671729897 ], "wc_reply_reviewers_avg": [ 32.5, 56.29165124598851 ], "wc_reply_authors_avg": [ 1031.75, 428.6562579736822 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.75, 0.82915619758885 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.3665083330689157, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=17089949665565746036&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "aff_unique_index": "0;0;1;0", "aff_unique_norm": "University of Science and Technology of China;Indian Institute of Management", "aff_unique_dep": ";", "aff_unique_url": "http://www.ustc.edu.cn;https://www.iim.edu", "aff_unique_abbr": "USTC;IIM", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;1;0", "aff_country_unique": "China;India" }, { "id": "6YZmkpivVH", "title": "TpopT: Efficient Trainable Template Optimization on Low-Dimensional Manifolds", "track": "main", "status": "Reject", "tldr": "", "abstract": "In scientific and engineering scenarios, a recurring task is the detection of low-dimensional families of signals or patterns. A classic family of approaches, exemplified by template matching, aims to cover the search space with a dense template bank. While simple and highly interpretable, it suffers from poor computational efficiency due to unfavorable scaling in the signal space dimensionality. In this work, we study TpopT (TemPlate OPTimization) as an alternative scalable framework for detecting low-dimensional families of signals which maintains high interpretability. We provide a theoretical analysis of the convergence of Riemannian gradient descent for TpopT, and prove that it has a superior dimension scaling to covering. We also propose a practical TpopT framework for nonparametric signal sets, which incorporates techniques of embedding and kernel interpolation, and is further configurable into a trainable network architecture by unrolled optimization. The proposed trainable TpopT exhibits significantly improved efficiency-accuracy tradeoffs for gravitational wave detection, where matched filtering is currently a method of choice. 
We further illustrate the general applicability of this approach with experiments on handwritten digit data.", "keywords": "Signal Detection;Scientific Machine Learning;Unrolled Optimization;Template Optimization", "primary_area": "optimization", "supplementary_material": "/attachment/e84caf366508589af520c0b379baed754ab3aa75.zip", "author": "Jingkai Yan;Shiyu Wang;Xinyu Rain Wei;Jimmy Wang;Zsuzsanna Marka;Szabolcs Marka;John Wright", "authorids": "~Jingkai_Yan1;~Shiyu_Wang4;~Xinyu_Rain_Wei1;~Jimmy_Wang1;~Zsuzsanna_Marka1;~Szabolcs_Marka1;~John_Wright1", "gender": ";;F;M;;M;", "homepage": ";http://www.linkedin.com/in/shiyuwang3601;https://www.linkedin.com/in/xinyuwei/;;;https://datascience.columbia.edu/people/szabolcs-marka/;http://www.columbia.edu/~jw2966", "dblp": "209/9672;;;;254/2791;289/7409;", "google_scholar": "https://scholar.google.com/citations?hl=en;;;;;EtCHb8YAAAAJ;nujTx04AAAAJ", "orcid": ";;;;0000-0003-1306-5260;0000-0002-3957-1324;", "linkedin": ";;;jameswang771/;;szabolcs-marka-94130624;", "or_profile": "~Jingkai_Yan1;~Shiyu_Wang4;~Xinyu_Rain_Wei1;~Jimmy_Wang1;~Zsuzsanna_Marka1;~Szabolcs_Marka1;~John_Wright1", "aff": "Apple;Columbia University;Columbia University;Columbia University;Columbia University;Columbia University;Columbia University", "aff_domain": "apple.com;columbia.edu;columbia.edu;columbia.edu;columbia.edu;columbia.edu;columbia.edu", "position": "Researcher;PhD student;Undergrad student;Undergrad student;Researcher;Full Professor;Associate Professor", "bibtex": "@misc{\nyan2024tpopt,\ntitle={TpopT: Efficient Trainable Template Optimization on Low-Dimensional Manifolds},\nauthor={Jingkai Yan and Shiyu Wang and Xinyu Rain Wei and Jimmy Wang and Zsuzsanna Marka and Szabolcs Marka and John Wright},\nyear={2024},\nurl={https://openreview.net/forum?id=6YZmkpivVH}\n}", "github": "", "project": "", "reviewers": "X8Hz;Y4xN;wGVm;uRtk", "site": "https://openreview.net/forum?id=6YZmkpivVH", "pdf_size": 1025707, "rating": "3;5;6;8", "confidence": "4;4;3;4", "soundness": "2;4;2;4", "contribution": "2;2;3;4", "presentation": "2;3;3;3", "wc_summary": "213;119;73;51", "wc_strengths": "23;72;33;42", "wc_weaknesses": "197;315;303;5", "wc_questions": "283;128;49;185", "wc_review": "716;634;458;283", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "2294;1433;1782;890", "reply_reviewers": "0;0;0;0", "reply_authors": "4;2;3;2", "rating_avg": [ 5.5, 1.8027756377319946 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 3.0, 1.0 ], "contribution_avg": [ 2.75, 0.82915619758885 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 114.0, 62.20128616033595 ], "wc_strengths_avg": [ 42.5, 18.309833423600555 ], "wc_weaknesses_avg": [ 205.0, 124.26584406022437 ], "wc_questions_avg": [ 161.25, 85.2829848211236 ], "wc_review_avg": [ 522.75, 166.87926024524438 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 1599.75, 511.55369952723436 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 2.75, 0.82915619758885 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.16012815380508713, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:oLJeAMIrlhMJ:scholar.google.com/&scioq=TpopT:+Efficient+Trainable+Template+Optimization+on+Low-Dimensional+Manifolds&hl=en&as_sdt=0,5", "gs_version_total": 3, "aff_unique_index": "0;1;1;1;1;1;1", "aff_unique_norm": "Apple;Columbia University", "aff_unique_dep": "Apple Inc.;", "aff_unique_url": "https://www.apple.com;https://www.columbia.edu", 
"aff_unique_abbr": "Apple;Columbia", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "6Z8rZlKpNT", "title": "Normalizing Flows For Out of Distribution Detection via Latent Density Estimation", "track": "main", "status": "Reject", "tldr": "", "abstract": "Out-of-distribution (OOD) detection is a critical task for safe deployment of learning systems in the open world setting. In this work, we propose the use of latent density estimation via normalizing flows for the OOD task and present a fully unsupervised approach with no requirement for exposure to OOD data, avoiding researcher bias in OOD sample selection. This is a fully post-hoc method which can be applied to any pretrained model, and involves training a lightweight auxiliary normalizing flow model to perform the out-of-distribution detection via density thresholding. Experiments on OOD detection in image classification show strong results, including 98.2\\% AUROC for ImageNet-1k vs. Textures, which exceeds the state of the art by 8.4\\%. Further, we provide insights into training pitfalls that have plagued normalizing flows for use in OOD detection.", "keywords": "Out-of-distribution detection;normalizing flow;image classification", "primary_area": "probabilistic methods (Bayesian methods, variational inference, sampling, UQ, etc.)", "supplementary_material": "", "author": "Evan Cook;Marc-Antoine Lavoie;Steven L. Waslander", "authorids": "~Evan_Cook1;~Marc-Antoine_Lavoie1;~Steven_L._Waslander1", "gender": ";M;M", "homepage": ";;https://trailab.utias.utoronto.ca", "dblp": ";;18/7142", "google_scholar": ";https://scholar.google.com/citations?hl=en;jY_Bcd8AAAAJ", "orcid": ";;0000-0003-4217-4415", "linkedin": "evan-d-cook/;;", "or_profile": "~Evan_Cook1;~Marc-Antoine_Lavoie1;~Steven_Lake_Waslander1", "aff": "University of Toronto;University of Toronto;University of Toronto", "aff_domain": "utoronto.ca;utoronto.ca;utoronto.ca", "position": "MS student;PhD student;Full Professor", "bibtex": "@misc{\ncook2024normalizing,\ntitle={Normalizing Flows For Out of Distribution Detection via Latent Density Estimation},\nauthor={Evan Cook and Marc-Antoine Lavoie and Steven L. 
Waslander},\nyear={2024},\nurl={https://openreview.net/forum?id=6Z8rZlKpNT}\n}", "github": "", "project": "", "reviewers": "avuP;gGnx;wdco;E6xa;qftB", "site": "https://openreview.net/forum?id=6Z8rZlKpNT", "pdf_size": 10875232, "rating": "3;3;3;3;5", "confidence": "5;3;4;4;4", "soundness": "2;2;2;2;2", "contribution": "2;2;1;1;1", "presentation": "1;2;1;3;2", "wc_summary": "45;52;24;51;104", "wc_strengths": "33;52;15;66;69", "wc_weaknesses": "387;105;145;232;442", "wc_questions": "24;5;3;58;89", "wc_review": "489;214;187;407;704", "wc_reply_reviewers": "0;11;0;0;0", "wc_reply_authors": "192;242;224;489;539", "reply_reviewers": "0;1;0;0;0", "reply_authors": "1;1;1;1;1", "rating_avg": [ 3.4, 0.8 ], "confidence_avg": [ 4.0, 0.6324555320336759 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 1.4, 0.4898979485566356 ], "presentation_avg": [ 1.8, 0.7483314773547883 ], "wc_summary_avg": [ 55.2, 26.40757467091592 ], "wc_strengths_avg": [ 47.0, 20.445048300260872 ], "wc_weaknesses_avg": [ 262.2, 132.10813752377254 ], "wc_questions_avg": [ 35.8, 33.12642449767255 ], "wc_review_avg": [ 400.2, 189.9214574501786 ], "wc_reply_reviewers_avg": [ 2.2, 4.4 ], "wc_reply_authors_avg": [ 337.2, 146.10051334612072 ], "reply_reviewers_avg": [ 0.2, 0.4000000000000001 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:YVVxFzWeQzIJ:scholar.google.com/&scioq=Normalizing+Flows+For+Out+of+Distribution+Detection+via+Latent+Density+Estimation&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;0", "aff_unique_norm": "University of Toronto", "aff_unique_dep": "", "aff_unique_url": "https://www.utoronto.ca", "aff_unique_abbr": "U of T", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "Canada" }, { "id": "6ZE9Zktbh6", "title": "Screening Unlearnable Examples via Iterative Self Regression", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Deep neural networks are proven to be vulnerable to data poisoning attacks. Recently, a specific type of data poisoning attack known as availability attacks, has led to the failure of data utilization for model learning by adding imperceptible perturbations to images. Consequently, it is quite beneficial and challenging to detect poisoned samples, also known as Unlearnable Examples (UEs), from a mixed dataset. To tackle this problem, in this paper, we introduce a novel Iterative Self-Regression approach for identifying UEs within a mixed dataset. This method leverages the distinction between the inherent semantic mapping rules and shortcuts, without the need for any additional information. Our investigation reveals a critical observation: when training a classifier on a mixed dataset containing both UEs and clean data, the model tends to quickly adapt to the UEs compared to the clean data. Due to the accuracy gaps between training with clean/poisoned samples, we employ a model to misclassify clean samples while correctly identifying the poisoned ones for identifying tainted samples. Furthermore, we find that it is more effective to differentiate between clean and poisoned samples and build the Iterative Self Regression algorithm. \nWith incorporated additional classes and iterative refinement, the model becomes more capable of differentiating between clean and poisoned samples. 
\nExtensive experiments demonstrate that our method outperforms state-of-the-art detection approaches across various types of attacks, datasets, and poisoning ratios, and it significantly reduces the Half Total Error Rate (HTER) in comparison to existing methods.", "keywords": "data poisoning attack;iterative self regression;availability attacks detection;unlearnable examples", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "Yi Yu;Qichen Zheng;SIYUAN YANG;Wenhan Yang;Jun Liu;Shijian Lu;Yap-peng Tan;Kwok-Yan Lam;Alex Kot", "authorids": "~Yi_Yu5;~Qichen_Zheng1;~SIYUAN_YANG1;~Wenhan_Yang6;~Jun_Liu8;~Shijian_Lu1;~Yap-peng_Tan1;~Kwok-Yan_Lam1;~Alex_Kot1", "gender": ";M;M;M;M;M;M;M;", "homepage": "https://github.com/yuyi-sd;https://github.com/QichenZheng;;https://flyywh.github.io/;;https://personal.ntu.edu.sg/shijian.lu/;https://personal.ntu.edu.sg/eyptan/;https://personal.ntu.edu.sg/kwokyan.lam/;https://www.ntu.edu.sg/home/eackot/", "dblp": "99/111-11.html;285/4546;201/7699-1.html;156/2359.html;95/3736-36;42/2718;93/4472.html;10/1993;", "google_scholar": "https://scholar.google.com/citations?hl=en;d6AbpzgAAAAJ;lzLsF2MAAAAJ;S8nAnakAAAAJ;Q5Ild8UAAAAJ;https://scholar.google.com.sg/scholar?hl=en;https://scholar.google.com.sg/citations?user=t9EqYQIAAAAJ;https://scholar.google.com.sg/citations?user=NDMIYKsAAAAJ;", "orcid": "0000-0003-2730-9553;;0000-0003-4681-0431;;;;0000-0002-0645-9109;;", "linkedin": "%E7%9B%8A-%E4%BD%99-6b453a229;;;;;;;;", "or_profile": "~Yi_Yu5;~Qichen_Zheng1;~SIYUAN_YANG1;~Wenhan_Yang6;~Jun_Liu8;~Shijian_Lu1;~Yap-peng_Tan1;~Kwok-Yan_Lam1;~Alex_Kot1", "aff": "Nanyang Technological University;Nanyang Technological University;Nanyang Technological University;Peng Cheng Laboratory;Singapore University of Technology and Design;Nanyang Technological University;Nanyang Technological University;Nanyang Technological University;Nanyang Technological University", "aff_domain": "ntu.edu.sg;ntu.edu;ntu.edu.sg;pcl.ac.cn;sutd.edu.sg;ntu.edu.sg;ntu.edu.sg;ntu.edu.sg;ntu.edu.sg", "position": "PhD student;PhD student;PhD student;Researcher;Assistant Professor;Associate Professor;Full Professor;Full Professor;Full Professor", "bibtex": "@misc{\nyu2024screening,\ntitle={Screening Unlearnable Examples via Iterative Self Regression},\nauthor={Yi Yu and Qichen Zheng and SIYUAN YANG and Wenhan Yang and Jun Liu and Shijian Lu and Yap-peng Tan and Kwok-Yan Lam and Alex Kot},\nyear={2024},\nurl={https://openreview.net/forum?id=6ZE9Zktbh6}\n}", "github": "", "project": "", "reviewers": "6SZH;Ymu2;cckS;cGpA", "site": "https://openreview.net/forum?id=6ZE9Zktbh6", "pdf_size": 793902, "rating": "1;3;5;5", "confidence": "5;4;4;4", "soundness": "2;2;2;3", "contribution": "1;2;3;3", "presentation": "1;2;3;2", "wc_summary": "36;90;92;63", "wc_strengths": "7;43;45;53", "wc_weaknesses": "654;206;325;115", "wc_questions": "16;166;3;17", "wc_review": "713;505;465;248", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 3.5, 1.6583123951777 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.82915619758885 ], "presentation_avg": [ 2.0, 0.7071067811865476 ], "wc_summary_avg": [ 70.25, 22.851422275210794 ], "wc_strengths_avg": [ 37.0, 17.72004514666935 ], "wc_weaknesses_avg": [ 325.0, 204.0232829850554 ], "wc_questions_avg": [ 50.5, 66.91225597751132 ], "wc_review_avg": [ 482.75, 
165.024808740989 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 9, 0 ], "corr_rating_confidence": -0.8703882797784891, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:5V7wE0J09X8J:scholar.google.com/&scioq=Screening+Unlearnable+Examples+via+Iterative+Self+Regression&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;0;1;2;0;0;0;0", "aff_unique_norm": "Nanyang Technological University;Pengcheng Laboratory;Singapore University of Technology and Design", "aff_unique_dep": ";Peng Cheng Laboratory;", "aff_unique_url": "https://www.ntu.edu.sg;http://www.pcl.ac.cn;https://www.sutd.edu.sg", "aff_unique_abbr": "NTU;PCL;SUTD", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;1;0;0;0;0;0", "aff_country_unique": "Singapore;China" }, { "id": "6ZbMLZb4gL", "title": "Big Picture Thinking: Enhance Multi-Agent Imitation Learning through Global Dependencies", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Multi-agent reinforcement learning (MARL) has emerged as a promising approach for solving complex problems involving multi-agent collaboration or competition. Recently, researchers have turned to imitation learning to avoid the explicit design of intricate reward functions in MARL. By formulating the problem as a distribution-matching task based on expert trajectories, imitation learning enables agents to continually approximate expert policies without requiring manual reward engineering. However, classical multi-agent imitation learning frameworks, such as MAGAIL, often treat individual agent's distribution matching independently, disregarding the intricate dependencies that arise from agent cooperation. This neglect results in inaccurate estimations of action-value functions, weak feedback from the discriminator, and a significant vanishing gradient problem. This paper proposed a novel multi-agent joint distribution matching framework based on the Transformer architecture. It explicitly models global dependencies among agents within the generator and discriminator components sequentially and autoregressively. We also theoretically prove the effectiveness of this framework in enhancing reward variance and advantage gradient. 
Extensive experiments demonstrated the remarkable performance improvements achieved by our proposed method on various benchmarks.", "keywords": "Multi-agent reinforcement learning;Generative adversarial imitation learning;Complex dependency;Joint distribution matching;Transformer", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/851cac550a088a88f457f28cd3bc58c8ff7325a6.zip", "author": "Tianchen Zhu", "authorids": "~Tianchen_Zhu1", "gender": "M", "homepage": "https://zhutc.tk", "dblp": "https://dblp.uni-trier.de/pid/163/4107", "google_scholar": "P60wcZwAAAAJ", "orcid": "", "linkedin": "", "or_profile": "~Tianchen_Zhu1", "aff": "Beihang University", "aff_domain": "buaa.edu.cn", "position": "PhD student", "bibtex": "@misc{\nzhu2024big,\ntitle={Big Picture Thinking: Enhance Multi-Agent Imitation Learning through Global Dependencies},\nauthor={Tianchen Zhu},\nyear={2024},\nurl={https://openreview.net/forum?id=6ZbMLZb4gL}\n}", "github": "", "project": "", "reviewers": "", "site": "https://openreview.net/forum?id=6ZbMLZb4gL", "pdf_size": 798943, "rating": "", "confidence": "", "soundness": "", "contribution": "", "presentation": "", "wc_summary": "", "wc_strengths": "", "wc_weaknesses": "", "wc_questions": "", "wc_review": "", "wc_reply_reviewers": "", "wc_reply_authors": "", "reply_reviewers": "", "reply_authors": "", "rating_avg": [ 0, 0 ], "confidence_avg": [ 0, 0 ], "soundness_avg": [ 0, 0 ], "contribution_avg": [ 0, 0 ], "presentation_avg": [ 0, 0 ], "wc_summary_avg": [ 0, 0 ], "wc_strengths_avg": [ 0, 0 ], "wc_weaknesses_avg": [ 0, 0 ], "wc_questions_avg": [ 0, 0 ], "wc_review_avg": [ 0, 0 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 0, 0 ], "authors#_avg": [ 1, 0 ], "corr_rating_confidence": 0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:nTV4pdGrPvYJ:scholar.google.com/&scioq=Big+Picture+Thinking:+Enhance+Multi-Agent+Imitation+Learning+through+Global+Dependencies&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0", "aff_unique_norm": "Beihang University", "aff_unique_dep": "", "aff_unique_url": "http://www.buaa.edu.cn/", "aff_unique_abbr": "BUAA", "aff_country_unique_index": "0", "aff_country_unique": "China" }, { "id": "6ZuDeSHzjj", "title": "Outliers Memorized Last: Trends in Memorization of Diffusion Models Based on Training Distribution and Epoch", "track": "main", "status": "Reject", "tldr": "", "abstract": "Memorization and replication of training data in diffusion models like Stable Diffusion is a poorly understood phenomenon with a number of privacy and legal issues tied to it. This paper analyzes how the location of a data point in the training dataset's distribution affects its likelihood of memorization over training epochs. Importantly, it finds that memorization of 'outliers' is less likely early in the training process until eventually matching with the rest of the dataset. It then suggests applications utilizing this difference in memorization rate, including hyperparameter tuning and anomaly detection. 
It then suggests research that could be done from this conclusion to further improve memorization understanding.", "keywords": "Diffusion Models;Generative AI;Memorization", "primary_area": "generative models", "supplementary_material": "/attachment/81b134131e59b8d7087486d7e50684b54846fea0.zip", "author": "Aryan Janolkar", "authorids": "~Aryan_Janolkar1", "gender": "M", "homepage": "", "dblp": "", "google_scholar": "", "orcid": "", "linkedin": "aryan-janolkar-99b152197/", "or_profile": "~Aryan_Janolkar1", "aff": "University of California, Los Angeles", "aff_domain": "ucla.edu", "position": "Undergrad student", "bibtex": "@misc{\njanolkar2024outliers,\ntitle={Outliers Memorized Last: Trends in Memorization of Diffusion Models Based on Training Distribution and Epoch},\nauthor={Aryan Janolkar},\nyear={2024},\nurl={https://openreview.net/forum?id=6ZuDeSHzjj}\n}", "github": "", "project": "", "reviewers": "uuB7;FcWa;ehcz;c1Ba", "site": "https://openreview.net/forum?id=6ZuDeSHzjj", "pdf_size": 234421, "rating": "1;1;1;3", "confidence": "4;5;5;4", "soundness": "1;2;1;2", "contribution": "1;2;1;2", "presentation": "1;1;1;2", "wc_summary": "45;132;55;75", "wc_strengths": "14;45;48;12", "wc_weaknesses": "18;63;453;49", "wc_questions": "1;1;77;5", "wc_review": "78;241;633;141", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 1.5, 0.8660254037844386 ], "confidence_avg": [ 4.5, 0.5 ], "soundness_avg": [ 1.5, 0.5 ], "contribution_avg": [ 1.5, 0.5 ], "presentation_avg": [ 1.25, 0.4330127018922193 ], "wc_summary_avg": [ 76.75, 33.677700337166726 ], "wc_strengths_avg": [ 29.75, 16.798437427332342 ], "wc_weaknesses_avg": [ 145.75, 178.13671014139675 ], "wc_questions_avg": [ 21.0, 32.37282811247729 ], "wc_review_avg": [ 273.25, 215.68075366151706 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 6, 0 ], "authors#_avg": [ 1, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6203931028012849713&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 0, "aff_unique_index": "0", "aff_unique_norm": "University of California, Los Angeles", "aff_unique_dep": "", "aff_unique_url": "https://www.ucla.edu", "aff_unique_abbr": "UCLA", "aff_campus_unique_index": "0", "aff_campus_unique": "Los Angeles", "aff_country_unique_index": "0", "aff_country_unique": "United States" }, { "id": "6aRMQVlPVE", "title": "Rank-adaptive spectral pruning of convolutional layers during training", "track": "main", "status": "Reject", "tldr": "", "abstract": "The computing cost and memory demand of deep learning pipelines have grown fast in recent years and thus a variety of techniques have been developed to reduce model parameters. The majority of these techniques focus on reducing inference costs by pruning the network after a pass of full training. A smaller number of methods addresses the reduction of training costs, mostly based on compressing the network via low-rank layer factorizations. Despite their efficiency for linear layers, these methods fail to effectively handle convolutional filters. In this work, we propose a low-parametric training method that factorizes the convolutions into tensor Tucker format and adaptively prunes the Tucker ranks of the convolutional kernel during training. 
Leveraging fundamental results from geometric integration theory of differential equations on tensor manifolds, we obtain a robust training algorithm that provably approximates the full baseline performance and guarantees loss descent. \nA variety of experiments against the full model and alternative low-rank baselines are implemented, \nshowing that the proposed method drastically reduces the training costs, while achieving high performance, comparable to or better than the full baseline, outperforming competing low-rank approaches.", "keywords": "Convolutional neural networks;Neural Network Compression;Low-Rank Tensors;Dynamical Low-Rank Approximation;Neural Network Training;Pruning", "primary_area": "optimization", "supplementary_material": "/attachment/9af1937b3d262e44f4cbaa472d4994cb713de705.zip", "author": "Emanuele Zangrando;Steffen Schotth\u00f6fer;Gianluca Ceruti;Jonas Kusch;Francesco Tudisco", "authorids": "~Emanuele_Zangrando1;~Steffen_Schotth\u00f6fer1;~Gianluca_Ceruti1;~Jonas_Kusch1;~Francesco_Tudisco1", "gender": "M;M;M;M;M", "homepage": ";https://scsteffen.github.io/;;;https://ftudisco.gitlab.io/", "dblp": "321/1701;;;236/0493;136/5777", "google_scholar": "https://scholar.google.it/citations?hl=it;dZqiHeMAAAAJ;eyptuo8AAAAJ;https://scholar.google.de/citations?user=8JGYQTYAAAAJ;uND_5REAAAAJ", "orcid": ";;;0000-0002-2061-2114;0000-0002-8150-4475", "linkedin": ";steffen-schotthoefer/;;;", "or_profile": "~Emanuele_Zangrando1;~Steffen_Schotth\u00f6fer1;~Gianluca_Ceruti1;~Jonas_Kusch1;~Francesco_Tudisco1", "aff": "Gran Sasso Science Institute;Oak Ridge National Laboratory;Universit\u00e4t Innsbruck;Norwegian University of Life Sciences;Gran Sasso Science Institute", "aff_domain": "gssi.it;ornl.gov;uibk.ac.at;nmbu.no;gssi.it", "position": "PhD student;Researcher;Postdoc;Associate Professor;Associate Professor", "bibtex": "@misc{\nzangrando2024rankadaptive,\ntitle={Rank-adaptive spectral pruning of convolutional layers during training},\nauthor={Emanuele Zangrando and Steffen Schotth{\\\"o}fer and Gianluca Ceruti and Jonas Kusch and Francesco Tudisco},\nyear={2024},\nurl={https://openreview.net/forum?id=6aRMQVlPVE}\n}", "github": "", "project": "", "reviewers": "SS8V;T5Ao;AtDm", "site": "https://openreview.net/forum?id=6aRMQVlPVE", "pdf_size": 395678, "rating": "3;5;5", "confidence": "4;3;2", "soundness": "2;3;2", "contribution": "2;2;2", "presentation": "3;3;2", "wc_summary": "84;62;80", "wc_strengths": "66;11;59", "wc_weaknesses": "259;26;62", "wc_questions": "97;104;46", "wc_review": "506;203;247", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "804;401;414", "reply_reviewers": "0;0;0", "reply_authors": "2;1;1", "rating_avg": [ 4.333333333333333, 0.9428090415820634 ], "confidence_avg": [ 3.0, 0.816496580927726 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 75.33333333333333, 9.568466729604882 ], "wc_strengths_avg": [ 45.333333333333336, 24.44494948973214 ], "wc_weaknesses_avg": [ 115.66666666666667, 102.41202186375494 ], "wc_questions_avg": [ 82.33333333333333, 25.84999462712173 ], "wc_review_avg": [ 318.6666666666667, 133.6770569527754 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 539.6666666666666, 186.98722475672562 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.3333333333333333, 0.4714045207910317 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.8660254037844385, 
"gs_citation": 11, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6015670969082691589&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "aff_unique_index": "0;1;2;3;0", "aff_unique_norm": "Gran Sasso Science Institute;Oak Ridge National Laboratory;University of Innsbruck;Norwegian University of Life Sciences", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.gssi.it;https://www.ornl.gov;https://www.uibk.ac.at;https://www.nmbu.no", "aff_unique_abbr": ";ORNL;UIBK;NMBU", "aff_campus_unique_index": "1", "aff_campus_unique": ";Innsbruck", "aff_country_unique_index": "0;1;2;3;0", "aff_country_unique": "Italy;United States;Austria;Norway" }, { "id": "6bAfAcuuZD", "title": "Emergence of Surprise and Predictive Signals from Local Contrastive Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "Hierarchical predictive models are often used to model cortical representations. These models exploit the local or global computation of predictive signals in the neural network, but their biological plausibility is limited as it is currently unknown whether cortical circuits perform such computations at all. This paper seeks to further investigate the inverted Forward-Forward Algorithm, a biologically plausible innovative approach to learning with only forward passes, in order to demonstrate that hierarchical predictive computations can emerge from a simpler contrastive constraint on the network's representation. Through the identification of compelling similarities between our model and hierarchical predictive coding, as well as the examination of the emergent properties of resulting representations, we advance the hypothesis that the computational properties that emerge in neocortical circuits, widely acknowledged as the basis of human intelligence, may be attributed to local learning principles.", "keywords": "Forward Forward Algorithm;Contrastive Learning;Predictive Coding;Cortical Representations;Biological Plausibility", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/85112c502d5cd9b6eba345889c23a1fe0a5b3054.pdf", "author": "Andrew Lawrence Smith;Linxing Preston Jiang;Stefano Recanatesi;Matthew Storm Bull", "authorids": "~Andrew_Lawrence_Smith1;~Linxing_Preston_Jiang1;~Stefano_Recanatesi1;~Matthew_Storm_Bull1", "gender": "M;M;M;", "homepage": "https://github.com/and-rewsmith;https://lpjiang97.github.io/;;", "dblp": ";;;", "google_scholar": ";B706p2YAAAAJ;;79lMvCMRCK8C", "orcid": ";;0000-0002-3576-9261;", "linkedin": "and-rewsmith/;;;", "or_profile": "~Andrew_Lawrence_Smith1;~Linxing_Preston_Jiang1;~Stefano_Recanatesi1;~Matthew_Storm_Bull1", "aff": ";Department of Computer Science, University of Washington;University of Washington;Allen Institute + University of Washington", "aff_domain": ";cs.washington.edu;uw.edu;alleninstitute.org", "position": ";PhD student;Postdoc;Postdoc", "bibtex": "@misc{\nsmith2024emergence,\ntitle={Emergence of Surprise and Predictive Signals from Local Contrastive Learning},\nauthor={Andrew Lawrence Smith and Linxing Preston Jiang and Stefano Recanatesi and Matthew Storm Bull},\nyear={2024},\nurl={https://openreview.net/forum?id=6bAfAcuuZD}\n}", "github": "", "project": "", "reviewers": "3133;mvwV;D7tC;fE2s", "site": "https://openreview.net/forum?id=6bAfAcuuZD", "pdf_size": 707504, "rating": "3;3;8;8", "confidence": "4;4;4;4", "soundness": "2;1;3;3", "contribution": "2;2;3;3", "presentation": "2;1;4;3", "wc_summary": "153;163;63;219", 
"wc_strengths": "34;60;178;105", "wc_weaknesses": "736;286;102;36", "wc_questions": "331;85;180;36", "wc_review": "1254;594;523;396", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "692;305;452;148", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 5.5, 2.5 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.25, 0.82915619758885 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.5, 1.118033988749895 ], "wc_summary_avg": [ 149.5, 55.91734972260399 ], "wc_strengths_avg": [ 94.25, 54.61856369404087 ], "wc_weaknesses_avg": [ 290.0, 273.3093485411723 ], "wc_questions_avg": [ 158.0, 112.50111110562419 ], "wc_review_avg": [ 691.75, 332.2742654795884 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 399.25, 200.30898007827807 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:bpC6jt93z8QJ:scholar.google.com/&scioq=Emergence+of+Surprise+and+Predictive+Signals+from+Local+Contrastive+Learning&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;0;1+0", "aff_unique_norm": "University of Washington;Allen Institute for Artificial Intelligence", "aff_unique_dep": "Department of Computer Science;", "aff_unique_url": "https://www.washington.edu;https://allenai.org", "aff_unique_abbr": "UW;AI2", "aff_campus_unique_index": "0;", "aff_campus_unique": "Seattle;", "aff_country_unique_index": "0;0;0+0", "aff_country_unique": "United States" }, { "title": "Unmasking and Improving Data Credibility: A Study with Datasets for Training Harmless Language Models", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19388", "id": "6bcAD6g688", "author_site": "Zhaowei Zhu, Jialu Wang, Hao Cheng, Yang Liu", "tldr": "", "abstract": "Language models have shown promise in various tasks but can be affected by undesired data during training, fine-tuning, or alignment. For example, if some unsafe conversations are wrongly annotated as safe ones, the model fine-tuned on these samples may be harmful. Therefore, the correctness of annotations, i.e., the credibility of the dataset, is important. This study focuses on the credibility of real-world datasets, including the popular benchmarks Jigsaw Civil Comments, Anthropic Harmless & Red Team, PKU BeaverTails & SafeRLHF, that can be used for training a harmless language model. Given the cost and difficulty of cleaning these datasets by humans, we introduce a systematic framework for evaluating the credibility of datasets, identifying label errors, and evaluating the influence of noisy labels in the curated language data, specifically focusing on unsafe comments and conversation classification. With the framework, we find and fix an average of **6.16\\%** label errors in **11** datasets constructed from the above benchmarks. The data credibility and downstream learning performance can be remarkably improved by directly fixing label errors, indicating the significance of cleaning existing real-world datasets. 
Code is available at [https://github.com/Docta-ai/docta](https://github.com/Docta-ai/docta).", "keywords": "Label errors;dataset cleaning;AI safety;toxicity;harmless;language models", "primary_area": "datasets and benchmarks", "supplementary_material": "/attachment/e944516261150a416fc2926d2276766a0a3dc06c.zip", "author": "Zhaowei Zhu;Jialu Wang;Hao Cheng;Yang Liu", "authorids": "~Zhaowei_Zhu1;~Jialu_Wang1;~Hao_Cheng5;~Yang_Liu3", "gender": "M;;M;M", "homepage": "https://www.zzw.ai;https://people.ucsc.edu/~jwang470/;https://haochenglouis.github.io;http://www.yliuu.com", "dblp": "202/1712;195/2701;;51/3710-18", "google_scholar": "YS8pSQoAAAAJ;HOtDeN0AAAAJ;ftlVqVIAAAAJ;jKrIVCIAAAAJ", "orcid": "0000-0003-3894-5862;;0000-0001-8864-7818;0000-0001-8420-6011", "linkedin": ";;;", "or_profile": "~Zhaowei_Zhu1;~Jialu_Wang1;~Hao_Cheng5;~Yang_Liu3", "aff": "Docta.ai;University of California, Santa Cruz;University of California, Santa Cruz;University of California, Santa Cruz", "aff_domain": "docta.ai;ucsc.edu;ucsc.edu;ucsc.edu", "position": "Researcher;PhD student;PhD student;Assistant Professor", "bibtex": "@inproceedings{\nzhu2024unmasking,\ntitle={Unmasking and Improving Data Credibility: A Study with Datasets for Training Harmless Language Models},\nauthor={Zhaowei Zhu and Jialu Wang and Hao Cheng and Yang Liu},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=6bcAD6g688}\n}", "github": "", "project": "", "reviewers": "rcNR;LDAu;RBmm;c2zo", "pdf_size": 417690, "rating": "5;6;6;6", "confidence": "3;3;3;3", "soundness": "3;3;3;3", "contribution": "2;3;3;3", "presentation": "1;3;3;3", "wc_summary": "69;133;99;54", "wc_strengths": "30;64;8;74", "wc_weaknesses": "166;144;71;298", "wc_questions": "35;24;90;28", "wc_review": "300;365;268;454", "wc_reply_reviewers": "0;27;0;47", "wc_reply_authors": "1149;633;446;1342", "reply_reviewers": "0;1;0;1", "reply_authors": "3;3;2;4", "rating_avg": [ 5.75, 0.4330127018922193 ], "confidence_avg": [ 3.0, 0.0 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 2.5, 0.8660254037844386 ], "wc_summary_avg": [ 88.75, 30.252066045148055 ], "wc_strengths_avg": [ 44.0, 26.419689627245813 ], "wc_weaknesses_avg": [ 169.75, 81.97065023531289 ], "wc_questions_avg": [ 44.25, 26.705570579937064 ], "wc_review_avg": [ 346.75, 71.1033578672625 ], "wc_reply_reviewers_avg": [ 18.5, 19.80530232033836 ], "wc_reply_authors_avg": [ 892.5, 365.56292208045386 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 3.0, 0.7071067811865476 ], "replies_avg": [ 21, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 20, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14596580015436199352&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=6bcAD6g688", "pdf": "https://openreview.net/pdf?id=6bcAD6g688", "email": "docta.ai;ucsc.edu;ucsc.edu;ucsc.edu", "author_num": 4, "aff_unique_index": "0;1;1;1", "aff_unique_norm": "Docta.ai;University of California, Santa Cruz", "aff_unique_dep": ";", "aff_unique_url": "https://docta.ai;https://www.ucsc.edu", "aff_unique_abbr": "Docta.ai;UCSC", "aff_campus_unique_index": "1;1;1", "aff_campus_unique": ";Santa Cruz", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "id": "6c4gv0E9sF", "title": "SpikeBERT: A Language Spikformer Learned from BERT with Knowledge Distillation", "track": "main", "status": 
"Withdraw", "tldr": "", "abstract": "Spiking neural networks (SNNs) offer a promising avenue to implement deep neural networks in a more energy-efficient way.\nHowever, the network architectures of existing SNNs for language tasks are still simplistic and relatively shallow, and deep architectures have not been fully explored, resulting in a significant performance gap compared to mainstream transformer-based networks such as BERT.\nTo this end, we improve a recently-proposed spiking Transformer (i.e., Spikformer) to make it possible to process language tasks and propose a two-stage knowledge distillation method for training it, which combines pre-training by distilling knowledge from BERT with a large collection of unlabelled texts and fine-tuning with task-specific instances via knowledge distillation again from the BERT fine-tuned on the same training examples.\nThrough extensive experimentation, we show that the models trained with our method, named SpikeBERT, outperform state-of-the-art SNNs and even achieve comparable results to BERTs on text classification tasks for both English and Chinese with much less energy consumption.", "keywords": "Spiking neural networks;Natural language processing;Knowledge distillation", "primary_area": "applications to neuroscience & cognitive science", "supplementary_material": "/attachment/c90775d34aead3652b58ce36b83217f4b378a525.zip", "author": "Changze Lv;Tianlong Li;Jianhan Xu;Chenxi Gu;Zixuan Ling;Cenyuan Zhang;Xiaoqing Zheng;Xuanjing Huang", "authorids": "~Changze_Lv1;~Tianlong_Li4;~Jianhan_Xu1;~Chenxi_Gu2;~Zixuan_Ling1;~Cenyuan_Zhang1;~Xiaoqing_Zheng2;~Xuanjing_Huang1", "gender": "M;M;M;;M;;;F", "homepage": "https://lvchangze.github.io;https://github.com/Tengyuantuohai-113;;;https://github.com/narcissusLZX;;;https://xuanjing-huang.github.io/", "dblp": "350/4445;;278/1558.html;;;293/9880;;05/6735-1", "google_scholar": "t3-viUwAAAAJ;https://scholar.google.com.hk/citations?hl=zh-CN;G_p-oocAAAAJ;;;ghu4BZcAAAAJ;;RGsMgZA4H78C", "orcid": ";;;;;;;0000-0001-9197-9426", "linkedin": ";;;;;;;", "or_profile": "~Changze_Lv1;~Tianlong_Li4;~Jianhan_Xu1;~Chenxi_Gu2;~Zixuan_Ling1;~Cenyuan_Zhang1;~Xiaoqing_Zheng2;~Xuanjing_Huang1", "aff": "Fudan University;Fudan University;Xiaohongshu;;Fudan University;Fudan University;;Fudan University", "aff_domain": "fudan.edu.cn;fudan.edu.cn;xiaohongshu.com;;fudan.edu.cn;fudan.edu.cn;;fudan.edu.cn", "position": "PhD student;MS student;Researcher;;MS student;MS student;;Full Professor", "bibtex": "@misc{\nanonymous2024spikebert,\ntitle={Spike{BERT}: A Language Spikformer Learned from {BERT} with Knowledge Distillation},\nauthor={Anonymous},\nyear={2024},\nurl={https://openreview.net/forum?id=6c4gv0E9sF}\n}", "github": "", "project": "", "reviewers": "sLn7;17Yy;is3e", "site": "https://openreview.net/forum?id=6c4gv0E9sF", "pdf_size": 916951, "rating": "3;8;8", "confidence": "4;5;4", "soundness": "2;3;3", "contribution": "1;3;4", "presentation": "2;3;3", "wc_summary": "43;66;117", "wc_strengths": "45;58;102", "wc_weaknesses": "475;50;67", "wc_questions": "438;32;84", "wc_review": "1001;206;370", "wc_reply_reviewers": "115;23;0", "wc_reply_authors": "3499;487;958", "reply_reviewers": "2;1;0", "reply_authors": "7;2;2", "rating_avg": [ 6.333333333333333, 2.357022603955158 ], "confidence_avg": [ 4.333333333333333, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 1.247219128924647 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], 
"wc_summary_avg": [ 75.33333333333333, 30.922843048824316 ], "wc_strengths_avg": [ 68.33333333333333, 24.390344173235622 ], "wc_weaknesses_avg": [ 197.33333333333334, 196.46260599807675 ], "wc_questions_avg": [ 184.66666666666666, 180.38723778459374 ], "wc_review_avg": [ 525.6666666666666, 342.7149771392484 ], "wc_reply_reviewers_avg": [ 46.0, 49.68567868779359 ], "wc_reply_authors_avg": [ 1648.0, 1322.903624607628 ], "reply_reviewers_avg": [ 1.0, 0.816496580927726 ], "reply_authors_avg": [ 3.6666666666666665, 2.3570226039551585 ], "replies_avg": [ 25, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": 0.5, "gs_citation": 4, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=9584516174752539551&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "aff_unique_index": "0;0;1;0;0;0", "aff_unique_norm": "Fudan University;Xiaohongshu", "aff_unique_dep": ";", "aff_unique_url": "https://www.fudan.edu.cn;https://www.xiaohongshu.com", "aff_unique_abbr": "Fudan;XHS", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "China" }, { "id": "6cDEcJsE1Y", "title": "Certainty In, Certainty Out: REVQCs for Quantum Machine Learning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "The field of Quantum Machine Learning (QML) has emerged recently in the hopes of finding new machine learning protocols or exponential speedups for classical ones. Apart from problems with vanishing gradients and efficient encoding methods, these speedups are hard to find because the sampling nature of quantum computers promotes either simulating computations classically or running them many times on quantum computers in order to use approximate expectation values in gradient calculations. In this paper, we make a case for setting high single-sample accuracy as a primary goal. We discuss the statistical theory which enables highly accurate and precise sample inference, and propose a method of reversed training towards this end. 
We show the effectiveness of this training method by assessing several effective variational quantum circuits (VQCs), trained in both the standard and reversed directions, on random binary subsets of the MNIST and MNIST Fashion datasets, on which our method provides an increase of $10-15\\\\%$ in single-sample inference accuracy.", "keywords": "Quantum machine learning;variational quantum circuits;receptive field;alleatoric uncertainty;epistemic uncertainty", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Hannah D Helgesen;Michael Felsberg;Jan-\u00c5ke Larsson", "authorids": "~Hannah_D_Helgesen1;~Michael_Felsberg2;~Jan-\u00c5ke_Larsson1", "gender": "M;;M", "homepage": "https://liu.se/medarbetare/hanhe49;https://liu.se/en/employee/micfe03;https://liu.se/en/employee/janla64", "dblp": ";00/78;95/10166", "google_scholar": ";https://scholar.google.se/citations?hl=en;https://scholar.google.se/citations?user=lVhwET4AAAAJ", "orcid": ";0000-0002-6096-3648;0000-0002-1082-8325", "linkedin": "hannah-helgesen;https://linkedin.com/in/michael-felsberg-668a202;", "or_profile": "~Hannah_D_Helgesen1;~Michael_Felsberg2;~Jan-\u00c5ke_Larsson1", "aff": "Link\u00f6ping University;Link\u00f6ping University;Link\u00f6ping University", "aff_domain": "liu.se;liu.se;liu.se", "position": "PhD student;Full Professor;Full Professor", "bibtex": "@misc{\nhelgesen2024certainty,\ntitle={Certainty In, Certainty Out: {REVQC}s for Quantum Machine Learning},\nauthor={Hannah D Helgesen and Michael Felsberg and Jan-{\\r{A}}ke Larsson},\nyear={2024},\nurl={https://openreview.net/forum?id=6cDEcJsE1Y}\n}", "github": "", "project": "", "reviewers": "eDnW;Udj4;2wYu", "site": "https://openreview.net/forum?id=6cDEcJsE1Y", "pdf_size": 1110376, "rating": "3;3;3", "confidence": "5;4;5", "soundness": "1;1;2", "contribution": "2;1;2", "presentation": "1;2;3", "wc_summary": "50;77;35", "wc_strengths": "32;23;29", "wc_weaknesses": "208;260;353", "wc_questions": "63;18;34", "wc_review": "353;378;451", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 3.0, 0.0 ], "confidence_avg": [ 4.666666666666667, 0.4714045207910317 ], "soundness_avg": [ 1.3333333333333333, 0.4714045207910317 ], "contribution_avg": [ 1.6666666666666667, 0.4714045207910317 ], "presentation_avg": [ 2.0, 0.816496580927726 ], "wc_summary_avg": [ 54.0, 17.378147196982766 ], "wc_strengths_avg": [ 28.0, 3.7416573867739413 ], "wc_weaknesses_avg": [ 273.6666666666667, 59.979626170521904 ], "wc_questions_avg": [ 38.333333333333336, 18.624953392931992 ], "wc_review_avg": [ 394.0, 41.57723736212721 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:PbhUiwKDKskJ:scholar.google.com/&scioq=Certainty+In,+Certainty+Out:+REVQCs+for+Quantum+Machine+Learning&hl=en&as_sdt=0,5", "gs_version_total": 4, "aff_unique_index": "0;0;0", "aff_unique_norm": "Link\u00f6ping University", "aff_unique_dep": "", "aff_unique_url": "https://www.liu.se", "aff_unique_abbr": "LiU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "Sweden" }, { "title": "Local Search GFlowNets", "status": "Spotlight", "track": "main", "site": 
"https://iclr.cc/virtual/2024/poster/19387", "id": "6cFcw1Rxww", "author_site": "Minsu Kim, Yun Taeyoung, Emmanuel Bengio, Dinghuai Zhang, Yoshua Bengio, Sungsoo Ahn, Jinkyoo Park", "tldr": "", "abstract": "Generative Flow Networks (GFlowNets) are amortized sampling methods that learn a distribution over discrete objects proportional to their rewards. GFlowNets exhibit a remarkable ability to generate diverse samples, yet occasionally struggle to consistently produce samples with high rewards due to over-exploration on wide sample space. \nThis paper proposes to train GFlowNets with local search, which focuses on exploiting high-rewarded sample space to resolve this issue. Our main idea is to explore the local neighborhood via backtracking and reconstruction guided by backward and forward policies, respectively. This allows biasing the samples toward high-reward solutions, which is not possible for a typical GFlowNet solution generation scheme, which uses the forward policy to generate the solution from scratch. Extensive experiments demonstrate a remarkable performance improvement in several biochemical tasks. Source code is available: \\url{https://github.com/dbsxodud-11/ls_gfn}.", "keywords": "GFlowNet;molecule optimization;biological sequence design;local search;reinforcement learning", "primary_area": "generative models", "supplementary_material": "", "author": "Minsu Kim;Taeyoung Yun;Emmanuel Bengio;Dinghuai Zhang;Yoshua Bengio;Sungsoo Ahn;Jinkyoo Park", "authorids": "~Minsu_Kim2;~Taeyoung_Yun1;~Emmanuel_Bengio1;~Dinghuai_Zhang1;~Yoshua_Bengio1;~Sungsoo_Ahn1;~Jinkyoo_Park1", "gender": "M;M;M;;M;M;M", "homepage": "https://minsuukim.github.io/;https://dbsxodud-11.github.io;http://folinoid.com;;http://yoshuabengio.org;https://sungsooahn.super.site/;http://silab.kaist.ac.kr/", "dblp": ";358/5797.html;137/8040;;56/953;90/5164;156/7535", "google_scholar": "https://scholar.google.ca/citations?user=VvyLuhAAAAAJ;_51PhLQAAAAJ;https://scholar.google.ca/citations?user=yVtSOt8AAAAJ;;kukA0LcAAAAJ;XTenHs0AAAAJ;sH2a0nkAAAAJ", "orcid": ";0009-0001-4602-6367;;;;;0000-0003-2620-1479", "linkedin": ";;;;yoshuabengio/?originalSubdomain=ca;;", "or_profile": "~Minsu_Kim2;~Taeyoung_Yun1;~Emmanuel_Bengio1;~Dinghuai_Zhang1;~Yoshua_Bengio1;~Sungsoo_Ahn1;~Jinkyoo_Park1", "aff": "Korea Advanced Institute of Science & Technology;Korea Advanced Institute of Science & Technology;Valence Labs powered by recursion;;University of Montreal;Pohang University of Science and Technology;Korea Advanced Institute of Science & Technology", "aff_domain": "kaist.ac.kr;kaist.ac.kr;valencelabs.com;;umontreal.ca;postech.ac.kr;kaist.ac.kr", "position": "PhD student;MS student;Researcher;;Full Professor;Assistant Professor;Associate Professor", "bibtex": "@inproceedings{\nkim2024local,\ntitle={Local Search {GF}lowNets},\nauthor={Minsu Kim and Taeyoung Yun and Emmanuel Bengio and Dinghuai Zhang and Yoshua Bengio and Sungsoo Ahn and Jinkyoo Park},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=6cFcw1Rxww}\n}", "github": "", "project": "", "reviewers": "xEGb;wUkH;4fxw", "pdf_size": 3084550, "rating": "6;6;8", "confidence": "4;3;2", "soundness": "3;3;3", "contribution": "2;3;3", "presentation": "3;4;3", "wc_summary": "46;99;75", "wc_strengths": "36;90;26", "wc_weaknesses": "42;201;8", "wc_questions": "61;151;22", "wc_review": "185;541;131", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "570;1708;360", "reply_reviewers": "0;0;0", "reply_authors": 
"3;5;3", "rating_avg": [ 6.666666666666667, 0.9428090415820634 ], "confidence_avg": [ 3.0, 0.816496580927726 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 3.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 73.33333333333333, 21.66923061752668 ], "wc_strengths_avg": [ 50.666666666666664, 28.110891523077356 ], "wc_weaknesses_avg": [ 83.66666666666667, 84.12028424953296 ], "wc_questions_avg": [ 78.0, 54.01851534427802 ], "wc_review_avg": [ 285.6666666666667, 181.88885495146633 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 879.3333333333334, 592.194412521954 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 3.6666666666666665, 0.9428090415820634 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.8660254037844385, "gs_citation": 34, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=307485571580394019&as_sdt=5,48&sciodt=0,48&hl=en", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=6cFcw1Rxww", "pdf": "https://openreview.net/pdf?id=6cFcw1Rxww", "email": "kaist.ac.kr;kaist.ac.kr;valencelabs.com;;umontreal.ca;postech.ac.kr;kaist.ac.kr", "author_num": 7, "aff_unique_index": "0;0;1;2;3;0", "aff_unique_norm": "Korea Advanced Institute of Science and Technology;Valence Labs;University of Montreal;Pohang University of Science and Technology", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.kaist.ac.kr;;https://wwwumontreal.ca;https://www.postech.ac.kr", "aff_unique_abbr": "KAIST;;UM;POSTECH", "aff_campus_unique_index": "1", "aff_campus_unique": ";Pohang", "aff_country_unique_index": "0;0;2;0;0", "aff_country_unique": "South Korea;;Canada" }, { "id": "6cGiRiExUd", "title": "Efficient Point Cloud Matching for 3D Geometric Shape Assembly", "track": "main", "status": "Reject", "tldr": "", "abstract": "Learning to assemble geometric shapes into a larger target structure is a fundamental task with various high-level visual applications. In this work, we frame this problem as geometric registration with extremely low overlap. Our goal is to establish accurate correspondences on the mating surface of the shape fragments to predict their relative rigid transformations for assembly. To this end, we introduce Proxy Match Transform (PMT), an approximate high-order feature transform layer that enables reliable correspondences between dense point clouds of shape fragments, while incurring low costs in memory and compute. 
In our experiments, we demonstrate that Proxy Match Transform surpasses existing state-of-the-art baselines on a popular geometric shape assembly dataset, while exhibiting higher efficiency than other high-order feature transform methods.", "keywords": "Geometric shape assembly;High-dimensional feature transform;Correlation aggregation;Proxy Match Transform", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Nahyuk Lee;Juhong Min;Junha Lee;Seungwook Kim;Kanghee Lee;Jaesik Park;Minsu Cho", "authorids": "~Nahyuk_Lee1;~Juhong_Min1;~Junha_Lee2;~Seungwook_Kim2;~Kanghee_Lee1;~Jaesik_Park3;~Minsu_Cho1", "gender": "M;;M;;;M;M", "homepage": "https://nahyuklee.github.io/;;https://junha-l.github.io;;;http://jaesik.info;http://cvlab.postech.ac.kr/~mcho/", "dblp": "383/1188;;53/11266;;;00/10336;", "google_scholar": "QQamvI0AAAAJ;;RB7qMm4AAAAJ;;;_3q6KBIAAAAJ;5TyoF5QAAAAJ", "orcid": ";;;;;;", "linkedin": "nahyuk-lee/;;https://linkedin.com/in/junha-l/;;;;minsu-cho-062b3750/", "or_profile": "~Nahyuk_Lee1;~Juhong_Min1;~Junha_Lee2;~Seungwook_Kim2;~Kanghee_Lee1;~Jaesik_Park3;~Minsu_Cho1", "aff": "Pohang University of Science and Technology;;Pohang University of Science and Technology;;;Seoul National University;POSTECH", "aff_domain": "postech.ac.kr;;postech.ac.kr;;;snu.ac.kr;postech.ac.kr", "position": "MS student;;PhD student;;;Assistant Professor;Associate Professor", "bibtex": "@misc{\nlee2024efficient,\ntitle={Efficient Point Cloud Matching for 3D Geometric Shape Assembly},\nauthor={Nahyuk Lee and Juhong Min and Junha Lee and Seungwook Kim and Kanghee Lee and Jaesik Park and Minsu Cho},\nyear={2024},\nurl={https://openreview.net/forum?id=6cGiRiExUd}\n}", "github": "", "project": "", "reviewers": "jjsW;jVVT;NyfY;oLtM", "site": "https://openreview.net/forum?id=6cGiRiExUd", "pdf_size": 13768238, "rating": "5;5;5;8", "confidence": "4;4;2;2", "soundness": "3;3;3;3", "contribution": "2;3;3;4", "presentation": "1;2;3;3", "wc_summary": "49;97;53;80", "wc_strengths": "108;50;28;63", "wc_weaknesses": "271;145;55;3", "wc_questions": "48;107;3;42", "wc_review": "476;399;139;188", "wc_reply_reviewers": "151;94;0;242", "wc_reply_authors": "2751;1908;423;927", "reply_reviewers": "1;1;0;1", "reply_authors": "7;5;2;4", "rating_avg": [ 5.75, 1.299038105676658 ], "confidence_avg": [ 3.0, 1.0 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 3.0, 0.7071067811865476 ], "presentation_avg": [ 2.25, 0.82915619758885 ], "wc_summary_avg": [ 69.75, 19.74050404624968 ], "wc_strengths_avg": [ 62.25, 29.22648627529488 ], "wc_weaknesses_avg": [ 118.5, 101.65013526798673 ], "wc_questions_avg": [ 50.0, 37.1685350800916 ], "wc_review_avg": [ 300.5, 140.74888987128816 ], "wc_reply_reviewers_avg": [ 121.75, 87.90442252810719 ], "wc_reply_authors_avg": [ 1502.25, 897.1765085533615 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 4.5, 1.8027756377319946 ], "replies_avg": [ 30, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:IubrjESbtLQJ:scholar.google.com/&scioq=Efficient+Point+Cloud+Matching+for+3D+Geometric+Shape+Assembly&hl=en&as_sdt=0,23", "gs_version_total": 0, "aff_unique_index": "0;0;1;0", "aff_unique_norm": "Pohang University of Science and Technology;Seoul National University", "aff_unique_dep": ";", "aff_unique_url": "https://www.postech.ac.kr;https://www.snu.ac.kr", "aff_unique_abbr": 
"POSTECH;SNU", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Pohang;", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "South Korea" }, { "id": "6cMmSnOpCs", "title": "ScaLearn: Simple and Highly Parameter-Efficient Task Transfer by Learning to Scale", "track": "main", "status": "Reject", "tldr": "", "abstract": "Multi-task learning (MTL) has shown considerable practical benefits, particularly when using pre-trained language models (PLMs). While this is commonly achieved by simultaneously learning n tasks under a joint optimization procedure, recent methods such as AdapterFusion structure the problem into two distinct stages: (i) task learning, where knowledge specific to a task is encapsulated within sets of parameters (e.g., adapters), and (ii) transfer, where this already learned knowledge is leveraged for a target task. This separation of concerns provides numerous benefits, such as promoting reusability, and addressing cases involving data privacy and societal concerns; on the flip side, current two-stage MTL methods come with the cost of introducing a substantial number of additional parameters. In this work, we address this issue by leveraging the usefulness of linearly scaling the output representations of source adapters for transfer learning. We introduce ScaLearn, a simple and highly parameter-efficient two-stage MTL method that capitalizes on the knowledge of the source tasks by learning a minimal set of scaling parameters that enable effective knowledge transfer to a target task. Our experiments on three benchmarks (GLUE, SuperGLUE, and HumSet) show that our ScaLearn, in addition to facilitating the benefits of two-stage MTL, consistently outperforms strong baselines with only a small number of transfer parameters \u2013 roughly 0.35% of those of AdapterFusion. Remarkably, we observe that ScaLearn maintains its strong abilities even when further reducing parameters through uniform scaling and layer-sharing, achieving similarly competitive results with only 8 transfer parameters for each target task. 
Our proposed approach thus demonstrates the power of simple scaling as a promise for more efficient task transfer.", "keywords": "natural language processing;multi-task learning;transfer learning;adapters;efficient learning;peft methods", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "", "author": "Markus Frohmann;Carolin Holtermann;Shahed Masoudian;Anne Lauscher;Navid Rekabsaz", "authorids": "~Markus_Frohmann1;~Carolin_Holtermann1;~Shahed_Masoudian1;~Anne_Lauscher1;~Navid_Rekabsaz2", "gender": "M;F;M;;M", "homepage": ";https://www.carolin-holtermann.de/;https://github.com/ShawMask;;https://navid-rekabsaz.github.io", "dblp": "358/4606;318/1237;;209/6857;150/5089", "google_scholar": "8PxZyK8AAAAJ;x1vg4BgAAAAJ;hyWDk2wAAAAJ;https://scholar.google.it/citations?user=IbJS3UEAAAAJ;lZjyLyEAAAAJ", "orcid": ";0000-0003-0449-1348;0009-0007-2747-0386;;0000-0001-5764-8738", "linkedin": "markus-frohmann/;carolin-holtermann;shahed-masoudian;;", "or_profile": "~Markus_Frohmann1;~Carolin_Holtermann1;~Shahed_Masoudian1;~Anne_Lauscher1;~Navid_Rekabsaz2", "aff": "Deezer;Universit\u00e4t Hamburg;Johannes Kepler Universit\u00e4t Linz;Universit\u00e4t Hamburg;Thomson Reuters", "aff_domain": "research.deezer.com;uni-hamburg.de;jku.at;uni-hamburg.de;thomsonreuters.com", "position": "Intern;PhD student;PhD student;Associate Professor;Lead AI Scientist", "bibtex": "@misc{\nfrohmann2024scalearn,\ntitle={ScaLearn: Simple and Highly Parameter-Efficient Task Transfer by Learning to Scale},\nauthor={Markus Frohmann and Carolin Holtermann and Shahed Masoudian and Anne Lauscher and Navid Rekabsaz},\nyear={2024},\nurl={https://openreview.net/forum?id=6cMmSnOpCs}\n}", "github": "", "project": "", "reviewers": "6MN5;YAiw;tpyz;Exzr", "site": "https://openreview.net/forum?id=6cMmSnOpCs", "pdf_size": 1061918, "rating": "5;5;5;8", "confidence": "4;4;3;4", "soundness": "3;2;2;4", "contribution": "2;2;2;2", "presentation": "3;2;3;3", "wc_summary": "65;111;91;53", "wc_strengths": "43;53;156;74", "wc_weaknesses": "97;55;203;107", "wc_questions": "35;450;8;139", "wc_review": "240;669;458;373", "wc_reply_reviewers": "0;29;62;0", "wc_reply_authors": "727;1562;1594;370", "reply_reviewers": "0;1;1;0", "reply_authors": "2;3;3;1", "rating_avg": [ 5.75, 1.299038105676658 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.82915619758885 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 80.0, 22.561028345356956 ], "wc_strengths_avg": [ 81.5, 44.44378471732578 ], "wc_weaknesses_avg": [ 115.5, 54.1548705104167 ], "wc_questions_avg": [ 158.0, 175.5377452287684 ], "wc_review_avg": [ 435.0, 155.8476820488518 ], "wc_reply_reviewers_avg": [ 22.75, 25.567313116555678 ], "wc_reply_authors_avg": [ 1063.25, 530.1195030368153 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 2.25, 0.82915619758885 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.3333333333333333, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=9368531401909249420&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "aff_unique_index": "0;1;2;1;3", "aff_unique_norm": "Deezer;University of Hamburg;Johannes Kepler University Linz;Thomson Reuters", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.deezer.com;https://www.uni-hamburg.de;https://www.jku.at;https://www.thomsonreuters.com", "aff_unique_abbr": "Deezer;UHH;JKU;TR", "aff_campus_unique_index": "1", 
"aff_campus_unique": ";Linz", "aff_country_unique_index": "0;1;2;1;3", "aff_country_unique": "France;Germany;Austria;United States" }, { "id": "6cV6q8RIw2", "title": "Homotopy Relaxation Training Algorithms for Infinite-Width Two-Layer ReLU Neural Networks", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "In this paper, we present a novel training approach called the Homotopy Relaxation Training Algorithm (HRTA), aimed at accelerating the training process in contrast to traditional methods. Our algorithm incorporates two key mechanisms: one involves building a homotopy activation function that seamlessly connects the linear activation function with the ReLU activation function; the other technique entails relaxing the homotopy parameter to enhance the training refinement process. We have conducted an in-depth analysis of this novel method within the context of the neural tangent kernel (NTK), revealing significantly improved convergence rates. Our experimental results, especially when considering networks with larger widths, validate the theoretical conclusions. This proposed homotopy algorithm exhibits the potential for other activation functions and deep neural networks.", "keywords": "homotopy;relaxation;ReLU Neural Networks;infinite-width limit", "primary_area": "optimization", "supplementary_material": "/attachment/7ce8ee9f34896c221d0a3c907d0206cf8fbb1d0c.pdf", "author": "Yahong Yang;Qipin Chen;Wenrui Hao", "authorids": "~Yahong_Yang1;~Qipin_Chen1;~Wenrui_Hao1", "gender": "M;M;", "homepage": ";;https://sites.psu.edu/whao/", "dblp": ";255/5039;", "google_scholar": ";hRZ99NUAAAAJ;7x6CVcAAAAAJ", "orcid": "0000-0002-9721-2362;;", "linkedin": ";qipin-chen-395a97159/;", "or_profile": "~Yahong_Yang1;~Qipin_Chen1;~Wenrui_Hao1", "aff": "Pennsylvania State University;;Pennsylvania State University", "aff_domain": "psu.edu;;psu.edu", "position": "Postdoc;;Associate Professor", "bibtex": "@misc{\nyang2024homotopy,\ntitle={Homotopy Relaxation Training Algorithms for Infinite-Width Two-Layer Re{LU} Neural Networks},\nauthor={Yahong Yang and Qipin Chen and Wenrui Hao},\nyear={2024},\nurl={https://openreview.net/forum?id=6cV6q8RIw2}\n}", "github": "", "project": "", "reviewers": "wUUw;4y1a;kAtf", "site": "https://openreview.net/forum?id=6cV6q8RIw2", "pdf_size": 716844, "rating": "3;3;3", "confidence": "3;4;3", "soundness": "2;2;2", "contribution": "1;2;2", "presentation": "1;3;2", "wc_summary": "54;38;57", "wc_strengths": "22;7;45", "wc_weaknesses": "58;142;147", "wc_questions": "280;3;69", "wc_review": "414;190;318", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 3.0, 0.0 ], "confidence_avg": [ 3.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 1.6666666666666667, 0.4714045207910317 ], "presentation_avg": [ 2.0, 0.816496580927726 ], "wc_summary_avg": [ 49.666666666666664, 8.339997335464536 ], "wc_strengths_avg": [ 24.666666666666668, 15.627610892974724 ], "wc_weaknesses_avg": [ 115.66666666666667, 40.827550610940264 ], "wc_questions_avg": [ 117.33333333333333, 118.13645594067152 ], "wc_review_avg": [ 307.3333333333333, 91.75813618178802 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 5, "gs_cited_by_link": 
"https://scholar.google.com/scholar?cites=18198803661618719588&as_sdt=805&sciodt=0,3&hl=en", "gs_version_total": 5, "aff_unique_index": "0;0", "aff_unique_norm": "Pennsylvania State University", "aff_unique_dep": "", "aff_unique_url": "https://www.psu.edu", "aff_unique_abbr": "PSU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "id": "6fFd8QaPVx", "title": "OneBNet: Binarized Neural Networks using Decomposed 1-D Binarized Convolutions on Edge Device", "track": "main", "status": "Reject", "tldr": "", "abstract": "Nowadays, it is natural to use 2-D convolutions in convolutional neural networks (CNNs) for computer vision, but this paper shows that 1-D binarized convolutions can achieve excellent performance on CPU-based edge devices. This paper proposes a new structure called OneBNet to maximize the effects of 1-D binarized convolutions. The proposed 1-D downsampling can perform information compression gradually through two 1-D convolutions,\nwhich can contribute tremendously to the performance improvement in binarized convolutional neural networks (BCNNs). Compared with 2-D binarized convolutions, a $n \\times n$ 2-D binarized convolution is replaced by $n \\times 1$ row-wise and $1 \\times n$ column-wise 1-D binarized convolutions, thus doubling the effects of adjusting the activation distribution and non-linear activation function. In the decomposed 1-D binarized convolution, although computational costs are reduced, the number of element-wise activation functions and learnable bias layers can be doubled, which can be a significant burden. Therefore, we expect that the 1-D binarized convolution is not suitable for all layers, and we present the reason and experimental results proving it. Based on the above assumption and experimental results, we can provide more optimized structure in terms of performance and costs. With ResNet as a backbone, we evaluate the proposed model on several conventional image datasets. In experiments, the proposed model based on ResNet18 achieves 93.4\\% and 93.6\\% Top-1 accuracy on the FashionMNIST and CIFAR10 datasets. In the case of training from scratch, the proposed OneBNet based on ResNet18 can produce 63.9\\% Top-1 accuracy, showing better performance over the state-of-the-art (SOTA) binarized CNNs based on ResNet18. When applying the teacher-student training, 68.4\\% Top-1 accuracy can be obtained, which overwhelms the existing SOTA BCNNs. 
With 5\\% additional delay on a single thread of Raspberry Pi, the proposed lightweight model achieves 67.3\\% Top-1 accuracy on the ImageNet dataset, outperforming the baseline by 1.8\\%.", "keywords": "Binarized Neural Networks;Computer Vision;Inference;1-D convolution", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/1a51fbffff47a488a9a0a870b4f9c61e58c2a9b2.zip", "author": "YOUNGWOOK KWON;Minkee Chang;Daeryong Shin;WANSOO KIM;HyunJin Kim", "authorids": "~YOUNGWOOK_KWON2;~Minkee_Chang1;~Daeryong_Shin1;~WANSOO_KIM2;~HyunJin_Kim1", "gender": "M;M;M;M;M", "homepage": "https://www.empaslab.com/;https://www.empaslab.com/home;;https://www.dankook.ac.kr/web/kor;https://www.empaslab.com", "dblp": ";;;;97/8639-1", "google_scholar": ";;;;https://scholar.google.co.kr/citations?hl=ko", "orcid": ";;0009-0002-0027-9059;;0000-0001-5017-3995", "linkedin": ";;;;", "or_profile": "~YOUNGWOOK_KWON2;~Minkee_Chang1;~Daeryong_Shin1;~WANSOO_KIM2;~HyunJin_Kim1", "aff": "Dankook University;Dankook University;Dankook University;Dankook University;Dankook University", "aff_domain": "dankook.ac.kr;dankook.ac.kr;dankook.ac.kr;dankook.ac.kr;dankook.ac.kr", "position": "MS student;Undergrad student;Undergrad student;Undergrad student;Full Professor", "bibtex": "@misc{\nkwon2024onebnet,\ntitle={One{BN}et: Binarized Neural Networks using Decomposed 1-D Binarized Convolutions on Edge Device},\nauthor={YOUNGWOOK KWON and Minkee Chang and Daeryong Shin and WANSOO KIM and HyunJin Kim},\nyear={2024},\nurl={https://openreview.net/forum?id=6fFd8QaPVx}\n}", "github": "", "project": "", "reviewers": "HiaQ;w6Pw;38Cc;6xWT", "site": "https://openreview.net/forum?id=6fFd8QaPVx", "pdf_size": 4980376, "rating": "3;3;3;5", "confidence": "4;4;3;4", "soundness": "2;1;2;3", "contribution": "2;1;2;3", "presentation": "2;3;1;3", "wc_summary": "93;54;38;53", "wc_strengths": "51;45;25;50", "wc_weaknesses": "114;289;28;85", "wc_questions": "3;36;154;4", "wc_review": "261;424;245;192", "wc_reply_reviewers": "86;197;0;29", "wc_reply_authors": "468;1074;758;554", "reply_reviewers": "1;1;0;1", "reply_authors": "2;2;1;1", "rating_avg": [ 3.5, 0.8660254037844386 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.0, 0.7071067811865476 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 2.25, 0.82915619758885 ], "wc_summary_avg": [ 59.5, 20.35313243704762 ], "wc_strengths_avg": [ 42.75, 10.497023387608508 ], "wc_weaknesses_avg": [ 129.0, 97.4191972867771 ], "wc_questions_avg": [ 49.25, 61.91677882448343 ], "wc_review_avg": [ 280.5, 86.69630903331468 ], "wc_reply_reviewers_avg": [ 78.0, 75.3491871223572 ], "wc_reply_authors_avg": [ 713.5, 233.265406779488 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.3333333333333333, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:QDzLibUQzQYJ:scholar.google.com/&scioq=OneBNet:+Binarized+Neural+Networks+using+Decomposed+1-D+Binarized+Convolutions+on+Edge+Device&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;0;0;0", "aff_unique_norm": "Dankook University", "aff_unique_dep": "", "aff_unique_url": "https://www.dankook.ac.kr", "aff_unique_abbr": "Dankook", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "South Korea" }, { "id": "6hP9JcXpNk", 
"title": "Going beyond familiar features for deep anomaly detection", "track": "main", "status": "Reject", "tldr": "", "abstract": "Anomaly Detection (AD) is a critical task that involves identifying observations that do not conform to a learned model of normality.\nPrior work in deep AD is predominantly based on a familiarity hypothesis, where familiar features serve as the reference in a pre-trained embedding space. While this strategy has proven highly successful, it turns out that it causes consistent false negatives when anomalies consist of truly novel features that are not well captured by the pre-trained encoding. We propose a novel approach to AD using explainability to capture novel features as unexplained observations in the input space. We achieve strong performance across a wide range of anomaly benchmarks by combining similarity and novelty in a hybrid approach. Our approach establishes a new state-of-the-art across multiple benchmarks, handling diverse anomaly types while eliminating the need for expensive background models and dense matching. In particular, we show that by taking account of novel features, we reduce false negative anomalies by up to 40% on challenging benchmarks compared to the state-of-the-art. Our method give visually inspectable explanations for pixel level anomalies.", "keywords": "Anomaly detection;familiarity hypothesis", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/a00ef70ddbb24d13ef6384bff21f203c94384ebe.pdf", "author": "Sarath Sivaprasad;Mario Fritz", "authorids": "~Sarath_Sivaprasad2;~Mario_Fritz1", "gender": "M;M", "homepage": ";https://cispa.saarland/group/fritz/", "dblp": ";", "google_scholar": "37HTgYcAAAAJ;https://scholar.google.de/citations?user=4V1nNm4AAAAJ", "orcid": ";", "linkedin": "sarathsivaprasad1729/;", "or_profile": "~Sarath_Sivaprasad2;~Mario_Fritz1", "aff": "cispa;Saarland University", "aff_domain": "cispa.de;uni-saarland.de", "position": "PhD student;Full Professor", "bibtex": "@misc{\nsivaprasad2024going,\ntitle={Going beyond familiar features for deep anomaly detection},\nauthor={Sarath Sivaprasad and Mario Fritz},\nyear={2024},\nurl={https://openreview.net/forum?id=6hP9JcXpNk}\n}", "github": "", "project": "", "reviewers": "oe8U;vwNp;Qn1L", "site": "https://openreview.net/forum?id=6hP9JcXpNk", "pdf_size": 5543769, "rating": "3;3;5", "confidence": "3;4;4", "soundness": "3;2;3", "contribution": "3;2;2", "presentation": "2;1;2", "wc_summary": "32;32;139", "wc_strengths": "48;16;32", "wc_weaknesses": "235;153;180", "wc_questions": "102;169;2", "wc_review": "417;370;353", "wc_reply_reviewers": "0;0;92", "wc_reply_authors": "726;745;388", "reply_reviewers": "0;0;1", "reply_authors": "1;1;1", "rating_avg": [ 3.6666666666666665, 0.9428090415820634 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 1.6666666666666667, 0.4714045207910317 ], "wc_summary_avg": [ 67.66666666666667, 50.44028372464039 ], "wc_strengths_avg": [ 32.0, 13.063945294843617 ], "wc_weaknesses_avg": [ 189.33333333333334, 34.120700787384514 ], "wc_questions_avg": [ 91.0, 68.61972505531239 ], "wc_review_avg": [ 380.0, 27.067816067549053 ], "wc_reply_reviewers_avg": [ 30.666666666666668, 43.36921591277491 ], "wc_reply_authors_avg": [ 619.6666666666666, 163.996612431138 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], 
"reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 10, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.5, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=4223184860631744350&as_sdt=5,47&sciodt=0,47&hl=en", "gs_version_total": 5, "aff_unique_index": "0;1", "aff_unique_norm": "CISPA Helmholtz Center for Information Security;Saarland University", "aff_unique_dep": ";", "aff_unique_url": "https://www.cispa.de/;https://www.uni-saarland.de", "aff_unique_abbr": "CISPA;UdS", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "Germany" }, { "title": "Learning to solve Class-Constrained Bin Packing Problems via Encoder-Decoder Model", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19386", "id": "6hvtSLkKeZ", "author_site": "Hanni Cheng, Ya Cong, Weihao Jiang, Shiliang Pu", "tldr": "", "abstract": "Neural methods have shown significant merit in solving combinatorial optimization (CO) problems, including the Bin Packing Problem (BPP). However, most existing ML-based approaches focus on geometric BPP like 3DBPP, neglecting complex vector BPP. In this study, we introduce a vector BPP variant called Class-Constrained Bin Packing Problem (CCBPP), dealing with items of both classes and sizes, and the objective is to pack the items in the least amount of bins respecting the bin capacity and the number of different classes that it can hold. To enhance the efficiency and practicality of solving CCBPP, we propose a learning-based Encoder-Decoder Model. The Encoder employs a Graph Convolution Network (GCN) to generate a heat-map, representing probabilities of different items packing together. The Decoder decodes and fine-tunes the solution through Cluster Decode and Active Search methods, thereby producing high-quality solutions for CCBPP instances. Extensive experiments demonstrate that our proposed method consistently yields high-quality solutions for various kinds of CCBPP with a very small gap from the optimal. 
Moreover, our Encoder-Decoder Model also shows promising performance on one practical application of CCBPP, the *Manufacturing Order Consolidation Problem* (OCP).", "keywords": "Combinatorial Optimization;Class-Contrained Bin Packing Problems;Graph Convolution Network;Cluster Decode", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/3599f9da74963d1b16c12cd25b5c59756ac78166.zip", "author": "Hanni Cheng;Ya Cong;Weihao Jiang;Shiliang Pu", "authorids": "~Hanni_Cheng1;~Ya_Cong1;~Weihao_Jiang2;~Shiliang_Pu1", "gender": "F;M;M;M", "homepage": ";;https://orcid.org/0000-0003-3482-8538;", "dblp": "189/5971;;262/6776.html;155/3173", "google_scholar": ";;;https://scholar.google.com.hk/citations?user=NWR_wpoAAAAJ", "orcid": "0009-0004-5319-7254;0000-0003-2432-5996;0000-0003-3482-8538;", "linkedin": ";;;", "or_profile": "~Hanni_Cheng1;~Ya_Cong1;~Weihao_Jiang2;~Shiliang_Pu1", "aff": "Hikvision Research Institute;Hikvision Research Institute;Hikvision Research Institute;", "aff_domain": "hikvision.com;hikvision.com;hikvision.com;", "position": "Researcher;Researcher;Researcher;", "bibtex": "@inproceedings{\ncheng2024learning,\ntitle={Learning to solve Class-Constrained Bin Packing Problems via Encoder-Decoder Model},\nauthor={Hanni Cheng and Ya Cong and Weihao Jiang and Shiliang Pu},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=6hvtSLkKeZ}\n}", "github": "", "project": "", "reviewers": "hLWM;Rj4P;HxmL;aXcu;2rkj", "pdf_size": 604652, "rating": "6;6;6;6;8", "confidence": "4;4;4;4;5", "soundness": "2;3;2;4;3", "contribution": "2;3;2;3;3", "presentation": "2;3;3;3;3", "wc_summary": "60;51;53;106;51", "wc_strengths": "34;63;32;187;28", "wc_weaknesses": "71;63;300;110;1", "wc_questions": "108;11;33;128;35", "wc_review": "273;188;418;531;115", "wc_reply_reviewers": "0;62;22;0;0", "wc_reply_authors": "1524;887;1716;958;268", "reply_reviewers": "0;1;1;0;0", "reply_authors": "3;3;4;3;1", "rating_avg": [ 6.4, 0.7999999999999999 ], "confidence_avg": [ 4.2, 0.39999999999999997 ], "soundness_avg": [ 2.8, 0.7483314773547882 ], "contribution_avg": [ 2.6, 0.4898979485566356 ], "presentation_avg": [ 2.8, 0.39999999999999997 ], "wc_summary_avg": [ 64.2, 21.160340261914506 ], "wc_strengths_avg": [ 68.8, 60.39006540814474 ], "wc_weaknesses_avg": [ 109.0, 101.69169090933634 ], "wc_questions_avg": [ 63.0, 46.12591462507817 ], "wc_review_avg": [ 305.0, 151.43183284897532 ], "wc_reply_reviewers_avg": [ 16.8, 24.152846623120844 ], "wc_reply_authors_avg": [ 1070.6, 512.3801713571672 ], "reply_reviewers_avg": [ 0.4, 0.48989794855663565 ], "reply_authors_avg": [ 2.8, 0.9797958971132712 ], "replies_avg": [ 25, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 1.0, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=9033160795790333827&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 0, "openreview": "https://openreview.net/forum?id=6hvtSLkKeZ", "pdf": "https://openreview.net/pdf?id=6hvtSLkKeZ", "email": "hikvision.com;hikvision.com;hikvision.com;", "author_num": 4, "aff_unique_index": "0;0;0", "aff_unique_norm": "Hikvision Research Institute", "aff_unique_dep": "", "aff_unique_url": "https://www.hikvision.com/cn/", "aff_unique_abbr": "Hikvision", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "China" }, { "id": "6hzNVNSz8O", "title": "No learning rates needed: Introducing SaLSa - Stable 
Armijo Line Search Adaptation", "track": "main", "status": "Reject", "tldr": "", "abstract": "In recent studies, line search methods have been demonstrated to significantly\nenhance the performance of conventional stochastic gradient descent techniques\nacross various datasets and architectures, while making an otherwise critical choice\nof learning rate schedule superfluous Vaswani et al. (2019); Mahsereci & Hennig\n(2015); Vaswani et al. (2021). In this paper, we identify problems of current state-of-the-art of line search methods Vaswani et al. (2019; 2021), propose enhancements,\nand rigorously assess their effectiveness. Furthermore, we evaluate these methods\non orders of magnitude larger datasets and more complex data domains than\npreviously done.\nMore specifically, we enhance the Armijo line search method by speeding up\nits computation and incorporating a momentum term into the Armijo criterion,\nmaking it better suited for stochastic mini-batching. Our optimization approach\noutperforms both the previous Armijo implementation and a tuned learning rate\nschedule for the Adam and SGD optimizers. Our evaluation covers a diverse range\nof architectures, such as Transformers, CNNs, and MLPs, as well as data domains,\nincluding NLP and image data.\nOur work is publicly available as a Python package, which provides a hyperparameter free Pytorch optimizer.", "keywords": "Optimizer;Line Search;Learning Rate;Transformer;CNN", "primary_area": "optimization", "supplementary_material": "/attachment/3e2cb2716f600ac3e583f19ee60d465c0a1a8a31.zip", "author": "Philip Kenneweg;Tristan Kenneweg;Fabian Fumagalli;Barbara Hammer", "authorids": "~Philip_Kenneweg1;~Tristan_Kenneweg1;~Fabian_Fumagalli1;~Barbara_Hammer4", "gender": "M;M;M;F", "homepage": ";;https://hammer-lab.techfak.uni-bielefeld.de/people/316634936/;https://www.techfak.uni-bielefeld.de/~bhammer/", "dblp": "306/1101;;329/4508;h/BarbaraHammer", "google_scholar": ";;anUMB08AAAAJ;1d3OxaUAAAAJ", "orcid": "0000-0002-7097-173X;0000-0001-8213-9396;0000-0003-3955-3510;0000-0002-2615-8151", "linkedin": ";;fabian-fumagalli/;", "or_profile": "~Philip_Kenneweg1;~Tristan_Kenneweg1;~Fabian_Fumagalli1;~Barbara_Hammer4", "aff": ";Universit\u00e4t Bielefeld;Universit\u00e4t Bielefeld;Universit\u00e4t Bielefeld", "aff_domain": ";uni-bielefeld.de;uni-bielefeld.de;uni-bielefeld.de", "position": ";PhD student;PhD student;Full Professor", "bibtex": "@misc{\nkenneweg2024no,\ntitle={No learning rates needed: Introducing Sa{LS}a - Stable Armijo Line Search Adaptation},\nauthor={Philip Kenneweg and Tristan Kenneweg and Fabian Fumagalli and Barbara Hammer},\nyear={2024},\nurl={https://openreview.net/forum?id=6hzNVNSz8O}\n}", "github": "", "project": "", "reviewers": "XiSh;QdFA;F4Yh;9vmP", "site": "https://openreview.net/forum?id=6hzNVNSz8O", "pdf_size": 8030403, "rating": "3;3;6;8", "confidence": "5;3;3;5", "soundness": "2;2;3;3", "contribution": "2;3;3;3", "presentation": "3;2;4;3", "wc_summary": "16;38;104;83", "wc_strengths": "27;33;39;100", "wc_weaknesses": "299;181;89;98", "wc_questions": "25;106;81;75", "wc_review": "367;358;313;356", "wc_reply_reviewers": "94;235;0;9", "wc_reply_authors": "622;875;38;302", "reply_reviewers": "1;1;0;1", "reply_authors": "1;2;1;1", "rating_avg": [ 5.0, 2.1213203435596424 ], "confidence_avg": [ 4.0, 1.0 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 60.25, 34.945493271665235 ], "wc_strengths_avg": [ 49.75, 
29.32042803234632 ], "wc_weaknesses_avg": [ 166.75, 84.35749818480868 ], "wc_questions_avg": [ 71.75, 29.38856069970083 ], "wc_review_avg": [ 348.5, 20.910523666326483 ], "wc_reply_reviewers_avg": [ 84.5, 94.31463301100206 ], "wc_reply_authors_avg": [ 459.25, 316.8259577433642 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.23570226039551587, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:Op7vTIATlvUJ:scholar.google.com/&scioq=No+learning+rates+needed:+Introducing+SaLSa+-+Stable+Armijo+Line+Search+Adaptation&hl=en&as_sdt=0,33", "gs_version_total": 6, "aff_unique_index": "0;0;0", "aff_unique_norm": "Universit\u00e4t Bielefeld", "aff_unique_dep": "", "aff_unique_url": "https://www.uni-bielefeld.de/", "aff_unique_abbr": "Uni Bielefeld", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "Germany" }, { "id": "6iM2asNCjK", "title": "On Robustness-Accuracy Characterization of Large Language Models using Synthetic Datasets", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "In recent years, large language models (LLMs) that were pretrained at scale on diverse data have proven to be a successful approach for solving different downstream tasks. However, new concerns about proper performance evaluation have been raised, especially for test-data leakage caused by accidentally including them during pretraining, or by indirectly exposing them through API calls for evaluation. Motivated by these, in this paper, we propose a new evaluation workflow that generates steerable synthetic language datasets and proxy tasks for benchmarking the performance of pretrained LLMs on sentence classification tasks. This approach allows for better characterization of the joint analysis on the robustness and accuracy of LLMs without risking sensitive information leakage. It also provides a more controlled and private way to evaluate LLMs that avoids overfitting specific test sets. 
Verified on various pretrained LLMs, the proposed approach demonstrates promising high correlation with real downstream performance.", "keywords": "language model; real-data-free", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "Ching-Yun Ko;Pin-Yu Chen;Payel Das;Yung-Sung Chuang;Luca Daniel", "authorids": "~Ching-Yun_Ko1;~Pin-Yu_Chen1;~Payel_Das1;~Yung-Sung_Chuang1;~Luca_Daniel1", "gender": "F;M;F;M;", "homepage": ";http://www.pinyuchen.com;;https://people.csail.mit.edu/yungsung/;https://www.mit.edu/~dluca/", "dblp": "206/6472;39/8969;56/7926;64/3095;35/5202", "google_scholar": ";jxwlCUUAAAAJ;;3ar1DOwAAAAJ;", "orcid": ";0000-0003-1039-8369;;0000-0002-1723-5063;0000-0002-5880-3151", "linkedin": ";pin-yu-chen-940062a2;;yschuang;", "or_profile": "~Ching-Yun_Ko1;~Pin-Yu_Chen1;~Payel_Das1;~Yung-Sung_Chuang1;~Luca_Daniel1", "aff": "Massachusetts Institute of Technology;International Business Machines;IBM, International Business Machines;Massachusetts Institute of Technology;", "aff_domain": "mit.edu;ibm.com;us.ibm.com;mit.edu;", "position": "PhD student;Principal Researcher;Principal Researcher;PhD student;", "bibtex": "@misc{\nko2024on,\ntitle={On Robustness-Accuracy Characterization of Large Language Models using Synthetic Datasets},\nauthor={Ching-Yun Ko and Pin-Yu Chen and Payel Das and Yung-Sung Chuang and Luca Daniel},\nyear={2024},\nurl={https://openreview.net/forum?id=6iM2asNCjK}\n}", "github": "", "project": "", "reviewers": "QVm9;ALMM;XF6K", "site": "https://openreview.net/forum?id=6iM2asNCjK", "pdf_size": 1124006, "rating": "3;3;5", "confidence": "2;4;3", "soundness": "2;3;4", "contribution": "2;2;2", "presentation": "1;3;3", "wc_summary": "252;66;249", "wc_strengths": "44;25;75", "wc_weaknesses": "268;133;428", "wc_questions": "2;1;160", "wc_review": "566;225;912", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 3.6666666666666665, 0.9428090415820634 ], "confidence_avg": [ 3.0, 0.816496580927726 ], "soundness_avg": [ 3.0, 0.816496580927726 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.3333333333333335, 0.9428090415820634 ], "wc_summary_avg": [ 189.0, 86.98275691193054 ], "wc_strengths_avg": [ 48.0, 20.607442021431645 ], "wc_weaknesses_avg": [ 276.3333333333333, 120.57731498457282 ], "wc_questions_avg": [ 54.333333333333336, 74.71873184743494 ], "wc_review_avg": [ 567.6666666666666, 280.46905157055903 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 6, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6108874926867295991&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 5, "aff_unique_index": "0;1;2;0", "aff_unique_norm": "Massachusetts Institute of Technology;International Business Machines Corporation;International Business Machines", "aff_unique_dep": ";;", "aff_unique_url": "https://web.mit.edu;https://www.ibm.com;https://www.ibm.com", "aff_unique_abbr": "MIT;IBM;IBM", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "title": "STanHop: Sparse Tandem Hopfield Model for Memory-Enhanced Time Series Prediction", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19385", "id": "6iwg437CZs", "author_site": 
"Yu-Hsuan Wu, Jerry Hu, Weijian Li, Bo-Yu Chen, Han Liu", "tldr": "", "abstract": "We present **STanHop-Net** (**S**parse **Tan**dem **Hop**field **Net**work) for multivariate time series prediction with memory-enhanced capabilities. At the heart of our approach is **STanHop**, a novel Hopfield-based neural network block, which sparsely learns and stores both temporal and cross-series representations in a data-dependent fashion. In essence, STanHop sequentially learns temporal representation and cross-series representation using two tandem sparse Hopfield layers. Additionally, STanHop incorporates two external memory modules: **Plug-and-Play** and **Tune-and-Play** for train-less and task-aware memory enhancements, respectively. They allow StanHop-Net to swiftly respond to sudden events. Methodologically, we construct the STanHop-Net by stacking STanHop blocks in a hierarchical fashion, enabling multi-resolution feature extraction with resolution-specific sparsity. Theoretically, we introduce a unified construction (**Generalized Sparse Modern Hopfield Model**) for both dense and sparse modern Hopfield models and show that it endows a tighter memory retrieval error compared to the dense counterpart without sacrificing memory capacity. Empirically, we validate the efficacy of STanHop-Net on many settings: time series prediction, fast test-time adaptation, and strongly correlated time series prediction.", "keywords": "Time Series Prediction; Multivariate Time Series; Modern Hopfield Networks; Sparse Hopfield Model; Hopfield Layer; Attention Mechanism", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/f4fbc7215901e8f014e4e4ac13e571e625f93d01.pdf", "author": "Dennis Wu;Jerry Yao-Chieh Hu;Weijian Li;Bo-Yu Chen;Han Liu", "authorids": "~Dennis_Wu1;~Jerry_Yao-Chieh_Hu1;~Weijian_Li2;~Bo-Yu_Chen1;~Han_Liu4", "gender": ";;M;M;", "homepage": ";;;https://phys-mattchen.github.io/;", "dblp": ";;;;", "google_scholar": ";;https://scholar.google.com/citations?hl=en;;", "orcid": ";;0009-0003-4158-4380;0000-0003-4997-1652;", "linkedin": ";;weijian-li-b52566153/;;", "or_profile": "~Dennis_Wu1;~Jerry_Yao-Chieh_Hu1;~Weijian_Li2;~Bo-Yu_Chen1;~Han_Liu4", "aff": ";;Northwestern University;University of Chicago;Northwestern University", "aff_domain": ";;northwestern.edu;uchicago.edu;u.northwestern.edu", "position": ";;PhD student;Exchange student;Associate Professor", "bibtex": "@inproceedings{\nwu2024stanhop,\ntitle={{ST}anHop: Sparse Tandem Hopfield Model for Memory-Enhanced Time Series Prediction},\nauthor={Dennis Wu and Jerry Yao-Chieh Hu and Weijian Li and Bo-Yu Chen and Han Liu},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=6iwg437CZs}\n}", "github": "", "project": "", "reviewers": "xuHy;ntR2;u61L;BpQa", "pdf_size": 5898172, "rating": "5;5;8;8", "confidence": "3;2;4;4", "soundness": "3;2;3;3", "contribution": "2;2;2;3", "presentation": "2;2;3;3", "wc_summary": "94;53;74;79", "wc_strengths": "53;23;33;33", "wc_weaknesses": "176;32;65;27", "wc_questions": "22;37;348;338", "wc_review": "345;145;520;477", "wc_reply_reviewers": "55;0;26;46", "wc_reply_authors": "2836;1403;2667;1299", "reply_reviewers": "1;0;1;1", "reply_authors": "6;4;7;4", "rating_avg": [ 6.5, 1.5 ], "confidence_avg": [ 3.25, 0.82915619758885 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.5, 
0.5 ], "wc_summary_avg": [ 75.0, 14.679918255903198 ], "wc_strengths_avg": [ 35.5, 10.897247358851684 ], "wc_weaknesses_avg": [ 75.0, 60.11239472854163 ], "wc_questions_avg": [ 186.25, 156.8795318070525 ], "wc_review_avg": [ 371.75, 145.93384631400627 ], "wc_reply_reviewers_avg": [ 31.75, 21.123150806638673 ], "wc_reply_authors_avg": [ 2051.25, 703.755772622861 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 5.25, 1.299038105676658 ], "replies_avg": [ 31, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.9045340337332909, "gs_citation": 47, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=7180925615475172223&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=6iwg437CZs", "pdf": "https://openreview.net/pdf?id=6iwg437CZs", "email": ";;northwestern.edu;uchicago.edu;u.northwestern.edu", "author_num": 5, "aff_unique_index": "0;1;0", "aff_unique_norm": "Northwestern University;University of Chicago", "aff_unique_dep": ";", "aff_unique_url": "https://www.northwestern.edu;https://www.uchicago.edu", "aff_unique_abbr": "NU;UChicago", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "6j9Y1APsAm", "title": "Hierarchical Probabilistic Neural Network: Efficient and Accurate Uncertainty Quantification", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Bayesian neural networks (BNNs) are known for accurately estimating the posterior distribution of model parameters, showcasing their effectiveness in uncertainty quantification (UQ). However, the computational demands of Bayesian inference can be challenging. Evidential deep learning methods address this by treating target distribution parameters as random variables with a learnable conjugate distribution, thus allowing for efficient UQ. In our paper, we present the Hierarchical Probabilistic Neural Network (HPNN), offering new insights into existing evidential deep learning methods. Firstly, it distills BNN knowledge into a single deterministic network, endowing it with a Bayesian perspective and theoretical guarantees. Secondly, we introduce a self-regularized training strategy using Laplacian approximation (LA) for self-distillation, bypassing the heavy computational load with BNNs. Thirdly, we propose to utilize flexible normalizing flows to alleviate the conjugate prior assumption in a post-processing manner, where a few training iterations can enhance model performance. Lastly, we present the Hierarchical Bayesian Neural Network, which treats the NN parameters in HPNN as random variables, for further improving UQ accuracy. 
The experiment results demonstrate the effectiveness of our proposed methods in both UQ accuracy and robustness.", "keywords": "Uncertainty Quantification;Evidential Deep Learning", "primary_area": "probabilistic methods (Bayesian methods, variational inference, sampling, UQ, etc.)", "supplementary_material": "", "author": "Hanjing Wang;Qiang Ji", "authorids": "~Hanjing_Wang2;~Qiang_Ji1", "gender": "M;M", "homepage": "https://www.ecse.rpi.edu/~cvrl/people_zw.html;https://www.ecse.rpi.edu/~qji/", "dblp": "234/8752;", "google_scholar": ";vAXmpVIAAAAJ", "orcid": ";", "linkedin": ";", "or_profile": "~Hanjing_Wang2;~Qiang_Ji1", "aff": "Rensselaer Polytechnic Institute;Rensselaer Polytechnic Institute", "aff_domain": "rpi.edu;rpi.edu", "position": "PhD student;Professor", "bibtex": "@misc{\nwang2024hierarchical,\ntitle={Hierarchical Probabilistic Neural Network: Efficient and Accurate Uncertainty Quantification},\nauthor={Hanjing Wang and Qiang Ji},\nyear={2024},\nurl={https://openreview.net/forum?id=6j9Y1APsAm}\n}", "github": "", "project": "", "reviewers": "", "site": "https://openreview.net/forum?id=6j9Y1APsAm", "pdf_size": 0, "rating": "", "confidence": "", "soundness": "", "contribution": "", "presentation": "", "wc_summary": "", "wc_strengths": "", "wc_weaknesses": "", "wc_questions": "", "wc_review": "", "wc_reply_reviewers": "", "wc_reply_authors": "", "reply_reviewers": "", "reply_authors": "", "rating_avg": [ 0, 0 ], "confidence_avg": [ 0, 0 ], "soundness_avg": [ 0, 0 ], "contribution_avg": [ 0, 0 ], "presentation_avg": [ 0, 0 ], "wc_summary_avg": [ 0, 0 ], "wc_strengths_avg": [ 0, 0 ], "wc_weaknesses_avg": [ 0, 0 ], "wc_questions_avg": [ 0, 0 ], "wc_review_avg": [ 0, 0 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 0, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:zOj0eyQ-wCcJ:scholar.google.com/&scioq=Hierarchical+Probabilistic+Neural+Network:+Efficient+and+Accurate+Uncertainty+Quantification&hl=en&as_sdt=0,44", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "Rensselaer Polytechnic Institute", "aff_unique_dep": "", "aff_unique_url": "https://www.rpi.edu", "aff_unique_abbr": "RPI", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "id": "6jBNQ8nSxA", "title": "Just-in-Time Security Patch Detection - LLM At the Rescue for Data Augmentation", "track": "main", "status": "Reject", "tldr": "", "abstract": "In the face of growing vulnerabilities found in open-source software, the need to identify {discreet} security patches has become paramount. The lack of consistency in how software providers handle maintenance often leads to the release of security patches without comprehensive advisories, leaving users vulnerable to unaddressed security risks. To address this pressing issue, we introduce a novel security patch detection system, LLMDA, which capitalizes on Large Language Models (LLMs) and code-text alignment methodologies for patch review, data enhancement, and feature combination. Within LLMDA, we initially utilize LLMs for examining patches and expanding data of PatchDB and SPI-DB, two security patch datasets from recent literature. We then use labeled instructions to direct our LLMDA, differentiating patches based on security relevance. 
Following this, we apply a PTFormer to merge patches with code, formulating hybrid attributes that encompass both the innate details and the interconnections between the patches and the code. This distinctive combination method allows our system to capture more insights from the combined context of patches and code, hence improving detection precision. Finally, we devise a probabilistic batch contrastive learning mechanism within batches to augment the capability of our LLMDA in discerning security patches. The results reveal that LLMDA significantly surpasses state-of-the-art techniques in detecting security patches, underscoring its promise in fortifying software maintenance.", "keywords": "Open-source software vulnerabilities;Security patch detection;Large Language Models (LLMs);PT-Former;Code-text alignment", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Xunzhu Tang;Zhenghan Chen;KISUB KIM;Haoye Tian;Saad Ezzini;Jacques Klein;Tegawend\u00e9 F. Bissyand\u00e9", "authorids": "~Xunzhu_Tang1;~Zhenghan_Chen3;~KISUB_KIM1;~Haoye_Tian2;~Saad_Ezzini1;~Jacques_Klein1;~Tegawend\u00e9_F._Bissyand\u00e91", "gender": ";;M;;M;M;M", "homepage": ";;https://falconlk.github.io/react-gh-pages/;;https://ezzini.me;https://jacquesklein2302.github.io/;https://bissyande.github.io/", "dblp": ";;216/3065.html;;216/8359.html;k/JacquesKlein;00/8006.html", "google_scholar": ";;Nr_IDzQAAAAJ;;48ebm6wAAAAJ;https://scholar.google.fr/citations?user=9E_KKT4AAAAJ;t73Mqm8AAAAJ", "orcid": ";;0000-0002-4462-6916;;0000-0001-7657-4738;0000-0003-4052-475X;0000-0001-7270-9869", "linkedin": ";;kisub-kim-81199a179/;;saad-ezzini/;jacques-klein-188b0b5/;", "or_profile": "~Xunzhu_Tang1;~Zhenghan_Chen3;~KISUB_KIM1;~Haoye_Tian2;~Saad_Ezzini1;~Jacques_Klein1;~Tegawend\u00e9_F._Bissyand\u00e91", "aff": ";;;;Lancaster University;University of Luxemburg;University of Luxemburg", "aff_domain": ";;;;lancaster.ac.uk;uni.lu;uni.lu", "position": ";;;;Assistant Professor;Full Professor;Associate Professor", "bibtex": "@misc{\ntang2024justintime,\ntitle={Just-in-Time Security Patch Detection - {LLM} At the Rescue for Data Augmentation},\nauthor={Xunzhu Tang and Zhenghan Chen and KISUB KIM and Haoye Tian and Saad Ezzini and Jacques Klein and Tegawend{\\'e} F. 
Bissyand{\\'e}},\nyear={2024},\nurl={https://openreview.net/forum?id=6jBNQ8nSxA}\n}", "github": "", "project": "", "reviewers": "pMnS;z5t8;T4hh;aN2M", "site": "https://openreview.net/forum?id=6jBNQ8nSxA", "pdf_size": 3436072, "rating": "3;5;8;8", "confidence": "4;3;5;4", "soundness": "3;2;4;3", "contribution": "2;2;4;4", "presentation": "1;2;4;3", "wc_summary": "53;80;87;58", "wc_strengths": "65;46;184;99", "wc_weaknesses": "364;183;51;57", "wc_questions": "2;170;45;57", "wc_review": "484;479;367;271", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "781;719;390;694", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 6.0, 2.1213203435596424 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 3.0, 1.0 ], "presentation_avg": [ 2.5, 1.118033988749895 ], "wc_summary_avg": [ 69.5, 14.326548781894402 ], "wc_strengths_avg": [ 98.5, 52.88903478037768 ], "wc_weaknesses_avg": [ 163.75, 127.06174680052214 ], "wc_questions_avg": [ 68.5, 62.06649659840645 ], "wc_review_avg": [ 400.25, 88.07205856569948 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 646.0, 151.15720293786862 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": 0.5000000000000001, "gs_citation": 11, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5054369013991040277&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 2, "aff_unique_index": "0;1;1", "aff_unique_norm": "Lancaster University;University of Luxembourg", "aff_unique_dep": ";", "aff_unique_url": "https://www.lancaster.ac.uk;https://wwwen.uniluxembourg.lu", "aff_unique_abbr": "Lancaster;Uni Lu", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;1", "aff_country_unique": "United Kingdom;Luxembourg" }, { "id": "6jFjYmahxu", "title": "DiffSound: Differentiable Modal Sound Simulation for Inverse Reasoning", "track": "main", "status": "Reject", "tldr": "", "abstract": "Accurately estimating and simulating the physical properties of objects from real-world audio observations is of great practical importance in the field of vision and embodied AI. However, previous differentiable rigid or soft body simulations cannot be directly applied to modal sound synthesis due to the high sampling rate of sound, and previous audio synthesizers do not fully model the physical properties of objects behind the modal analysis.\nWe propose DiffSound, a differentiable sound simulation framework for physically based modal sound synthesis.\nOur framework is capable of solving a range of inverse problems, including object shape, material parameter, and impact position reasoning.\nExperimental results demonstrate the effectiveness of our approach, highlighting its ability to accurately estimate physical parameters and reproduce the target sound. 
Our DiffSound differentiable sound simulator serves as a valuable tool for applications requiring sound synthesis and analysis.", "keywords": "sound synthesis;differentiable simulation;modal analysis;vibration;audio", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/4e30cfff50a5bd6be4665224e4ef810b732e1f6f.zip", "author": "Xutong Jin;Chenxi Xu;Ruohan Gao;Jiajun Wu;Guoping Wang;Sheng Li", "authorids": "~Xutong_Jin1;~Chenxi_Xu1;~Ruohan_Gao2;~Jiajun_Wu1;~Guoping_Wang1;~Sheng_Li9", "gender": ";M;M;M;M;M", "homepage": "https://hellojxt.github.io/;https://technetiumman.github.io/;https://ruohangao.github.io/;https://jiajunwu.com;https://www.graphics.pku.edu.cn/xztd/jgfaculty/wgp2/index.htm;https://lishengpku.github.io/", "dblp": ";;176/5787;117/4768;;23/3439-8", "google_scholar": ";;i02oEgMAAAAJ;2efgcS0AAAAJ;;", "orcid": ";;0000-0002-8346-1114;0000-0002-4176-343X;0000-0001-7819-0076;", "linkedin": ";;;jiajunwu/;;", "or_profile": "~Xutong_Jin1;~Chenxi_Xu1;~Ruohan_Gao2;~Jiajun_Wu1;~Guoping_Wang1;~Sheng_Li9", "aff": "Peking University;Peking University;Meta;Stanford University;Peking University;Peking University", "aff_domain": "pku.edu.cn;pku.edu.cn;meta.com;stanford.edu;pku.edu.cn;pku.edu.cn", "position": "PhD student;MS student;Researcher;Assistant Professor;Full Professor;Full Professor", "bibtex": "@misc{\njin2024diffsound,\ntitle={DiffSound: Differentiable Modal Sound Simulation for Inverse Reasoning},\nauthor={Xutong Jin and Chenxi Xu and Ruohan Gao and Jiajun Wu and Guoping Wang and Sheng Li},\nyear={2024},\nurl={https://openreview.net/forum?id=6jFjYmahxu}\n}", "github": "", "project": "", "reviewers": "oyHm;cDNR;Kc8Y;aeBV", "site": "https://openreview.net/forum?id=6jFjYmahxu", "pdf_size": 21414000, "rating": "3;3;5;5", "confidence": "3;3;3;4", "soundness": "2;2;3;2", "contribution": "2;2;2;2", "presentation": "3;3;2;2", "wc_summary": "73;82;49;66", "wc_strengths": "39;49;20;91", "wc_weaknesses": "59;68;89;262", "wc_questions": "77;72;102;7", "wc_review": "248;271;260;426", "wc_reply_reviewers": "9;0;0;0", "wc_reply_authors": "170;93;48;53", "reply_reviewers": "1;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 67.5, 12.093386622447824 ], "wc_strengths_avg": [ 49.75, 25.9939896899264 ], "wc_weaknesses_avg": [ 119.5, 82.98945716173831 ], "wc_questions_avg": [ 64.5, 35.0891721190455 ], "wc_review_avg": [ 301.25, 72.48232543179061 ], "wc_reply_reviewers_avg": [ 2.25, 3.897114317029974 ], "wc_reply_authors_avg": [ 91.0, 48.83134239399937 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.5773502691896257, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:NZhLCezfaYAJ:scholar.google.com/&scioq=DiffSound:+Differentiable+Modal+Sound+Simulation+for+Inverse+Reasoning&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;0;1;2;0;0", "aff_unique_norm": "Peking University;Meta;Stanford University", "aff_unique_dep": ";Meta Platforms, Inc.;", "aff_unique_url": "http://www.pku.edu.cn;https://meta.com;https://www.stanford.edu", "aff_unique_abbr": "Peking U;Meta;Stanford", "aff_campus_unique_index": "1", "aff_campus_unique": ";Stanford", 
"aff_country_unique_index": "0;0;1;1;0;0", "aff_country_unique": "China;United States" }, { "id": "6jJFmwAlen", "title": "Investigating the Fairness of Large Language Models for Predictions on Tabular Data", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Recent literature has suggested the potential of using large language models (LLMs) to make predictions for tabular tasks. However, LLMs have been shown to exhibit harmful social biases that reflect the stereotypes and inequalities present in the society. To this end, as well as the widespread use of tabular data in many high-stake applications, it is imperative to explore the following questions: what sources of information do LLMs draw upon when making predictions for tabular tasks; whether and to what extent are LLM predictions for tabular tasks influenced by social biases and stereotypes; and what are the consequential implications for fairness? Through a series of experiments, we delve into these questions and show that LLMs tend to inherit social biases from their training data which significantly impact their fairness in tabular prediction tasks. Furthermore, our investigations show that in the context of bias mitigation, though in-context learning and fine-tuning have a moderate effect, the fairness metric gap between different subgroups is still larger than that in traditional machine learning models, such as Random Forest and shallow Neural Networks. This observation emphasizes that the social biases are inherent within the LLMs themselves and inherited from their pre-training corpus, not only from the downstream task datasets. Besides, we demonstrate that label-flipping of in-context examples can significantly reduce biases, further highlighting the presence of inherent bias within LLMs.", "keywords": "Fairness;Social Biases;Large Language Models;In-Context Learning;Tabular Data;Trustworthy ML", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "Yanchen Liu;Srishti Gautam;Jiaqi Ma;Himabindu Lakkaraju", "authorids": "~Yanchen_Liu2;~Srishti_Gautam1;~Jiaqi_Ma1;~Himabindu_Lakkaraju1", "gender": "M;F;;F", "homepage": "https://liuyanchen1015.github.io/;;https://jiaqima.github.io;http://web.stanford.edu/~himalv", "dblp": ";201/6628;155/2199-1;68/9376", "google_scholar": "https://scholar.google.com/citations?hl=en;7V_riiYAAAAJ;Z9X2A1MAAAAJ;", "orcid": ";;0000-0001-8292-5901;", "linkedin": ";;;", "or_profile": "~Yanchen_Liu2;~Srishti_Gautam1;~Jiaqi_Ma1;~Hima_Lakkaraju1", "aff": "Harvard University;UiT The Arctic University of Norway;University of Illinois Urbana-Champaign;Harvard University", "aff_domain": "harvard.edu;uit.no;illinois.edu;harvard.edu", "position": "MS student;PhD student;Assistant Professor;Assistant Professor", "bibtex": "@misc{\nliu2024investigating,\ntitle={Investigating the Fairness of Large Language Models for Predictions on Tabular Data},\nauthor={Yanchen Liu and Srishti Gautam and Jiaqi Ma and Himabindu Lakkaraju},\nyear={2024},\nurl={https://openreview.net/forum?id=6jJFmwAlen}\n}", "github": "", "project": "", "reviewers": "qNdb;eUu3;rhXH;Vp7m;fjE3;88s7", "site": "https://openreview.net/forum?id=6jJFmwAlen", "pdf_size": 227848, "rating": "3;3;3;5;5;5", "confidence": "4;4;4;4;4;4", "soundness": "2;2;1;2;2;2", "contribution": "2;2;3;2;3;2", "presentation": "3;3;2;2;3;3", "wc_summary": "77;57;31;50;32;200", "wc_strengths": "89;35;50;19;83;74", "wc_weaknesses": "252;158;80;531;105;60", "wc_questions": "5;235;15;3;148;66", 
"wc_review": "423;485;176;603;368;400", "wc_reply_reviewers": "0;0;0;0;0;0", "wc_reply_authors": "0;0;0;0;0;0", "reply_reviewers": "0;0;0;0;0;0", "reply_authors": "0;0;0;0;0;0", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 1.8333333333333333, 0.3726779962499649 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 74.5, 58.254470500840824 ], "wc_strengths_avg": [ 58.333333333333336, 25.67532321553562 ], "wc_weaknesses_avg": [ 197.66666666666666, 161.77213054856585 ], "wc_questions_avg": [ 78.66666666666667, 86.22966749069344 ], "wc_review_avg": [ 409.1666666666667, 128.87903458497647 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 6, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 12, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=4414628081737124617&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 2, "aff_unique_index": "0;1;2;0", "aff_unique_norm": "Harvard University;Arctic University of Norway;University of Illinois Urbana-Champaign", "aff_unique_dep": ";;", "aff_unique_url": "https://www.harvard.edu;https://www.uit.no;https://illinois.edu", "aff_unique_abbr": "Harvard;UiT;UIUC", "aff_campus_unique_index": "1", "aff_campus_unique": ";Urbana-Champaign", "aff_country_unique_index": "0;1;0;0", "aff_country_unique": "United States;Norway" }, { "id": "6kpXxfA3Oi", "title": "Fill with Anything: High-Resolution and Prompt-Faithful Image Completion", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Building on the achievements of text-to-image diffusion models, recent advancements in text-guided image inpainting have yielded remarkably realistic and visually compelling outcomes. \nNevertheless, current text-to-image inpainting models leave substantial room for enhancement, particularly in addressing the often inadequate alignment of user prompts with the inpainted region, and in extending applicability to high-resolution images. \nTo this end, this paper introduces an entirely $\\textbf{training-free}$ approach that $\\textbf{faithfully adheres to prompts}$ and seamlessly $\\textbf{scale to high-resolution}$ image inpainting. \nTo achieve this, we first present the Prompt-Aware Introverted Attention (PAIntA) layer, which enriches self-attention modules by incorporating prompt information derived from cross-attention scores, alleviating the visual context dominance in inpainting caused by all-to-all attention. \nFurthermore, we introduce the Reweighting Attention Score Guidance (RASG) mechanism, which directs cross-attention scores towards improved textual alignment while preserving the generation domain. \nIn addition, to address inpainting at larger scales, we introduce a specialized super-resolution technique tailored for inpainting, enabling the completion of missing regions in images of up to 2K resolution. Experimental results demonstrate that our proposed method surpasses existing state-of-the-art approaches in both qualitative and quantitative measures, achieving a substantial generation accuracy improvement of $\\textbf{61.4\\%}$ compared to $\\textbf{51.9\\%}$. 
Our codes will be open-sourced.", "keywords": "text-guided inpainting;diffusion inpainting;reweighting attention score guidance;prompt-aware introverted attention;RASG;PaIntA;conditional super-resolution;classifier guidance;classifier-free guidance;introvert attention;diffusion models", "primary_area": "generative models", "supplementary_material": "/attachment/215f397fd495b4c5a4252b56774027d4c45c8b4e.pdf", "author": "Hayk Manukyan;Andranik Sargsyan;Barsegh Atanyan;Zhangyang Wang;Shant Navasardyan;Humphrey Shi", "authorids": "~Hayk_Manukyan1;~Andranik_Sargsyan1;~Barsegh_Atanyan1;~Zhangyang_Wang1;~Shant_Navasardyan1;~Humphrey_Shi1", "gender": "M;M;M;M;M;M", "homepage": ";;;https://vita-group.github.io;;https://www.humphreyshi.com", "dblp": ";332/5291;;119/4026;286/5315;176/5516", "google_scholar": ";cg74A98AAAAJ;;pxFyKAIAAAAJ;VJSh59sAAAAJ;WBvt5A8AAAAJ", "orcid": ";0000-0001-8018-7941;;;0000-0002-1999-9999;0000-0002-2922-5663", "linkedin": "hayk-manukyan-4aab0962/;andraniksargsyan/;barsegh-atanyan-2012a412b;;shant-navasardyan-1302aa149;humphreyshi", "or_profile": "~Hayk_Manukyan1;~Andranik_Sargsyan1;~Barsegh_Atanyan1;~Zhangyang_Wang1;~Shant_Navasardyan1;~Honghui_Shi1", "aff": "Picsart AI Research;Yerevan State University;Picsart;University of Texas at Austin;Picsart Inc;University of Illinois, Urbana Champaign", "aff_domain": "picsart.com;ysu.am;picsart.com;utexas.edu;picsart.com;illinois.edu", "position": "Researcher;MS student;Researcher;Associate Professor;Researcher;Adjunct Assistant Professor", "bibtex": "@misc{\nmanukyan2024fill,\ntitle={Fill with Anything: High-Resolution and Prompt-Faithful Image Completion},\nauthor={Hayk Manukyan and Andranik Sargsyan and Barsegh Atanyan and Zhangyang Wang and Shant Navasardyan and Humphrey Shi},\nyear={2024},\nurl={https://openreview.net/forum?id=6kpXxfA3Oi}\n}", "github": "", "project": "", "reviewers": "Q343;BeCN;WycU;ZNkY", "site": "https://openreview.net/forum?id=6kpXxfA3Oi", "pdf_size": 32290227, "rating": "3;3;5;6", "confidence": "5;5;4;4", "soundness": "3;2;3;3", "contribution": "3;2;3;3", "presentation": "3;3;2;3", "wc_summary": "52;64;69;56", "wc_strengths": "21;33;46;90", "wc_weaknesses": "19;313;173;149", "wc_questions": "201;62;52;19", "wc_review": "293;472;340;314", "wc_reply_reviewers": "43;204;117;0", "wc_reply_authors": "938;1489;1374;756", "reply_reviewers": "1;1;1;0", "reply_authors": "2;3;2;1", "rating_avg": [ 4.25, 1.299038105676658 ], "confidence_avg": [ 4.5, 0.5 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 60.25, 6.6473679001541655 ], "wc_strengths_avg": [ 47.5, 26.081602711489953 ], "wc_weaknesses_avg": [ 163.5, 104.32041986111827 ], "wc_questions_avg": [ 83.5, 69.67962399439308 ], "wc_review_avg": [ 354.75, 69.71145888589622 ], "wc_reply_reviewers_avg": [ 91.0, 77.50806409658288 ], "wc_reply_authors_avg": [ 1139.25, 301.99948261545086 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 2.0, 0.7071067811865476 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.9622504486493761, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:FgXryZtrne4J:scholar.google.com/&scioq=Fill+with+Anything:+High-Resolution+and+Prompt-Faithful+Image+Completion&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1;0;2;3;4", "aff_unique_norm": "Picsart;Yerevan State University;University of Texas at Austin;Picsart 
Inc;University of Illinois Urbana-Champaign", "aff_unique_dep": "AI Research;;;;", "aff_unique_url": "https://research.picsart.com;https://www.yerevanstateuniversity.am;https://www.utexas.edu;https://www.picsart.com;https://illinois.edu", "aff_unique_abbr": "Picsart AI;YSU;UT Austin;Picsart;UIUC", "aff_campus_unique_index": "1;2", "aff_campus_unique": ";Austin;Urbana-Champaign", "aff_country_unique_index": "0;1;0;0;0;0", "aff_country_unique": "United States;Armenia" }, { "title": "Mixture-of-Experts Meets Instruction Tuning: A Winning Combination for Large Language Models", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19384", "id": "6mLjDwYte5", "author_site": "Sheng Shen, Le Hou, Yanqi Zhou, Nan Du, Shayne Longpre, Jason Wei, Hyung Won Chung, Barret Zoph, William Fedus, Xinyun Chen, Tu Vu, Yuexin Wu, Wuyang Chen, Albert Webson, Yunxuan Li, Vincent Zhao, Hongkun Yu, Kurt Keutzer, trevor darrell, Denny Zhou", "tldr": "", "abstract": "Sparse Mixture-of-Experts (MoE) is a neural architecture design that adds learnable parameters to Large Language Models (LLMs) without increasing computational complexity (FLOPs). Instruction tuning is a technique for training LLMs to follow instructions. We advocate combining these two approaches, as we find that MoE models benefit more from instruction tuning than dense models. In particular, we conduct empirical studies across three experimental setups: (i) Direct finetuning on individual downstream tasks devoid of instruction tuning; (ii) Instruction tuning followed by in-context few-shot or zero-shot generalization on downstream tasks; and (iii) Instruction tuning supplemented by further finetuning on individual downstream tasks. In the first scenario, MoE models overall underperform dense models of identical computational capacity. This narrative, however, dramatically changes with the introduction of instruction tuning (in the second and third scenarios), used independently or in conjunction with task-specific finetuning. Our most powerful model, FLAN-MoE-32B, surpasses the performance of Flan-PaLM-62B on four benchmark tasks, while using only a third of the FLOPs. 
The advancements embodied by FLAN-MoE inspire a reevaluation of the design principles of large-scale, high-performance language models in the framework of task-agnostic learning.", "keywords": "MoE;Instruction Tuning", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/25fb86090add41f7670f809a72fbb705fecd186c.pdf", "author": "Sheng Shen;Le Hou;Yanqi Zhou;Nan Du;Shayne Longpre;Jason Wei;Hyung Won Chung;Barret Zoph;William Fedus;Xinyun Chen;Tu Vu;Yuexin Wu;Wuyang Chen;Albert Webson;Yunxuan Li;Vincent Y Zhao;Hongkun Yu;Kurt Keutzer;Trevor Darrell;Denny Zhou", "authorids": "~Sheng_Shen2;~Le_Hou1;~Yanqi_Zhou1;~Nan_Du1;~Shayne_Longpre1;~Jason_Wei1;~Hyung_Won_Chung1;~Barret_Zoph1;~William_Fedus2;~Xinyun_Chen1;~Tu_Vu1;~Yuexin_Wu1;~Wuyang_Chen1;~Albert_Webson1;~Yunxuan_Li2;~Vincent_Y_Zhao1;~Hongkun_Yu2;~Kurt_Keutzer1;~Trevor_Darrell2;~Denny_Zhou1", "gender": "M;M;F;M;M;M;M;M;;;M;M;;;M;M;M;M;;", "homepage": "https://sincerass.github.io;http://vision.cs.stonybrook.edu/~lehhou/home/index.html;https://zhouyanqi.github.io/;;https://www.shaynelongpre.com;https://jasonwei20.github.io;;;;;https://tuvllms.github.io;https://crickwu.github.io;;https://representations.ai;;https://foo.bar;;https://people.eecs.berkeley.edu/~keutzer/;;", "dblp": "138/5764-1.html;161/9892;;;190/7024;02/11220.html;;;;;186/7716.html;09/1661;;276/1456;;301/7889;;k/KurtKeutzer.html;;", "google_scholar": "https://scholar.google.com/citations?hl=en;kQ0HeQIAAAAJ;ZKEDQXYAAAAJ;v474hP4AAAAJ;ADd_YfkAAAAJ;;1CAlXvYAAAAJ;;;;tOevwEEAAAAJ;sd0nprMAAAAJ;;3OQplr0AAAAJ;Nun8Dy0AAAAJ;;;ID9QePIAAAAJ;;", "orcid": ";0000-0001-7323-5300;;;;;;;;;;;;;;;;0000-0003-3868-8501;;", "linkedin": "sheng-s-ab198a174/;;;dunangatech/;shayne-redford-longpre/;;;;;;;;;;;;;kurtkeutzer/;;", "or_profile": "~Sheng_Shen2;~Le_Hou1;~Yanqi_Zhou1;~Nan_Du1;~Shayne_Longpre1;~Jason_Wei1;~Hyung_Won_Chung1;~Barret_Zoph1;~William_Fedus2;~Xinyun_Chen1;~Tu_Vu1;~Yuexin_Wu1;~Wuyang_Chen1;~Albert_Webson1;~Yunxuan_Li2;~Vincent_Y_Zhao1;~Hongkun_Yu2;~Kurt_Keutzer1;~Trevor_Darrell2;~Denny_Zhou1", "aff": "University of California, Berkeley;Google Research;Google Brain;Apple/AIML;Massachusetts Institute of Technology;OpenAI;Google Brain;;;;Google;Google;;Google DeepMind;Google;Augment Computing;;University of California, Berkeley;;", "aff_domain": "berkeley.edu;google.com;google.com;apple.com;mit.edu;openai.com;google.com;;;;google.com;google.com;;google.com;google.com;augmentcode.com;;berkeley.edu;;", "position": "PhD student;Software Engineer;Research Scientist;Principal Researcher;PhD student;Researcher;Researcher;;;;Researcher;Software Engineer;;Research Scientist;Researcher;Researcher;;Full Professor;;", "bibtex": "@inproceedings{\nshen2024mixtureofexperts,\ntitle={Mixture-of-Experts Meets Instruction Tuning: A Winning Combination for Large Language Models},\nauthor={Sheng Shen and Le Hou and Yanqi Zhou and Nan Du and Shayne Longpre and Jason Wei and Hyung Won Chung and Barret Zoph and William Fedus and Xinyun Chen and Tu Vu and Yuexin Wu and Wuyang Chen and Albert Webson and Yunxuan Li and Vincent Y Zhao and Hongkun Yu and Kurt Keutzer and Trevor Darrell and Denny Zhou},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=6mLjDwYte5}\n}", "github": "", "project": "", "reviewers": "YDYY;nXAt;SYmE;8EEX", "pdf_size": 616153, "rating": "5;6;8;8", "confidence": "4;3;3;3", "soundness": "3;3;4;4", "contribution": "3;3;3;4", 
"presentation": "2;2;3;4", "wc_summary": "36;64;104;34", "wc_strengths": "60;69;109;66", "wc_weaknesses": "151;96;66;4", "wc_questions": "211;87;229;39", "wc_review": "458;316;508;143", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "1089;230;468;133", "reply_reviewers": "0;0;0;0", "reply_authors": "2;1;1;1", "rating_avg": [ 6.75, 1.299038105676658 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 3.5, 0.5 ], "contribution_avg": [ 3.25, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.82915619758885 ], "wc_summary_avg": [ 59.5, 28.297526393662043 ], "wc_strengths_avg": [ 76.0, 19.32614809008769 ], "wc_weaknesses_avg": [ 79.25, 53.07247403315583 ], "wc_questions_avg": [ 141.5, 80.56519099462248 ], "wc_review_avg": [ 356.25, 141.84212174103996 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 480.0, 372.13371252817177 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 20, 0 ], "corr_rating_confidence": -0.7777777777777777, "gs_citation": 78, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5132913830946216531&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=6mLjDwYte5", "pdf": "https://openreview.net/pdf?id=6mLjDwYte5", "email": "berkeley.edu;google.com;google.com;apple.com;mit.edu;openai.com;google.com;;;;google.com;google.com;;google.com;google.com;augmentcode.com;;berkeley.edu;;", "author_num": 20, "aff_unique_index": "0;1;1;2;3;4;1;1;1;1;1;5;0", "aff_unique_norm": "University of California, Berkeley;Google;Apple;Massachusetts Institute of Technology;OpenAI;Augment Computing", "aff_unique_dep": ";Google Research;Artificial Intelligence and Machine Learning;;;", "aff_unique_url": "https://www.berkeley.edu;https://research.google;https://www.apple.com;https://web.mit.edu;https://openai.com;", "aff_unique_abbr": "UC Berkeley;Google Research;Apple;MIT;OpenAI;", "aff_campus_unique_index": "0;1;1;1;1;1;1;0", "aff_campus_unique": "Berkeley;Mountain View;", "aff_country_unique_index": "0;0;0;0;0;0;0;0;0;1;0;0", "aff_country_unique": "United States;United Kingdom;" }, { "id": "6muJekoPR7", "title": "TROJFSL: TROJAN INSERTION IN FEW SHOT PROMPT LEARNING", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Prompt-tuning emerges as one of the most effective solutions to adapting a pre-trained language model (PLM) to processing new downstream natural language processing tasks, especially with only few input samples. The success of prompt-tuning motivates adversaries to create backdoor attacks against prompt-tuning. However, prior prompt-based backdoor attacks cannot be implemented through few-shot prompt-tuning, i.e., they require either a full-model fine-tuning or a large training dataset. We find it is difficult to build a prompt-based backdoor via few-shot prompt-tuning, i.e., freezing the PLM and tuning a soft prompt with a limited set of input samples. A backdoor design via few-shot prompt-tuning introduces an imbalanced poisoned dataset, easily suffers from the overfitting issue, and lack attention awareness. To mitigate these issues, we propose TrojFSL to perform backdoor attacks in the setting of few-shot prompt-tuning. TrojFSL consists of three modules, i.e., balanced poison learning, selective token poisoning, and trojan-trigger attention. 
Compared to prior prompt-based backdoor attacks, TrojFSL improves the ASR by 9% - 48% and the CDA by 4% - 9% across various PLMs and a wide range of downstream tasks.", "keywords": "Pre-trained Language Model;Few-Shot;Prompt;Trojan Attack", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "Mengxin Zheng;Jiaqi Xue;Xun Chen;Yanshan Wang;Qian Lou;Lei Jiang", "authorids": "~Mengxin_Zheng1;~Jiaqi_Xue1;~Xun_Chen1;~Yanshan_Wang1;~Qian_Lou1;~Lei_Jiang1", "gender": "F;M;;;M;M", "homepage": "https://mxzheng.github.io/;https://jqxue1999.github.io;;;https://qlou.org;https://www.jianglei.org", "dblp": "327/9609;;;45/11295;207/3962.html;96/1994-1.html", "google_scholar": "CwLrXMAAAAAJ;NI2jppcAAAAJ;;;SBYgXLoAAAAJ;-1sXorAAAAAJ", "orcid": ";;;;;", "linkedin": "mengxin-zheng-86bb91171/;;;;;", "or_profile": "~Mengxin_Zheng1;~Jiaqi_Xue1;~Xun_Chen1;~Yanshan_Wang1;~Qian_Lou1;~Lei_Jiang1", "aff": "University of Central Florida;University of Central Florida;;University of Pittsburgh;University of Central Florida;Indiana University", "aff_domain": "ucf.edu;ucf.edu;;pitt.edu;ucf.edu;iu.edu", "position": "Assistant Professor;PhD student;;Assistant Professor;Assistant Professor;Assistant Professor", "bibtex": "@misc{\nzheng2024trojfsl,\ntitle={{TROJFSL}: {TROJAN} {INSERTION} {IN} {FEW} {SHOT} {PROMPT} {LEARNING}},\nauthor={Mengxin Zheng and Jiaqi Xue and Xun Chen and Yanshan Wang and Qian Lou and Lei Jiang},\nyear={2024},\nurl={https://openreview.net/forum?id=6muJekoPR7}\n}", "github": "", "project": "", "reviewers": "x2RS;oqR6;P9fg", "site": "https://openreview.net/forum?id=6muJekoPR7", "pdf_size": 517370, "rating": "3;5;6", "confidence": "4;4;3", "soundness": "2;3;3", "contribution": "2;2;2", "presentation": "3;3;3", "wc_summary": "40;41;69", "wc_strengths": "14;46;50", "wc_weaknesses": "234;227;267", "wc_questions": "5;3;38", "wc_review": "293;317;424", "wc_reply_reviewers": "0;73;0", "wc_reply_authors": "811;785;640", "reply_reviewers": "0;1;0", "reply_authors": "1;1;1", "rating_avg": [ 4.666666666666667, 1.247219128924647 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 50.0, 13.4412301024373 ], "wc_strengths_avg": [ 36.666666666666664, 16.110727964792765 ], "wc_weaknesses_avg": [ 242.66666666666666, 17.441967269268172 ], "wc_questions_avg": [ 15.333333333333334, 16.048537489614297 ], "wc_review_avg": [ 344.6666666666667, 56.94636853117931 ], "wc_reply_reviewers_avg": [ 24.333333333333332, 34.41253001774532 ], "wc_reply_authors_avg": [ 745.3333333333334, 75.23444837454596 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 7, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.7559289460184545, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:8mTSEP-ATeIJ:scholar.google.com/&scioq=TROJFSL:+TROJAN+INSERTION+IN+FEW+SHOT+PROMPT+LEARNING&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;1;0;2", "aff_unique_norm": "University of Central Florida;University of Pittsburgh;Indiana University", "aff_unique_dep": ";;", "aff_unique_url": "https://www.ucf.edu;https://www.pitt.edu;https://www.indiana.edu", "aff_unique_abbr": "UCF;Pitt;IU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "United 
States" }, { "id": "6oC3djD3hU", "title": "ROBUST DIFFUSION GAN USING SEMI-UNBALANCED OPTIMAL TRANSPORT", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Diffusion models, a type of generative model, have demonstrated great potential for synthesizing highly detailed images. By integrating with GAN, advanced diffusion models like DDGAN \\citep{xiao2022DDGAN} could approach real-time performance for expansive practical applications. While DDGAN has effectively addressed the challenges of generative modeling, namely producing high-quality samples, covering different data modes, and achieving faster sampling, it remains susceptible to performance drops caused by datasets that are corrupted with outlier samples. This work introduces a robust training technique based on semi-unbalanced optimal transport to mitigate the impact of outliers effectively. Through comprehensive evaluations, we demonstrate that our robust diffusion GAN (RDGAN) outperforms vanilla DDGAN in terms of the aforementioned generative modeling criteria, i.e., image quality, mode coverage of distribution, and inference speed, and exhibits improved robustness when dealing with both clean and corrupted datasets.", "keywords": "optimal transport;diffusion model;generative model;robust generation", "primary_area": "generative models", "supplementary_material": "/attachment/fbe3abf538f0c15c3424986cf379b1e7cc53ab6d.zip", "author": "Quan Dao;B\u00ecnh H\u1eefu T\u1ea1;Tung Pham;Anh Tuan Tran", "authorids": "~Quan_Dao1;~B\u00ecnh_H\u1eefu_T\u1ea11;~Tung_Pham1;~Anh_Tuan_Tran2", "gender": "M;M;M;M", "homepage": "https://github.com/quandao10;;;https://sites.google.com/site/anhttranusc/", "dblp": "334/7610;;38/10862-1;150/5269-1", "google_scholar": "g0RS3_kAAAAJ;qBvM8_sAAAAJ;KcUuEKsAAAAJ;FYZ5ODQAAAAJ", "orcid": "0009-0006-0996-0472;;;0000-0002-3120-4036", "linkedin": ";;;https://linkedin.com/in/anh-tran-97814b19", "or_profile": "~Quan_Dao1;~B\u00ecnh_H\u1eefu_T\u1ea11;~Tung_Pham1;~Anh_Tuan_Tran2", "aff": "VinAI Research;VinAI Research;VinAI Research;VinAI Research", "aff_domain": "vinai.io;vinai.io;vinai.io;vinai.io", "position": "Intern;Intern;Researcher;Research Scientist", "bibtex": "@misc{\ndao2024robust,\ntitle={{ROBUST} {DIFFUSION} {GAN} {USING} {SEMI}-{UNBALANCED} {OPTIMAL} {TRANSPORT}},\nauthor={Quan Dao and B{\\`\\i}nh H\u1eefu T\u1ea1 and Tung Pham and Anh Tuan Tran},\nyear={2024},\nurl={https://openreview.net/forum?id=6oC3djD3hU}\n}", "github": "", "project": "", "reviewers": "ov4k;gFqX;P1f3;MvTD", "site": "https://openreview.net/forum?id=6oC3djD3hU", "pdf_size": 1292589, "rating": "3;5;5;5", "confidence": "3;4;4;4", "soundness": "2;3;3;3", "contribution": "2;2;2;2", "presentation": "2;2;2;2", "wc_summary": "43;76;37;16", "wc_strengths": "55;66;31;26", "wc_weaknesses": "93;51;219;149", "wc_questions": "63;213;34;2", "wc_review": "254;406;321;193", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.5, 0.8660254037844386 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.0, 0.0 ], "wc_summary_avg": [ 43.0, 21.529050141610984 ], "wc_strengths_avg": [ 44.5, 16.560495161679196 ], "wc_weaknesses_avg": [ 128.0, 63.0 ], "wc_questions_avg": [ 78.0, 80.87335778858201 ], "wc_review_avg": [ 293.5, 79.1722805027113 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], 
"reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 1.0, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=17369468804813068491&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 0, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "VinAI Research", "aff_unique_dep": "", "aff_unique_url": "https://www.vinai.io/", "aff_unique_abbr": "VinAI", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "Vietnam" }, { "title": "Large Language Model Cascades with Mixture of Thought Representations for Cost-Efficient Reasoning", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19383", "id": "6okaSfANzh", "author_site": "Murong Yue, Jie Zhao, Min Zhang, Liang Du, Ziyu Yao", "tldr": "", "abstract": "Large language models (LLMs) such as GPT-4 have exhibited remarkable performance in a variety of tasks, but this strong performance often comes with the high expense of using paid API services. In this paper, we are motivated to study building an LLM \"cascade\" to save the cost of using LLMs, particularly for performing (e.g., mathematical, causal) reasoning tasks. Our cascade pipeline follows the intuition that simpler questions can be addressed by a weaker but more affordable LLM, whereas only the most challenging questions necessitate the stronger and more expensive LLM. To realize this decision-making, we consider the \"answer consistency\" of the weaker LLM as a signal of the question difficulty and propose several methods for answering sampling and consistency checking, including one leveraging a mixture of two thought representations (i.e., Chain-of-Thought and Program-of-Thought). 
Through experiments on six reasoning benchmark datasets, with GPT-3.5-turbo and GPT-4 being the weaker and stronger LLMs, respectively, our cascade pipeline demonstrates comparable performance but reduces about 60% of the cost compared with fully using the stronger LLM.", "keywords": "Large Language Models;Natural Language Processing;Reasoning", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/2a26302d325a3f2262f6ea00a260917a943e3e4d.zip", "author": "Murong Yue;Jie Zhao;Min Zhang;Liang Du;Ziyu Yao", "authorids": "~Murong_Yue1;~Jie_Zhao1;~Min_Zhang18;~Liang_Du3;~Ziyu_Yao1", "gender": "M;;F;;F", "homepage": "https://murongyue.github.io/;;https://gabriellamin.github.io/Min-homepage.github.io/;;http://ziyuyao.org", "dblp": "354/7400;;;;", "google_scholar": "ivm3dVEAAAAJ;;PxmM3oEAAAAJ;aq4dG-AAAAAJ;4lYrMNUAAAAJ", "orcid": ";;;;0009-0007-4571-3505", "linkedin": "murong-yue-480a78177/;;min-zhang-905479292/;;", "or_profile": "~Murong_Yue1;~Jie_Zhao1;~Min_Zhang18;~Liang_Du3;~Ziyu_Yao1", "aff": "George Mason University;;Virginia Polytechnic Institute and State University;Microsoft;George Mason University", "aff_domain": "gmu.edu;;vt.edu;microsoft.com;gmu.edu", "position": "PhD student;;PhD student;Researcher;Assistant Professor", "bibtex": "@inproceedings{\nyue2024large,\ntitle={Large Language Model Cascades with Mixture of Thought Representations for Cost-Efficient Reasoning},\nauthor={Murong Yue and Jie Zhao and Min Zhang and Liang Du and Ziyu Yao},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=6okaSfANzh}\n}", "github": "", "project": "", "reviewers": "6oKd;BfsR;ijvt", "pdf_size": 1040600, "rating": "6;6;8", "confidence": "3;3;4", "soundness": "3;4;4", "contribution": "3;3;4", "presentation": "3;3;4", "wc_summary": "78;92;164", "wc_strengths": "95;146;46", "wc_weaknesses": "141;379;6", "wc_questions": "37;140;50", "wc_review": "351;757;266", "wc_reply_reviewers": "0;73;14", "wc_reply_authors": "436;1092;387", "reply_reviewers": "0;1;1", "reply_authors": "1;2;2", "rating_avg": [ 6.666666666666667, 0.9428090415820634 ], "confidence_avg": [ 3.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 3.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 3.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 3.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 111.33333333333333, 37.67698973585278 ], "wc_strengths_avg": [ 95.66666666666667, 40.827550610940264 ], "wc_weaknesses_avg": [ 175.33333333333334, 154.1997261850862 ], "wc_questions_avg": [ 75.66666666666667, 45.79907810814051 ], "wc_review_avg": [ 458.0, 214.25374364679527 ], "wc_reply_reviewers_avg": [ 29.0, 31.63331577098213 ], "wc_reply_authors_avg": [ 638.3333333333334, 321.41389031728056 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 1.6666666666666667, 0.4714045207910317 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.9999999999999998, "gs_citation": 63, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=3633402015473153407&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=6okaSfANzh", "pdf": "https://openreview.net/pdf?id=6okaSfANzh", "email": "gmu.edu;;vt.edu;microsoft.com;gmu.edu", "author_num": 5, "aff_unique_index": "0;1;2;0", "aff_unique_norm": "George Mason University;Virginia 
Tech;Microsoft", "aff_unique_dep": ";;Microsoft Corporation", "aff_unique_url": "https://www.gmu.edu;https://www.vt.edu;https://www.microsoft.com", "aff_unique_abbr": "GMU;VT;Microsoft", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "title": "A Semantic Invariant Robust Watermark for Large Language Models", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19382", "id": "6p8lpe4MNf", "author_site": "Aiwei Liu, Leyi Pan, Xuming Hu, Shiao Meng, Lijie Wen", "tldr": "", "abstract": "Watermark algorithms for large language models (LLMs) have achieved extremely high accuracy in detecting text generated by LLMs. Such algorithms typically involve adding extra watermark logits to the LLM's logits at each generation step. However, prior algorithms face a trade-off between attack robustness and security robustness. This is because the watermark logits for a token are determined by a certain number of preceding tokens; a small number leads to low security robustness, while a large number results in insufficient attack robustness. In this work, we propose a semantic invariant watermarking method for LLMs that provides both attack robustness and security robustness. The watermark logits in our work are determined by the semantics of all preceding tokens. Specifically, we utilize another embedding LLM to generate semantic embeddings for all preceding tokens, and then these semantic embeddings are transformed into the watermark logits through our trained watermark model.\nSubsequent analyses and experiments demonstrated the attack robustness of our method in semantically invariant settings: synonym substitution and text paraphrasing settings. 
Finally, we also show that our watermark possesses adequate security robustness.", "keywords": "Watermark algorithms;Large Language Models;Robustness", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/dacdf0a0c94dc157d062c579a985cdd676b56f8d.zip", "author": "Aiwei Liu;Leyi Pan;Xuming Hu;Shiao Meng;Lijie Wen", "authorids": "~Aiwei_Liu1;~Leyi_Pan1;~Xuming_Hu1;~Shiao_Meng1;~Lijie_Wen1", "gender": "M;F;M;M;M", "homepage": "https://exlaw.github.io/;;https://xuminghu.github.io/;https://github.com/msa30;https://www.thss.tsinghua.edu.cn/en/faculty/lijiewen.htm", "dblp": "321/4365;353/1437.html;262/3664;333/0475;36/172-1", "google_scholar": "UCOOmcEAAAAJ;https://scholar.google.com/citations?hl=zh-CN;dbBKbXoAAAAJ;https://scholar.google.com.hk/citations?user=2rd5iDIAAAAJ;https://scholar.google.com.tw/citations?user=f3C0jUIAAAAJ", "orcid": ";;0000-0001-6075-4224;;0000-0003-0358-3160", "linkedin": "%E7%91%B7%E7%8E%AE-%E5%88%98-0722731a6/;%E4%B9%90%E6%80%A1-%E6%BD%98-806718275/;;;", "or_profile": "~Aiwei_Liu1;~Leyi_Pan1;~Xuming_Hu1;~Shiao_Meng1;~Lijie_Wen1", "aff": "Chinese University of Hong Kong;Tsinghua University;Tsinghua University;Tsinghua University;Tsinghua University", "aff_domain": "cuhk.hk;mails.tsinghua.edu.cn;tsinghua.edu.cn;tsinghua.edu.cn;tsinghua.edu.cn", "position": "Visiting Scholar;Undergrad student;PhD student;PhD student;Associate Professor", "bibtex": "@inproceedings{\nliu2024a,\ntitle={A Semantic Invariant Robust Watermark for Large Language Models},\nauthor={Aiwei Liu and Leyi Pan and Xuming Hu and Shiao Meng and Lijie Wen},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=6p8lpe4MNf}\n}", "github": "", "project": "", "reviewers": "yZti;FTnC;1s48;1hfF", "pdf_size": 822321, "rating": "3;5;6;8", "confidence": "4;3;3;5", "soundness": "1;3;2;3", "contribution": "1;3;3;3", "presentation": "3;3;3;3", "wc_summary": "58;109;46;125", "wc_strengths": "35;74;56;134", "wc_weaknesses": "249;103;81;298", "wc_questions": "53;135;132;339", "wc_review": "395;421;315;896", "wc_reply_reviewers": "139;236;16;441", "wc_reply_authors": "1089;936;464;1095", "reply_reviewers": "1;2;1;2", "reply_authors": "2;3;1;3", "rating_avg": [ 5.5, 1.8027756377319946 ], "confidence_avg": [ 3.75, 0.82915619758885 ], "soundness_avg": [ 2.25, 0.82915619758885 ], "contribution_avg": [ 2.5, 0.8660254037844386 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 84.5, 33.26033673912518 ], "wc_strengths_avg": [ 74.75, 36.88749788207381 ], "wc_weaknesses_avg": [ 182.75, 92.71562705391146 ], "wc_questions_avg": [ 164.75, 105.84038690405472 ], "wc_review_avg": [ 506.75, 228.103457886986 ], "wc_reply_reviewers_avg": [ 208.0, 155.48151015474477 ], "wc_reply_authors_avg": [ 896.0, 257.42668859308276 ], "reply_reviewers_avg": [ 1.5, 0.5 ], "reply_authors_avg": [ 2.25, 0.82915619758885 ], "replies_avg": [ 22, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.4181210050035454, "gs_citation": -1, "gs_cited_by_link": "", "gs_version_total": -1, "openreview": "https://openreview.net/forum?id=6p8lpe4MNf", "pdf": "https://openreview.net/pdf?id=6p8lpe4MNf", "email": "cuhk.hk;mails.tsinghua.edu.cn;tsinghua.edu.cn;tsinghua.edu.cn;tsinghua.edu.cn", "author_num": 5, "aff_unique_index": "0;1;1;1;1", "aff_unique_norm": "Chinese University of Hong Kong;Tsinghua University", "aff_unique_dep": ";", "aff_unique_url": "https://www.cuhk.edu.hk;https://www.tsinghua.edu.cn", 
"aff_unique_abbr": "CUHK;THU", "aff_campus_unique_index": "0", "aff_campus_unique": "Hong Kong SAR;", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "China" }, { "title": "Towards Diverse Behaviors: A Benchmark for Imitation Learning with Human Demonstrations", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19381", "id": "6pPYRXKPpw", "author_site": "Xiaogang Jia, Denis Blessing, Xinkai Jiang, Moritz Reuss, Atalay Donat, Rudolf Lioutikov, Gerhard Neumann", "tldr": "", "abstract": "Imitation learning with human data has demonstrated remarkable success in teaching robots in a wide range of skills. However, the inherent diversity in human behavior leads to the emergence of multi-modal data distributions, thereby presenting a formidable challenge for existing imitation learning algorithms. Quantifying a model's capacity to capture and replicate this diversity effectively is still an open problem. In this work, we introduce simulation benchmark environments and the corresponding *Datasets with Diverse human Demonstrations for Imitation Learning (D3IL)*, designed explicitly to evaluate a model's ability to learn multi-modal behavior. Our environments are designed to involve multiple sub-tasks that need to be solved, consider manipulation of multiple objects which increases the diversity of the behavior and can only be solved by policies that rely on closed loop sensory feedback. Other available datasets are missing at least one of these challenging properties.\nTo address the challenge of diversity quantification, we introduce tractable metrics that provide valuable insights into a model's ability to acquire and reproduce diverse behaviors. These metrics offer a practical means to assess the robustness and versatility of imitation learning algorithms. Furthermore, we conduct a thorough evaluation of state-of-the-art methods on the proposed task suite. This evaluation serves as a benchmark for assessing their capability to learn diverse behaviors. 
Our findings shed light on the effectiveness of these methods in tackling the intricate problem of capturing and generalizing multi-modal human behaviors, offering a valuable reference for the design of future imitation learning algorithms.", "keywords": "Imitation Learning;Benchmark;Datasets;Diverse Behaviors", "primary_area": "datasets and benchmarks", "supplementary_material": "/attachment/cd40700eabe3ab1ed74ee745d330703687a0bd4f.zip", "author": "Xiaogang Jia;Denis Blessing;Xinkai Jiang;Moritz Reuss;Atalay Donat;Rudolf Lioutikov;Gerhard Neumann", "authorids": "~Xiaogang_Jia1;~Denis_Blessing1;~Xinkai_Jiang1;~Moritz_Reuss1;~Atalay_Donat1;~Rudolf_Lioutikov1;~Gerhard_Neumann2", "gender": "M;M;M;M;M;M;M", "homepage": "https://xiaogangjia.github.io/Personal_Website/;;;;https://www.ias.informatik.tu-darmstadt.de/Team/AtalayDonat;https://rudolf.intuitive-robots.net;https://alr.anthropomatik.kit.edu/", "dblp": "23/10777;219/1435;;321/1769;;151/9451;60/4878", "google_scholar": "E7Tja9gAAAAJ;https://scholar.google.de/citations?view_op=list_works;1BfDuRMAAAAJ;NLuzkPIAAAAJ;LG_x9Y8AAAAJ;hvjV43MAAAAJ;https://scholar.google.com.tw/citations?user=GL360kMAAAAJ", "orcid": ";;;;;;", "linkedin": ";;;;;rudolf-lioutikov-74830730a/;", "or_profile": "~Xiaogang_Jia1;~Denis_Blessing1;~Xinkai_Jiang1;~Moritz_Reuss1;~Atalay_Donat1;~Rudolf_Lioutikov1;~Gerhard_Neumann1", "aff": "Karlsruher Institut f\u00fcr Technologie;Karlsruher Institut f\u00fcr Technologie;Karlsruher Institut f\u00fcr Technologie;Karlsruher Institut f\u00fcr Technologie;Karlsruher Institut f\u00fcr Technologie;Karlsruher Institut f\u00fcr Technologie;Karlsruhe Institute of Technology", "aff_domain": "kit.edu;kit.edu;kit.edu;kit.edu;kit.edu;kit.edu;kit.edu", "position": "PhD student;PhD student;PhD student;PhD student;MS student;Tenure-Track Professor;Full Professor", "bibtex": "@inproceedings{\njia2024towards,\ntitle={Towards Diverse Behaviors: A Benchmark for Imitation Learning with Human Demonstrations},\nauthor={Xiaogang Jia and Denis Blessing and Xinkai Jiang and Moritz Reuss and Atalay Donat and Rudolf Lioutikov and Gerhard Neumann},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=6pPYRXKPpw}\n}", "github": "", "project": "", "reviewers": "S4Qj;DMVD;K6Tb", "pdf_size": 4672377, "rating": "6;8;8", "confidence": "4;4;5", "soundness": "3;3;3", "contribution": "3;3;2", "presentation": "3;3;3", "wc_summary": "264;50;160", "wc_strengths": "46;116;132", "wc_weaknesses": "242;94;152", "wc_questions": "119;14;41", "wc_review": "671;274;485", "wc_reply_reviewers": "0;23;0", "wc_reply_authors": "645;822;418", "reply_reviewers": "0;1;0", "reply_authors": "1;2;1", "rating_avg": [ 7.333333333333333, 0.9428090415820634 ], "confidence_avg": [ 4.333333333333333, 0.4714045207910317 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 158.0, 87.37657962329875 ], "wc_strengths_avg": [ 98.0, 37.345236197762446 ], "wc_weaknesses_avg": [ 162.66666666666666, 60.889699913495676 ], "wc_questions_avg": [ 58.0, 44.51965857910413 ], "wc_review_avg": [ 476.6666666666667, 162.1816539837009 ], "wc_reply_reviewers_avg": [ 7.666666666666667, 10.842303978193728 ], "wc_reply_authors_avg": [ 628.3333333333334, 165.3528214320988 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 1.3333333333333333, 0.4714045207910317 ], "replies_avg": [ 11, 0 ], "authors#_avg": 
[ 7, 0 ], "corr_rating_confidence": 0.4999999999999999, "gs_citation": 24, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11692037980249187412&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=6pPYRXKPpw", "pdf": "https://openreview.net/pdf?id=6pPYRXKPpw", "email": "kit.edu;kit.edu;kit.edu;kit.edu;kit.edu;kit.edu;kit.edu", "author_num": 7, "aff_unique_index": "0;0;0;0;0;0;1", "aff_unique_norm": "Karlsruher Institut f\u00fcr Technologie;Karlsruhe Institute of Technology", "aff_unique_dep": ";", "aff_unique_url": "https://www.kit.edu;https://www.kit.edu", "aff_unique_abbr": "KIT;KIT", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0;0", "aff_country_unique": "Germany" }, { "id": "6qtDu7hVPF", "title": "Generative Reinforcement Learning with Transformers", "track": "main", "status": "Reject", "tldr": "", "abstract": "In reinforcement learning, Transformers have been shown to be powerful models for multi-task policy distillation and, to a lesser extent, policy improvement via return interventions within frameworks such as Decision Transformers. These recent results are somewhat atypical for reinforcement learning, as they do not rely on the learning of a value function, which is usually at the heart of most traditional approaches. In this paper, we explore a principled approach to purely generative value function approximation with Transformers, opening the way for existing techniques to be applied for policy improvement. Importantly, unlike other RL methods, this generative approach allows us to kickstart the learning process by fine-tuning strong pretrained state predictors, such as foundation models, substantially shortening the training time. 
We showcase the potential of our approach by constructing an action-value function for chess that can play at the level of an expert human and over 400 Elo stronger than direct behavioural cloning.", "keywords": "reinforcement learning;transformers;policy evaluation;policy improvement;sequence modeling;compression", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/7260ce54541f8a6748700bcd1c93f6756cf663ce.zip", "author": "Gregoire Deletang;Anian Ruoss;Li Kevin Wenliang;Elliot Catt;Tim Genewein;Jordi Grau-Moya;Marcus Hutter;Joel Veness", "authorids": "~Gregoire_Deletang1;~Anian_Ruoss1;~Li_Kevin_Wenliang1;~Elliot_Catt1;~Tim_Genewein1;~Jordi_Grau-Moya2;~Marcus_Hutter1;~Joel_Veness2", "gender": ";M;;M;M;;;", "homepage": ";;https://kevin-w-li.github.io/;;http://tim.inversetemperature.net/;;http://www.hutter1.net/;", "dblp": ";259/2083;255/7009;204/2511;116/3039;116/3023;h/MarcusHutter;", "google_scholar": ";gFkwD3kAAAAJ;https://scholar.google.co.uk/citations?user=MW45NMEAAAAJ;d1JYeMIAAAAJ;https://scholar.google.de/citations?user=peNTK9oAAAAJ;;https://scholar.google.com.tw/citations?user=7hmCntEAAAAJ;", "orcid": ";;;0000-0001-9411-927X;;;0000-0002-3263-4097;", "linkedin": ";anian-ruoss;;;;jordi-g-9a1b02104;hutter1/;", "or_profile": "~Gregoire_Deletang1;~Anian_Ruoss1;~Li_Kevin_Wenliang1;~Elliot_Catt1;~Tim_Genewein1;~Jordi_Grau-Moya2;~Marcus_Hutter1;~Joel_Veness2", "aff": ";Google DeepMind;Google DeepMind;Google DeepMind;Google DeepMind;Google DeepMind;Australian National University;", "aff_domain": ";deepmind.com;deepmind.com;deepmind.com;google.com;deepmind.com;anu.edu.au;", "position": ";Researcher;Researcher;Researcher;Researcher;Researcher;Full Professor;", "bibtex": "@misc{\ndeletang2024generative,\ntitle={Generative Reinforcement Learning with Transformers},\nauthor={Gregoire Deletang and Anian Ruoss and Li Kevin Wenliang and Elliot Catt and Tim Genewein and Jordi Grau-Moya and Marcus Hutter and Joel Veness},\nyear={2024},\nurl={https://openreview.net/forum?id=6qtDu7hVPF}\n}", "github": "", "project": "", "reviewers": "izzx;A7j8;FxJd;MRfp;vuG2", "site": "https://openreview.net/forum?id=6qtDu7hVPF", "pdf_size": 1329677, "rating": "3;3;3;5;6", "confidence": "4;4;3;4;3", "soundness": "3;2;2;2;3", "contribution": "1;2;2;3;3", "presentation": "3;2;2;2;3", "wc_summary": "51;84;34;51;67", "wc_strengths": "44;28;49;20;183", "wc_weaknesses": "119;112;483;162;172", "wc_questions": "116;246;2;152;153", "wc_review": "330;470;568;385;575", "wc_reply_reviewers": "0;0;0;0;0", "wc_reply_authors": "190;301;347;275;191", "reply_reviewers": "0;0;0;0;0", "reply_authors": "1;1;1;1;1", "rating_avg": [ 4.0, 1.2649110640673518 ], "confidence_avg": [ 3.6, 0.4898979485566356 ], "soundness_avg": [ 2.4, 0.4898979485566356 ], "contribution_avg": [ 2.2, 0.7483314773547882 ], "presentation_avg": [ 2.4, 0.4898979485566356 ], "wc_summary_avg": [ 57.4, 16.906803364326446 ], "wc_strengths_avg": [ 64.8, 60.02466159837971 ], "wc_weaknesses_avg": [ 209.6, 138.68035188879495 ], "wc_questions_avg": [ 133.8, 78.71060919596543 ], "wc_review_avg": [ 465.6, 97.32132345996945 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 260.8, 61.85919495111458 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": -0.3227486121839514, "gs_citation": 0, "gs_cited_by_link": 
"https://scholar.google.com/scholar?q=related:JO8l9macY-wJ:scholar.google.com/&scioq=Generative+Reinforcement+Learning+with+Transformers&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;0;0;0;1", "aff_unique_norm": "Google;Australian National University", "aff_unique_dep": "Google DeepMind;", "aff_unique_url": "https://deepmind.com;https://www.anu.edu.au", "aff_unique_abbr": "DeepMind;ANU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;1", "aff_country_unique": "United Kingdom;Australia" }, { "id": "6r0BOIb771", "title": "Sequential Bayesian Continual Learning with Meta-Learned Neural Networks", "track": "main", "status": "Reject", "tldr": "", "abstract": "In the present era of deep learning, continual learning research is mainly focused on mitigating forgetting when training a neural network with stochastic gradient descent (SGD) on a non-stationary stream of data.\nOn the other hand, there is a wealth of research on sequential learning in the more classical literature of statistical machine learning.\nMany models in this literature have sequential Bayesian update rules that yield the same learning outcome as the batch training, i.e., they are completely immune to catastrophic forgetting.\nHowever, they suffer from underfitting when modeling complex distributions due to their weak representational power.\nIn this work, we introduce a general meta-continual learning (MCL) framework that combines neural networks' strong representational power and simple statistical models' robustness to forgetting.\nIn our framework, continual learning takes place only in a statistical model in the embedding space via a sequential Bayesian update rule, while meta-learned neural networks bridge the raw data and the embedding space.\nSince our approach is domain-agnostic and model-agnostic, it can be applied to a wide range of problems and easily integrated with existing model architectures.\nCompared to SGD-based MCL methods, our approach demonstrates significantly improved performance and scalability.", "keywords": "sequential Bayes;meta-continual learning", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "/attachment/97e27f89dc3297d102b54ba6f24c8d22f9e3a7d4.zip", "author": "Soochan Lee;Hyeonseong Jeon;Jaehyeon Son;Gunhee Kim", "authorids": "~Soochan_Lee1;~Hyeonseong_Jeon2;~Jaehyeon_Son1;~Gunhee_Kim1", "gender": "M;M;M;M", "homepage": "https://soochanlee.com;;https://jaehyeon-son.github.io/;http://vision.snu.ac.kr/gunhee/", "dblp": "230/1398;;359/3097.html;45/115", "google_scholar": "8O3MKJkAAAAJ;;q7SrBsgAAAAJ;https://scholar.google.co.kr/citations?user=CiSdOV0AAAAJ", "orcid": "0000-0002-1425-9262;;0009-0004-2726-1144;0000-0002-9543-7453", "linkedin": ";hs-jeon;jaehyeon-son-a626202b3/;", "or_profile": "~Soochan_Lee1;~Hyeonseong_Jeon2;~Jaehyeon_Son1;~Gunhee_Kim1", "aff": "Seoul National University;Seoul National University, Seoul National University;Seoul National University;Seoul National University", "aff_domain": "snu.ac.kr;cse.snu.ac.kr;snu.ac.kr;snu.ac.kr", "position": "PhD student;Undergrad student;Researcher;Full Professor", "bibtex": "@misc{\nlee2024sequential,\ntitle={Sequential Bayesian Continual Learning with Meta-Learned Neural Networks},\nauthor={Soochan Lee and Hyeonseong Jeon and Jaehyeon Son and Gunhee Kim},\nyear={2024},\nurl={https://openreview.net/forum?id=6r0BOIb771}\n}", "github": "", "project": "", "reviewers": "awoT;DFZf;y1kN", "site": 
"https://openreview.net/forum?id=6r0BOIb771", "pdf_size": 5128885, "rating": "5;5;6", "confidence": "2;4;4", "soundness": "3;3;3", "contribution": "2;2;3", "presentation": "3;1;3", "wc_summary": "43;68;342", "wc_strengths": "22;55;193", "wc_weaknesses": "59;345;327", "wc_questions": "33;30;123", "wc_review": "157;498;985", "wc_reply_reviewers": "0;300;341", "wc_reply_authors": "288;1554;1322", "reply_reviewers": "0;1;1", "reply_authors": "1;3;3", "rating_avg": [ 5.333333333333333, 0.4714045207910317 ], "confidence_avg": [ 3.3333333333333335, 0.9428090415820634 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.3333333333333335, 0.9428090415820634 ], "wc_summary_avg": [ 151.0, 135.44248471829903 ], "wc_strengths_avg": [ 90.0, 74.06753674856482 ], "wc_weaknesses_avg": [ 243.66666666666666, 130.78566010419064 ], "wc_questions_avg": [ 62.0, 43.15089802078283 ], "wc_review_avg": [ 546.6666666666666, 339.7767240736514 ], "wc_reply_reviewers_avg": [ 213.66666666666666, 152.0095026269374 ], "wc_reply_authors_avg": [ 1054.6666666666667, 550.326771614425 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 2.3333333333333335, 0.9428090415820634 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.4999999999999999, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=7291363222291637272&as_sdt=40005&sciodt=0,10&hl=en", "gs_version_total": 0, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "Seoul National University", "aff_unique_dep": "", "aff_unique_url": "https://www.snu.ac.kr", "aff_unique_abbr": "SNU", "aff_campus_unique_index": "1", "aff_campus_unique": ";Seoul", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "South Korea" }, { "id": "6rEcB9m9AI", "title": "Promoting Exploration in Memory-Augmented Adam using Critical Momenta", "track": "main", "status": "Reject", "tldr": "", "abstract": "Adaptive gradient-based optimizers, particularly Adam, have left their mark in training large-scale deep learning models. The strength of such optimizers is that they exhibit fast convergence while being more robust to hyperparameter choice. However, they often generalize worse than non-adaptive methods. Recent studies have tied this performance gap to flat minima selection: adaptive methods tend to find solutions in sharper basins of the loss landscape, which in turn hurts generalization. To overcome this issue, we propose a new memory-augmented version of Adam that promotes {exploration} towards flatter minima by using a buffer of critical momentum terms during training. Intuitively, the use of the buffer makes the optimizer overshoot outside the basin of attraction if it is not wide enough. 
We empirically show that our method improves model performance on standard supervised and online learning tasks.", "keywords": "Adaptive optimization;deep learning;memory-augmented optimizers;momentum", "primary_area": "optimization", "supplementary_material": "", "author": "Pranshu Malviya;Goncalo Mordido;Aristide Baratin;Reza Babanezhad Harikandeh;Jerry Huang;Simon Lacoste-Julien;Razvan Pascanu;Sarath Chandar", "authorids": "~Pranshu_Malviya1;~Goncalo_Mordido1;~Aristide_Baratin1;~Reza_Babanezhad_Harikandeh1;~Jerry_Huang1;~Simon_Lacoste-Julien1;~Razvan_Pascanu1;~Sarath_Chandar1", "gender": "M;;;M;;M;M;M", "homepage": "https://pranshu28.github.io/about/;;;http://babanezhad.ca;;http://www.iro.umontreal.ca/~slacoste/;https://razp.info;http://sarathchandar.in/", "dblp": ";;;37/8904.html;;94/446.html;65/8368.html;45/8542", "google_scholar": ";;;KLrwPsgAAAAJ;;oejm5IUAAAAJ;https://scholar.google.ca/citations?user=eSPY8LwAAAAJ;https://scholar.google.co.in/citations?user=yxWtZLAAAAAJ", "orcid": ";;;;;0000-0001-6485-6180;;", "linkedin": "pranshumalviya2/;;;;;simon-lacoste-julien-355b9a3;;", "or_profile": "~Pranshu_Malviya1;~Goncalo_Mordido1;~Aristide_Baratin1;~Reza_Babanezhad_Harikandeh1;~Jerry_Huang1;~Simon_Lacoste-Julien1;~Razvan_Pascanu1;~Sarath_Chandar1", "aff": "\u00c9cole Polytechnique de Montr\u00e9al, Universit\u00e9 de Montr\u00e9al;;;Samsung;;Samsung - SAIT AI Lab, Montreal;Google DeepMind;\u00c9cole Polytechnique de Montr\u00e9al", "aff_domain": "polymtl.ca;;;samsung.com;;samsung.com;google.com;polymtl.ca", "position": "PhD student;;;Research Scientist;;VP Lab Director;Research Scientist;Assistant Professor", "bibtex": "@misc{\nmalviya2024promoting,\ntitle={Promoting Exploration in Memory-Augmented Adam using Critical Momenta},\nauthor={Pranshu Malviya and Goncalo Mordido and Aristide Baratin and Reza Babanezhad Harikandeh and Jerry Huang and Simon Lacoste-Julien and Razvan Pascanu and Sarath Chandar},\nyear={2024},\nurl={https://openreview.net/forum?id=6rEcB9m9AI}\n}", "github": "", "project": "", "reviewers": "qx25;V8UZ;Jwku;GnW1", "site": "https://openreview.net/forum?id=6rEcB9m9AI", "pdf_size": 5510489, "rating": "3;5;5;6", "confidence": "4;4;4;1", "soundness": "2;3;2;3", "contribution": "2;2;2;3", "presentation": "3;3;3;3", "wc_summary": "106;68;65;80", "wc_strengths": "72;36;22;53", "wc_weaknesses": "167;154;167;16", "wc_questions": "127;105;2;25", "wc_review": "472;363;256;174", "wc_reply_reviewers": "0;0;0;44", "wc_reply_authors": "705;456;733;201", "reply_reviewers": "0;0;0;1", "reply_authors": "1;1;1;1", "rating_avg": [ 4.75, 1.0897247358851685 ], "confidence_avg": [ 3.25, 1.299038105676658 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 79.75, 16.161296358893985 ], "wc_strengths_avg": [ 45.75, 18.713297411199342 ], "wc_weaknesses_avg": [ 126.0, 63.72989879169745 ], "wc_questions_avg": [ 64.75, 52.470825226977325 ], "wc_review_avg": [ 316.25, 112.14806061631204 ], "wc_reply_reviewers_avg": [ 11.0, 19.05255888325765 ], "wc_reply_authors_avg": [ 523.75, 215.2874531875929 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": -0.6622661785325219, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=17004626632720092258&as_sdt=5,48&sciodt=0,48&hl=en", "gs_version_total": 4, "aff_unique_index": "0;1;1;2;0", "aff_unique_norm": "\u00c9cole Polytechnique de 
Montr\u00e9al;Samsung;Google", "aff_unique_dep": ";Samsung;Google DeepMind", "aff_unique_url": "https://www.polymtl.ca;https://www.samsung.com;https://deepmind.com", "aff_unique_abbr": "Polytechnique Montr\u00e9al;Samsung;DeepMind", "aff_campus_unique_index": "0;2;0", "aff_campus_unique": "Montr\u00e9al;;Montreal", "aff_country_unique_index": "0;1;0;2;0", "aff_country_unique": "Canada;South Korea;United Kingdom" }, { "id": "6rvliexcMV", "title": "Emergent representations in networks trained with the Forward-Forward algorithm", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "The Backpropagation algorithm, widely used to train neural networks, has often been criticised for its lack of biological realism. In an attempt to find a more biologically plausible alternative, and avoid to back-propagate gradients in favour of using local learning rules, the recently introduced Forward-Forward algorithm replaces the traditional forward and backward passes of Backpropagation with two forward passes. In this work, we show that internal representations obtained with the Forward-Forward algorithm can organize into robust, category-specific ensembles, composed by an extremely low number of active units (high sparsity). This situation is reminiscent of what has been observed in cortical sensory areas, where neuronal ensembles are suggested to serve as the functional building blocks for perception and action. Interestingly, while these ensembles do not typically arise in models trained with standard Backpropagation, they can manifest in networks optimized by Backpropagation, given the same training objective as that of the Forward-Forward algorithm. These findings suggest that the learning procedure proposed by Forward-Forward may surpass Backpropagation in its capacity to model learning in the cortex, even when a backward pass is used, and may inspire new approaches to compare representations in biological and artificial neural networks.", "keywords": "Forward-Forward;Representations;Sensory cortex;Ensembles;Sparsity;Backpropagation", "primary_area": "visualization or interpretation of learned representations", "supplementary_material": "", "author": "Niccolo Tosato;Lorenzo Basile;Emanuele Ballarin;Giuseppe De Alteriis;Alberto Cazzaniga;Alessio ansuini", "authorids": "~Niccolo_Tosato1;~Lorenzo_Basile1;~Emanuele_Ballarin1;~Giuseppe_De_Alteriis1;~Alberto_Cazzaniga1;~Alessio_ansuini1", "gender": "M;;M;M;M;M", "homepage": ";;https://ballarin.cc/;;https://areasciencepark-rit.gitlab.io/lade/alberto.cazzaniga/;", "dblp": ";348/5790;348/6393;;339/6443;232/2196", "google_scholar": ";EUE33IQAAAAJ;https://scholar.google.com/citations?hl=en;Nm1c1QkAAAAJ;AmafJqIAAAAJ;6lhdu6kAAAAJ", "orcid": ";;0000-0003-3673-0665;0000-0003-3116-6006;0000-0001-6271-3303;0000-0002-3117-3532", "linkedin": "https://linkedin.com/in/niccolo-tosato;lorebasile/;emaballarin;giuseppe-de-alteriis-664875253/;alberto-cazzaniga-4155b6164/;alessioansuini/", "or_profile": "~Niccolo_Tosato1;~Lorenzo_Basile1;~Emanuele_Ballarin1;~Giuseppe_De_Alteriis1;~Alberto_Cazzaniga1;~Alessio_ansuini1", "aff": "University of Trieste;University of Trieste;University of Trieste;King's College London, University of London;AREA Science Park;AREA Science Park", "aff_domain": "units.it;units.it;units.it;kcl.ac.uk;areasciencepark.it;areasciencepark.it", "position": "MS student;PhD student;PhD student;PhD student;Researcher;Researcher", "bibtex": "@misc{\ntosato2024emergent,\ntitle={Emergent representations in networks trained with the Forward-Forward 
algorithm},\nauthor={Niccolo Tosato and Lorenzo Basile and Emanuele Ballarin and Giuseppe De Alteriis and Alberto Cazzaniga and Alessio ansuini},\nyear={2024},\nurl={https://openreview.net/forum?id=6rvliexcMV}\n}", "github": "", "project": "", "reviewers": "", "site": "https://openreview.net/forum?id=6rvliexcMV", "pdf_size": 0, "rating": "", "confidence": "", "soundness": "", "contribution": "", "presentation": "", "wc_summary": "", "wc_strengths": "", "wc_weaknesses": "", "wc_questions": "", "wc_review": "", "wc_reply_reviewers": "", "wc_reply_authors": "", "reply_reviewers": "", "reply_authors": "", "rating_avg": [ 0, 0 ], "confidence_avg": [ 0, 0 ], "soundness_avg": [ 0, 0 ], "contribution_avg": [ 0, 0 ], "presentation_avg": [ 0, 0 ], "wc_summary_avg": [ 0, 0 ], "wc_strengths_avg": [ 0, 0 ], "wc_weaknesses_avg": [ 0, 0 ], "wc_questions_avg": [ 0, 0 ], "wc_review_avg": [ 0, 0 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 0, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0, "gs_citation": 9, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12816113402618674086&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "aff_unique_index": "0;0;0;1;2;2", "aff_unique_norm": "University of Trieste;King's College London;Area Science Park", "aff_unique_dep": ";;", "aff_unique_url": "https://www.units.it;https://www.kcl.ac.uk;https://www.area-science-park.org/", "aff_unique_abbr": "UniTS;KCL;", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;1;0;0", "aff_country_unique": "Italy;United Kingdom" }, { "id": "6sfRRcynDy", "title": "Out-of-Distribution Detection with Hyperspherical Energy", "track": "main", "status": "Reject", "tldr": "", "abstract": "The ability to detect if inputs are out-of-distribution (OOD) is essential to guarantee the reliability and safety of machine learning models that are deployed in an open environment. Recent studies have shown that an energy-based score is effective. However, unconstrained energy scores from a model trained with cross-entropy loss may not necessarily reflect the log-likelihood. To address this limitation, we introduce a novel hyperspherical energy score that connects energy with hyperspherical representations. By modeling hyperspherical representations using von Mises-Fisher distribution, our method provides a more accurate interpretation from a log-likelihood perspective, making it an efficient OOD detection indicator. Our method consistently achieves competitive performance on popular OOD detection benchmarks. 
On the large-scale ImageNet-1k benchmark, our method is more than 10 times faster than the KNN-based score, while simultaneously reducing the average FPR95 by 11.85%.", "keywords": "Hyperspherical energy;model reliability", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/b9389ef50e67203a371ee55824c200af143cbea4.pdf", "author": "Jirayu Burapacheep;Yixuan Li", "authorids": "~Jirayu_Burapacheep1;~Yixuan_Li1", "gender": ";F", "homepage": "https://top34051.github.io/;http://pages.cs.wisc.edu/~sharonli/", "dblp": "330/2284;144/6087-1", "google_scholar": ";https://scholar.google.com/citations?hl=en", "orcid": ";", "linkedin": ";liyixuan", "or_profile": "~Jirayu_Burapacheep1;~Yixuan_Li1", "aff": "Stanford University;Cornell University", "aff_domain": "stanford.edu;cornell.edu", "position": "MS student;Graduate Student", "bibtex": "@misc{\nburapacheep2024outofdistribution,\ntitle={Out-of-Distribution Detection with Hyperspherical Energy},\nauthor={Jirayu Burapacheep and Yixuan Li},\nyear={2024},\nurl={https://openreview.net/forum?id=6sfRRcynDy}\n}", "github": "", "project": "", "reviewers": "A9ru;aQu1;uYkE;fiAA", "site": "https://openreview.net/forum?id=6sfRRcynDy", "pdf_size": 2597262, "rating": "3;5;5;6", "confidence": "5;3;3;4", "soundness": "1;3;3;3", "contribution": "1;2;2;2", "presentation": "2;3;2;4", "wc_summary": "88;148;98;68", "wc_strengths": "23;49;31;38", "wc_weaknesses": "516;171;126;128", "wc_questions": "262;276;299;127", "wc_review": "889;644;554;361", "wc_reply_reviewers": "123;20;93;38", "wc_reply_authors": "705;749;666;551", "reply_reviewers": "1;1;1;1", "reply_authors": "1;2;1;2", "rating_avg": [ 4.75, 1.0897247358851685 ], "confidence_avg": [ 3.75, 0.82915619758885 ], "soundness_avg": [ 2.5, 0.8660254037844386 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.82915619758885 ], "wc_summary_avg": [ 100.5, 29.47456530637899 ], "wc_strengths_avg": [ 35.25, 9.54921462739214 ], "wc_weaknesses_avg": [ 235.25, 163.0849088665165 ], "wc_questions_avg": [ 241.0, 67.1304699819687 ], "wc_review_avg": [ 612.0, 189.81438301667237 ], "wc_reply_reviewers_avg": [ 68.5, 41.391424232562954 ], "wc_reply_authors_avg": [ 667.75, 73.52338063500616 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.6225430174794673, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:GM_vH_bqG4oJ:scholar.google.com/&scioq=Out-of-Distribution+Detection+with+Hyperspherical+Energy&hl=en&as_sdt=0,44", "gs_version_total": 0, "aff_unique_index": "0;1", "aff_unique_norm": "Stanford University;Cornell University", "aff_unique_dep": ";", "aff_unique_url": "https://www.stanford.edu;https://www.cornell.edu", "aff_unique_abbr": "Stanford;Cornell", "aff_campus_unique_index": "0", "aff_campus_unique": "Stanford;", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "id": "6ssOs9BBxa", "title": "A Competition Winning Deep Reinforcement Learning Agent in microRTS", "track": "main", "status": "Reject", "tldr": "", "abstract": "Scripted agents have predominantly won the five\nprevious iterations of the IEEE microRTS ($\\mu$RTS) competitions hosted at CIG and\nCoG. 
Despite Deep Reinforcement Learning (DRL) algorithms making significant strides\nin real-time strategy (RTS) games, their adoption in this primarily academic\ncompetition has been limited due to the considerable training resources required and the complexity\ninherent in creating and debugging such agents. \\agentName\\ is the first DRL agent\nto win the IEEE microRTS competition. In a benchmark without performance\nconstraints, \\agentName\\ regularly defeated the two\nprior competition winners. This first competition-winning DRL submission can be\na benchmark for future microRTS competitions and a starting point for future DRL\nresearch. Iteratively fine-tuning the base policy and transfer learning to specific maps were \ncritical to \\agentName's winning performance. These strategies can be used in\neconomically training future DRL agents. Further work in Imitation Learning using Behavior Cloning and\nfine-tuning these models with DRL has proven promising as an efficient way\nto bootstrap models with novel behaviors.", "keywords": "reinforcement learning;microRTS;PPO;RTS;imitation learning;behavior cloning", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/53aa2a4210ecec81e72e23dc3c3aed3e34c76bb1.zip", "author": "Scott Goodfriend", "authorids": "~Scott_Goodfriend1", "gender": "", "homepage": "", "dblp": "125/2125", "google_scholar": "HwatFwIAAAAJ", "orcid": "", "linkedin": "scottgoodfriend/", "or_profile": "~Scott_Goodfriend1", "aff": "Anthropic", "aff_domain": "anthropic.com", "position": "Researcher", "bibtex": "@misc{\ngoodfriend2024a,\ntitle={A Competition Winning Deep Reinforcement Learning Agent in micro{RTS}},\nauthor={Scott Goodfriend},\nyear={2024},\nurl={https://openreview.net/forum?id=6ssOs9BBxa}\n}", "github": "", "project": "", "reviewers": "Pjfo;7eJX;nGmd;AVMG", "site": "https://openreview.net/forum?id=6ssOs9BBxa", "pdf_size": 1009225, "rating": "3;5;5;6", "confidence": "4;4;4;5", "soundness": "2;4;3;3", "contribution": "2;2;3;2", "presentation": "2;3;2;3", "wc_summary": "107;118;66;103", "wc_strengths": "48;39;107;61", "wc_weaknesses": "31;118;134;119", "wc_questions": "46;32;64;118", "wc_review": "232;307;371;401", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "130;150;355;125", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 4.75, 1.0897247358851685 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 98.5, 19.551214796017153 ], "wc_strengths_avg": [ 63.75, 26.166533969939543 ], "wc_weaknesses_avg": [ 100.5, 40.623269193899205 ], "wc_questions_avg": [ 65.0, 32.63433774416144 ], "wc_review_avg": [ 327.75, 64.87439787774527 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 190.0, 95.72094859538323 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 1, 0 ], "corr_rating_confidence": 0.6622661785325219, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5650866779967715802&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "aff_unique_index": "0", "aff_unique_norm": "Anthropic", "aff_unique_dep": "", "aff_unique_url": "https://www.anthropic.com", "aff_unique_abbr": "Anthropic", "aff_country_unique_index": "0", "aff_country_unique": "United States" }, { "id": "6t8SUcA4sI", "title": "Ratio-Residual Diffusion Model for Image Restoration", "track": "main", 
"status": "Withdraw", "tldr": "", "abstract": "Most existing diffusion-based image restoration methods suffer from poor interpretability and inefficient sampling, due to their direct incorporation of degraded images as conditions within the original diffusion models. Recently, some researches have tried to build a new diffusion model by transferring the discrepancies between degraded and clear images, however, they cannot effectively model diverse degradation. To address these issues, we propose a universal diffusion model for image restoration that can cover different types of degradation. Specifically, our method consists of a Markov chain that convert a high-quality image to its low-quality counterpart. The transition kernel of this Markov chain is constructed through the ratio and residual between the high-quality and low-quality images, which provides a general expression that can effectively handle various degradation processes. Moreover, we analyze the characteristics of different degradation, and design a mean schedule that enables flexible control over the diffusion speed pertaining to different degradation, which yields better restoration performance. Extensive experiments have demonstrate that our method surpasses existing image restoration methods and achieves superior performance on multiple image restoration tasks, including deraining, dehazing, denoising, deblurring and low-light enhancement.", "keywords": "Diffusion Model;Image Restoration", "primary_area": "generative models", "supplementary_material": "", "author": "Zizheng Yang;Jie Huang;Hu Yu;Man Zhou;Bing Li;Feng Zhao", "authorids": "~Zizheng_Yang1;~Jie_Huang4;~Hu_Yu2;~Man_Zhou4;~Bing_Li16;~Feng_Zhao6", "gender": "M;M;M;M;M;M", "homepage": ";;https://yuhuustc.github.io/;https://www.ustc.edu.cn/;https://bivlab123.github.io/;", "dblp": "308/0448;;;;181/2734-4;165/8237", "google_scholar": "https://scholar.google.com/citations?hl=zh-CN;https://scholar.google.com/citations?hl=zh-CN;https://scholar.google.com.hk/citations?hl=zh-CN;;https://scholar.google.co.uk/citations?hl=en;", "orcid": ";0000-0002-3518-3404;0000-0003-0598-8989;;0000-0001-6767-8105;0000-0003-2872-605X", "linkedin": ";;;;;", "or_profile": "~Zizheng_Yang1;~Jie_Huang4;~Hu_Yu2;~Bing_Li16;~Feng_Zhao6;~man_zhou1", "aff": "University of Science and Technology of China;University of Science and Technology of China;University of Science and Technology of China;University of Science and Technology of China;University of Science and Technology of China;University of Science and Technology of China", "aff_domain": "ustc.edu.cn;ustc.edu.cn;ustc.edu.cn;ustc.edu.cn;ustc.edu.cn;ustc.edu.cn", "position": "PhD student;PhD student;PhD student;MS student;Full Professor;Postdoc", "bibtex": "@misc{\nyang2024ratioresidual,\ntitle={Ratio-Residual Diffusion Model for Image Restoration},\nauthor={Zizheng Yang and Jie Huang and Hu Yu and Man Zhou and Bing Li and Feng Zhao},\nyear={2024},\nurl={https://openreview.net/forum?id=6t8SUcA4sI}\n}", "github": "", "project": "", "reviewers": "Cv16;RMrE;xayc", "site": "https://openreview.net/forum?id=6t8SUcA4sI", "pdf_size": 8034218, "rating": "3;5;8", "confidence": "4;2;4", "soundness": "2;3;3", "contribution": "2;2;3", "presentation": "2;3;3", "wc_summary": "86;91;49", "wc_strengths": "38;41;39", "wc_weaknesses": "97;269;57", "wc_questions": "220;5;27", "wc_review": "441;406;172", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 5.333333333333333, 
2.0548046676563256 ], "confidence_avg": [ 3.3333333333333335, 0.9428090415820634 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 75.33333333333333, 18.732028424302822 ], "wc_strengths_avg": [ 39.333333333333336, 1.247219128924647 ], "wc_weaknesses_avg": [ 141.0, 91.97100992522951 ], "wc_questions_avg": [ 84.0, 96.58502299356078 ], "wc_review_avg": [ 339.6666666666667, 119.4161723646434 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 3, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.11470786693528094, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:J1TmWKB0T4UJ:scholar.google.com/&scioq=Ratio-Residual+Diffusion+Model+for+Image+Restoration&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;0;0;0;0", "aff_unique_norm": "University of Science and Technology of China", "aff_unique_dep": "", "aff_unique_url": "http://www.ustc.edu.cn", "aff_unique_abbr": "USTC", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "China" }, { "id": "6tDPefQyvB", "title": "Rotation-Equivariance and Position Encodings for Enhancing Local Descriptors", "track": "main", "status": "Reject", "tldr": "", "abstract": "Keypoint extraction and description are crucial issues in robot vision. In recent years, deep learning-based keypoint extraction has exhibited robustness to variations in lighting and viewpoint. However, due to the lack of rotational invariance in traditional convolutional networks, the performance of deep learning-based keypoint extraction significantly deteriorates under large rotations. Keypoint methods based on group-equivariant neural networks address the issue of rotational equivariance, but their overall performance also suffers. This paper addresses the problem from the perspective of keypoint description and proposes a fusion of locally rotation-equivariant descriptions with globally encoded positional information and a directional uncertainty weighted descriptor loss. This effectively enhances the performance of keypoint extraction and description. 
Validation is conducted on rotated-HPatches, rotated-MegaDepth and rotated-YFCC100M datasets.", "keywords": "Rotation equivariance;keypoint extraction", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Shuai Su;Qijun Chen", "authorids": "~Shuai_Su1;~Qijun_Chen2", "gender": "M;M", "homepage": ";http://rail.tongji.edu.cn", "dblp": ";75", "google_scholar": "rQRbFegAAAAJ;", "orcid": ";0000-0001-5644-1188", "linkedin": ";", "or_profile": "~Shuai_Su1;~Qijun_Chen2", "aff": "Tongji University;Tongji University", "aff_domain": "tongji.edu.cn;tongji.edu.cn", "position": "PhD student;Full Professor", "bibtex": "@misc{\nsu2024rotationequivariance,\ntitle={Rotation-Equivariance and Position Encodings for Enhancing Local Descriptors},\nauthor={Shuai Su and Qijun Chen},\nyear={2024},\nurl={https://openreview.net/forum?id=6tDPefQyvB}\n}", "github": "", "project": "", "reviewers": "QDcf;rhbE;FmdE;JePm", "site": "https://openreview.net/forum?id=6tDPefQyvB", "pdf_size": 3654861, "rating": "3;5;6;6", "confidence": "5;5;3;4", "soundness": "2;3;3;3", "contribution": "2;3;3;2", "presentation": "2;2;3;2", "wc_summary": "64;80;53;41", "wc_strengths": "78;73;57;57", "wc_weaknesses": "215;309;69;192", "wc_questions": "152;9;14;33", "wc_review": "509;471;193;323", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "268;82;103;68", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 5.0, 1.224744871391589 ], "confidence_avg": [ 4.25, 0.82915619758885 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 59.5, 14.361406616345072 ], "wc_strengths_avg": [ 66.25, 9.41740410091868 ], "wc_weaknesses_avg": [ 196.25, 85.5493278757934 ], "wc_questions_avg": [ 52.0, 58.42516581063335 ], "wc_review_avg": [ 374.0, 125.49501982150527 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 130.25, 80.49961180030621 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 10, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.7385489458759963, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:H0YALXUc6JUJ:scholar.google.com/&scioq=Rotation-Equivariance+and+Position+Encodings+for+Enhancing+Local+Descriptors&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "Tongji University", "aff_unique_dep": "", "aff_unique_url": "https://www.tongji.edu.cn", "aff_unique_abbr": "Tongji", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "China" }, { "id": "6tK0ayRF8H", "title": "Angle-optimized Text Embeddings", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "High-quality text embedding is pivotal in improving semantic textual similarity (STS) tasks, which are crucial components in Large Language Model (LLM) applications. However, a common challenge existing text embedding models face is the problem of vanishing gradients, primarily due to their reliance on the cosine function in the optimization objective, which has saturation zones. To address this issue, this paper proposes a novel angle-optimized text embedding model called AnglE. The core idea of AnglE is to introduce angle optimization in a complex space. 
This novel approach effectively mitigates the adverse effects of the saturation zone in the cosine function, which can impede gradient and hinder optimization processes. To set up a comprehensive STS evaluation, we experimented on existing short-text STS datasets and a newly collected long-text STS dataset from GitHub Issues. Furthermore, we examine domain-specific STS scenarios with limited labeled data and explore how AnglE works with LLM-annotated data. Extensive experiments were conducted on various tasks including short-text STS, long-text STS, and domain-specific STS tasks. The results show that AnglE outperforms the state-of-the-art (SOTA) STS models that ignore the cosine saturation zone. These findings demonstrate the ability of AnglE to generate high-quality text embeddings and the usefulness of angle optimization in STS.", "keywords": "NLP;Text Embedding;Semantic Textual Similarity", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/109e890770ab9fc45789a2d0e3fa935ad038e519.zip", "author": "Xianming LI;Jing Li", "authorids": "~Xianming_LI1;~Jing_Li18", "gender": "M;F", "homepage": ";http://www4.comp.polyu.edu.hk/~jing1li/", "dblp": "175/5398.html;181/2820-49", "google_scholar": "WwCp3OcAAAAJ;jvjOLx4AAAAJ", "orcid": "0009-0009-2610-7934;0000-0002-8044-2284", "linkedin": ";jing-li-b815b7a5/", "or_profile": "~Xianming_LI1;~Jing_Li18", "aff": "Hong Kong Polytechnic University;The Hong Kong Polytechnic University", "aff_domain": "polyu.edu.hk;polyu.edu.hk", "position": "PhD student;Assistant Professor", "bibtex": "@misc{\nli2024angleoptimized,\ntitle={Angle-optimized Text Embeddings},\nauthor={Xianming LI and Jing Li},\nyear={2024},\nurl={https://openreview.net/forum?id=6tK0ayRF8H}\n}", "github": "", "project": "", "reviewers": "7GFK;NPkC;3nS6;DPjM", "site": "https://openreview.net/forum?id=6tK0ayRF8H", "pdf_size": 677126, "rating": "5;5;5;6", "confidence": "4;4;3;3", "soundness": "3;2;2;3", "contribution": "2;2;2;3", "presentation": "3;3;2;2", "wc_summary": "80;56;72;80", "wc_strengths": "50;62;26;57", "wc_weaknesses": "153;139;106;166", "wc_questions": "28;1;56;15", "wc_review": "311;258;260;318", "wc_reply_reviewers": "0;0;18;27", "wc_reply_authors": "1112;938;995;880", "reply_reviewers": "0;0;1;1", "reply_authors": "4;3;3;3", "rating_avg": [ 5.25, 0.4330127018922193 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 72.0, 9.797958971132712 ], "wc_strengths_avg": [ 48.75, 13.808964479641476 ], "wc_weaknesses_avg": [ 141.0, 22.34949663862701 ], "wc_questions_avg": [ 25.0, 20.285462775100793 ], "wc_review_avg": [ 286.75, 27.8691137282835 ], "wc_reply_reviewers_avg": [ 11.25, 11.691342951089922 ], "wc_reply_authors_avg": [ 981.25, 85.74198213244198 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 3.25, 0.4330127018922193 ], "replies_avg": [ 21, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 381, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=9499271582100007919&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "aff_unique_index": "0;0", "aff_unique_norm": "Hong Kong Polytechnic University", "aff_unique_dep": "", "aff_unique_url": "https://www.polyu.edu.hk", "aff_unique_abbr": "PolyU", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Hong Kong SAR", "aff_country_unique_index": "0;0", 
"aff_country_unique": "China" }, { "id": "6tazBqPem3", "title": "Capacity Analysis of Vector Symbolic Architectures", "track": "main", "status": "Reject", "tldr": "", "abstract": "Hyperdimensional computing (HDC) is a biologically-inspired framework which represents symbols with high-dimensional vectors, and uses vector operations to manipulate them. The ensemble of a particular vector space and a prescribed set of vector operations (e.g., addition-like for \"bundling\" and outer-product-like for \"binding\") form a vector symbolic architecture (VSA). While VSAs have been employed in numerous learning applications and have been studied empirically, many theoretical questions about VSAs remain open. In this paper, we analyze the representation capacities of four common VSAs: MAP-I, MAP-B, and two VSAs based on sparse binary vectors. \"Representation capacity\" here refers to bounds on the dimensions of the VSA vectors required to perform certain symbolic tasks, such as testing for set membership and estimating set intersection sizes for two sets of symbols, to a given degree of accuracy. We also analyze the ability of a novel variant of a Hopfield network (a simple model of associative memory) to perform some of the same tasks that are typically asked of VSAs. In addition to providing new bounds on VSA capacities, our analyses establish and leverage connections between VSAs, \"sketching\" (dimensionality reduction) algorithms, and Bloom filters.", "keywords": "Hyperdimensional computing;Vector Symbolic Architectures;representation learning;sketching;dimensionality reduction", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Kenneth L. Clarkson;Shashanka Ubaru;Elizabeth Yang", "authorids": "~Kenneth_L._Clarkson1;~Shashanka_Ubaru1;elizabeth_yang@berkeley.edu", "gender": "M;M;", "homepage": "http://researcher.watson.ibm.com/researcher/view.php?person=us-klclarks;http://shashankaubaru.github.io/;", "dblp": "89/2783;164/7307;", "google_scholar": "https://scholar.google.com/citations?hl=en;NmhyylsAAAAJ;", "orcid": "0000-0002-2880-2465;;", "linkedin": ";;", "or_profile": "~Kenneth_L._Clarkson1;~Shashanka_Ubaru1;elizabeth_yang@berkeley.edu", "aff": "International Business Machines;International Business Machines;", "aff_domain": "ibm.com;ibm.com;", "position": "Research Staff Member;Researcher;", "bibtex": "@misc{\nclarkson2024capacity,\ntitle={Capacity Analysis of Vector Symbolic Architectures},\nauthor={Kenneth L. 
Clarkson and Shashanka Ubaru and Elizabeth Yang},\nyear={2024},\nurl={https://openreview.net/forum?id=6tazBqPem3}\n}", "github": "", "project": "", "reviewers": "29HD;tEi4;q9j4", "site": "https://openreview.net/forum?id=6tazBqPem3", "pdf_size": 511602, "rating": "3;3;5", "confidence": "2;2;3", "soundness": "3;2;3", "contribution": "2;1;2", "presentation": "2;2;1", "wc_summary": "55;31;88", "wc_strengths": "46;16;62", "wc_weaknesses": "314;487;240", "wc_questions": "43;46;107", "wc_review": "458;580;497", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 3.6666666666666665, 0.9428090415820634 ], "confidence_avg": [ 2.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 1.6666666666666667, 0.4714045207910317 ], "presentation_avg": [ 1.6666666666666667, 0.4714045207910317 ], "wc_summary_avg": [ 58.0, 23.366642891095847 ], "wc_strengths_avg": [ 41.333333333333336, 19.067132861433457 ], "wc_weaknesses_avg": [ 347.0, 103.50201286287464 ], "wc_questions_avg": [ 65.33333333333333, 29.48822740612863 ], "wc_review_avg": [ 511.6666666666667, 50.87457343528516 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 1.0, "gs_citation": 14, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10289256151536939400&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "aff_unique_index": "0;0", "aff_unique_norm": "International Business Machines Corporation", "aff_unique_dep": "", "aff_unique_url": "https://www.ibm.com", "aff_unique_abbr": "IBM", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "title": "Towards Establishing Guaranteed Error for Learned Database Operations", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19380", "id": "6tqgL8VluV", "author_site": "Sepanta Zeighami, Cyrus Shahabi", "tldr": "", "abstract": "Machine learning models have demonstrated substantial performance enhancements over non-learned alternatives in various fundamental data management operations, including indexing (locating items in an array), cardinality estimation (estimating the number of matching records in a database), and range-sum estimation (estimating aggregate attribute values for query-matched records). However, real-world systems frequently favor less efficient non-learned methods due to their ability to offer (worst-case) error guarantees \u2014 an aspect where learned approaches often fall short. The primary objective of these guarantees is to ensure system reliability, ensuring that the chosen approach consistently delivers the desired level of accuracy across all databases. In this paper, we embark on the first theoretical study of such guarantees for learned methods, presenting the necessary conditions for such guarantees to hold when using machine learning to perform indexing, cardinality estimation and range-sum estimation. Specifically, we present the first known lower bounds on the model size required to achieve the desired accuracy for these three key database operations. 
Our results bound the required model size for given average and worst-case errors in performing database operations, serving as the first theoretical guidelines governing how model size must change based on data size to be able to guarantee an accuracy level. More broadly, our established guarantees pave the way for the broader adoption and integration of learned models into real-world systems.", "keywords": "Learned Indexing;Learned Cardinality Estimation;Machine learning for Data Management", "primary_area": "learning theory", "supplementary_material": "", "author": "Sepanta Zeighami;Cyrus Shahabi", "authorids": "~Sepanta_Zeighami2;~Cyrus_Shahabi1", "gender": "M;M", "homepage": "https://szeighami.github.io/;https://infolab.usc.edu/Shahabi/", "dblp": ";s/CyrusShahabi", "google_scholar": ";jEdhxGMAAAAJ", "orcid": ";0000-0001-9118-0681", "linkedin": ";cyrus-shahabi-9791256b/", "or_profile": "~Sepanta_Zeighami2;~Cyrus_Shahabi1", "aff": "University of Southern California;University of Southern California", "aff_domain": "usc.edu;usc.edu", "position": "PhD student;Full Professor", "bibtex": "@inproceedings{\nzeighami2024towards,\ntitle={Towards Establishing Guaranteed Error for Learned Database Operations},\nauthor={Sepanta Zeighami and Cyrus Shahabi},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=6tqgL8VluV}\n}", "github": "", "project": "", "reviewers": "Px8G;q6av;EAu4;Aapp", "pdf_size": 415907, "rating": "3;5;8;8", "confidence": "3;4;2;3", "soundness": "2;2;3;3", "contribution": "2;2;4;3", "presentation": "3;3;2;3", "wc_summary": "67;52;86;83", "wc_strengths": "30;39;124;91", "wc_weaknesses": "211;326;252;94", "wc_questions": "81;66;215;39", "wc_review": "389;483;677;307", "wc_reply_reviewers": "0;123;0;0", "wc_reply_authors": "1425;1393;553;546", "reply_reviewers": "0;2;0;0", "reply_authors": "3;2;1;1", "rating_avg": [ 6.0, 2.1213203435596424 ], "confidence_avg": [ 3.0, 0.7071067811865476 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.75, 0.82915619758885 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 72.0, 13.619838471876236 ], "wc_strengths_avg": [ 71.0, 38.451267859460756 ], "wc_weaknesses_avg": [ 220.75, 83.98623399105355 ], "wc_questions_avg": [ 100.25, 67.93885118251559 ], "wc_review_avg": [ 464.0, 137.84411485442533 ], "wc_reply_reviewers_avg": [ 30.75, 53.26056233274298 ], "wc_reply_authors_avg": [ 979.25, 429.9060217070703 ], "reply_reviewers_avg": [ 0.5, 0.8660254037844386 ], "reply_authors_avg": [ 1.75, 0.82915619758885 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.5000000000000001, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6119200784656701599&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=6tqgL8VluV", "pdf": "https://openreview.net/pdf?id=6tqgL8VluV", "email": "usc.edu;usc.edu", "author_num": 2, "aff_unique_index": "0;0", "aff_unique_norm": "University of Southern California", "aff_unique_dep": "", "aff_unique_url": "https://www.usc.edu", "aff_unique_abbr": "USC", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Los Angeles", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "id": "6u6GjS0vKZ", "title": "Coloring Deep CNN Layers with Activation Hue Loss", "track": "main", "status": "Reject", "tldr": "", "abstract": "This paper proposes a novel hue-like angular parameter to model the structure of 
deep convolutional neural network (CNN) activation space, referred to as the activation hue, for the purpose of regularizing models for more effective learning. The activation hue generalizes the notion of color hue angle in standard 3-channel RGB intensity space to $N$-channel activation space. A series of observations based on nearest neighbor indexing of activation vectors with pre-trained networks indicate that class-informative activations are concentrated about an angle $\\theta$ in both the $(x,y)$ image plane and in multi-channel activation space. A regularization term in the form of hue-like angular $\\theta$ labels is proposed to complement standard one-hot loss. Training from scratch using combined one-hot + activation hue loss improves classification performance modestly for a wide variety of classification tasks, including ImageNet.", "keywords": "supervised representation learning;general machine learning;representation learning for computer vision;visualization", "primary_area": "visualization or interpretation of learned representations", "supplementary_material": "", "author": "Louis-Fran\u00e7ois Bouchard;Mohsen Ben Lazreg;Matthew Toews", "authorids": "~Louis-Fran\u00e7ois_Bouchard1;~Mohsen_Ben_Lazreg1;~Matthew_Toews4", "gender": "M;M;", "homepage": "https://www.louisbouchard.ai;;http://www.matthewtoews.com", "dblp": ";;54/2036", "google_scholar": "45O9knIAAAAJ;;https://scholar.google.ca/citations?user=CebI4YoAAAAJ", "orcid": ";;", "linkedin": "whats-ai/;mohsen-ben-lazreg/;", "or_profile": "~Louis-Fran\u00e7ois_Bouchard1;~Mohsen_Ben_Lazreg1;~Matthew_Toews4", "aff": "Montreal Institute for Learning Algorithms, University of Montreal, Universit\u00e9 de Montr\u00e9al;;\u00c9cole de technologie sup\u00e9rieure, Universit\u00e9 du Qu\u00e9bec", "aff_domain": "mila.umontreal.ca;;etsmtl.ca", "position": "PhD student;;Full Professor", "bibtex": "@misc{\nbouchard2024coloring,\ntitle={Coloring Deep {CNN} Layers with Activation Hue Loss},\nauthor={Louis-Fran{\\c{c}}ois Bouchard and Mohsen Ben Lazreg and Matthew Toews},\nyear={2024},\nurl={https://openreview.net/forum?id=6u6GjS0vKZ}\n}", "github": "", "project": "", "reviewers": "1Awe;UKJD;2Rz4;Kfzo", "site": "https://openreview.net/forum?id=6u6GjS0vKZ", "pdf_size": 8488315, "rating": "3;3;5;6", "confidence": "4;4;3;3", "soundness": "2;1;3;3", "contribution": "2;1;2;3", "presentation": "2;2;2;3", "wc_summary": "33;336;116;41", "wc_strengths": "27;2;82;31", "wc_weaknesses": "251;2;129;71", "wc_questions": "150;2;49;4", "wc_review": "461;342;376;147", "wc_reply_reviewers": "0;178;37;18", "wc_reply_authors": "705;526;298;223", "reply_reviewers": "0;1;1;1", "reply_authors": "1;2;1;1", "rating_avg": [ 4.25, 1.299038105676658 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.25, 0.82915619758885 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 131.5, 122.42650856738503 ], "wc_strengths_avg": [ 35.5, 29.055980451535273 ], "wc_weaknesses_avg": [ 113.25, 91.35747095886576 ], "wc_questions_avg": [ 51.25, 60.030721301680195 ], "wc_review_avg": [ 331.5, 115.00108695138495 ], "wc_reply_reviewers_avg": [ 58.25, 70.36467508629596 ], "wc_reply_authors_avg": [ 438.0, 190.30107724340397 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.9622504486493761, "gs_citation": 0, "gs_cited_by_link": 
"https://scholar.google.com/scholar?q=related:L3_m4Sk9v_gJ:scholar.google.com/&scioq=Coloring+Deep+CNN+Layers+with+Activation+Hue+Loss&hl=en&as_sdt=0,6", "gs_version_total": 3, "aff_unique_index": "0;1", "aff_unique_norm": "University of Montreal;Universit\u00e9 du Qu\u00e9bec", "aff_unique_dep": "Montreal Institute for Learning Algorithms;", "aff_unique_url": "https://www.mila.quebec;https://www.etsmtl.ca", "aff_unique_abbr": "MILA;ETS", "aff_campus_unique_index": "0;1", "aff_campus_unique": "Montreal;\u00c9cole de technologie sup\u00e9rieure", "aff_country_unique_index": "0;0", "aff_country_unique": "Canada" }, { "id": "6uUmpPvqUU", "title": "The Closeness of In-Context Learning and Weight Shifting for Softmax Regression", "track": "main", "status": "Reject", "tldr": "", "abstract": "Large language models (LLMs) are known for their exceptional performance in natural language processing, making them highly effective in many human life-related tasks. The attention mechanism in the Transformer architecture is a critical component of LLMs, as it allows the model to selectively focus on specific input parts. The softmax unit, which is a key part of the attention mechanism, normalizes the attention scores. Hence, the performance of LLMs in various NLP tasks depends significantly on the crucial role played by the attention mechanism with the softmax unit. \n\nIn-context learning is one of the celebrated abilities of recent LLMs. Without further parameter updates, Transformers can learn to predict based on few in-context examples. However, the reason why Transformers becomes in-context learners is not well understood. Recently, in-context learning has been studied from a mathematical perspective with simplified linear self-attention without softmax unit. Based on a linear regression formulation $ \\min_x \\| Ax - b \\|_2 $,\nexisting works show linear Transformers' capability of learning linear functions in context. The capability of Transformers with softmax unit approaching full Transformers, however, remains unexplored. \n\nIn this work, we study the in-context learning based on a softmax regression formulation $ \\min_{x} \\| \\langle \\exp(Ax), {\\bf 1}_n \\rangle^{-1} \\exp(Ax) - b \\|_2 $. We show the upper bounds of the data transformations induced by a single self-attention layer with softmax unit and by gradient-descent on a $ \\ell_2 $ regression loss for softmax prediction function. 
Our theoretical results imply that when training self-attention-only Transformers for fundamental regression tasks, the models learned by gradient-descent and Transformers show great similarity.", "keywords": "In-Context Learning;Softmax Regression;Attention Computation", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Shuai Li;Zhao Song;Yu Xia;Tong Yu;Tianyi Zhou", "authorids": "~Shuai_Li3;~Zhao_Song3;~Yu_Xia9;~Tong_Yu3;~Tianyi_Zhou4", "gender": "F;M;M;;", "homepage": "http://shuaili8.github.io;https://www.youtube.com/@zhaosong2031;https://andree-9.github.io/;https://www.linkedin.com/in/tong-yu-42790744;", "dblp": "57/2281-10;76/4051-2;28/4326-7;32/1593-1;", "google_scholar": "https://scholar.google.com.hk/citations?user=kMZgQxcAAAAJ;yDZct7UAAAAJ;sTVqEUMAAAAJ;https://scholar.google.com/citations?hl=en;", "orcid": ";;;0000-0002-5991-2050;", "linkedin": ";;;tong-yu-42790744;", "or_profile": "~Shuai_Li3;~Zhao_Song3;~Yu_Xia9;~Tong_Yu3;~Tianyi_Zhou4", "aff": "John Hopcroft Center, Shanghai Jiao Tong University;Adobe;University of Michigan;Adobe Research;", "aff_domain": "sjtu.edu.cn;adobe.com;umich.edu;adobe.com;", "position": "Assistant Professor;Researcher;MS student;Senior Research Scientist;", "bibtex": "@misc{\nli2024the,\ntitle={The Closeness of In-Context Learning and Weight Shifting for Softmax Regression},\nauthor={Shuai Li and Zhao Song and Yu Xia and Tong Yu and Tianyi Zhou},\nyear={2024},\nurl={https://openreview.net/forum?id=6uUmpPvqUU}\n}", "github": "", "project": "", "reviewers": "ahEK;f4vr;QA3Q", "site": "https://openreview.net/forum?id=6uUmpPvqUU", "pdf_size": 553034, "rating": "5;5;5", "confidence": "2;2;2", "soundness": "2;2;3", "contribution": "2;2;2", "presentation": "1;1;2", "wc_summary": "82;66;249", "wc_strengths": "77;18;11", "wc_weaknesses": "31;75;104", "wc_questions": "204;29;3", "wc_review": "394;188;367", "wc_reply_reviewers": "15;6;0", "wc_reply_authors": "387;268;236", "reply_reviewers": "1;1;0", "reply_authors": "1;1;1", "rating_avg": [ 5.0, 0.0 ], "confidence_avg": [ 2.0, 0.0 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 1.3333333333333333, 0.4714045207910317 ], "wc_summary_avg": [ 132.33333333333334, 82.75398614098431 ], "wc_strengths_avg": [ 35.333333333333336, 29.601051032391098 ], "wc_weaknesses_avg": [ 70.0, 30.011109054259666 ], "wc_questions_avg": [ 78.66666666666667, 89.25743044076997 ], "wc_review_avg": [ 316.3333333333333, 91.41237455739908 ], "wc_reply_reviewers_avg": [ 7.0, 6.164414002968976 ], "wc_reply_authors_avg": [ 297.0, 64.96665811527222 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 10, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 43, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=1635458034096028391&as_sdt=400005&sciodt=0,14&hl=en", "gs_version_total": 4, "aff_unique_index": "0;1;2;1", "aff_unique_norm": "Shanghai Jiao Tong University;Adobe;University of Michigan", "aff_unique_dep": "John Hopcroft Center;Adobe Inc.;", "aff_unique_url": "https://www.sjtu.edu.cn;https://www.adobe.com;https://www.umich.edu", "aff_unique_abbr": "SJTU;Adobe;UM", "aff_campus_unique_index": "0", "aff_campus_unique": "Shanghai;", "aff_country_unique_index": "0;1;1;1", "aff_country_unique": "China;United States" }, { "id": "6ujgouOiAA", "title": "Use Your INSTINCT: INSTruction optimization usIng Neural bandits 
Coupled with Transformers", "track": "main", "status": "Reject", "tldr": "", "abstract": "Large language models (LLMs) have shown remarkable instruction-following capabilities and achieved impressive performances in various applications. However, the performances of LLMs depend heavily on the instructions given to them, which are typically manually tuned with substantial human efforts. Recent work has used the query-efficient Bayesian optimization (BO) algorithm to automatically optimize the instructions given to black-box LLMs. However, BO usually falls short when optimizing highly sophisticated (e.g., high-dimensional) objective functions, such as the functions mapping an instruction to the performance of an LLM. This is mainly due to the limited expressive power of the Gaussian process (GP) model which is used by BO as a surrogate to model the objective function. Meanwhile, it has been repeatedly shown that neural networks (NNs), especially pre-trained transformers, possess strong expressive power and can model highly complex functions. So, we adopt a neural bandit algorithm which replaces the GP in BO by an NN surrogate to optimize instructions for black-box LLMs. More importantly, the neural bandit algorithm allows us to naturally couple the NN surrogate with the hidden representation learned by a pre-trained transformer (i.e., an open-source LLM), which significantly boosts its performance. These motivate us to propose our INSTruction optimization usIng Neural bandits Coupled with Transformers (INSTINCT) algorithm. We perform instruction optimization for ChatGPT and use extensive experiments to show that our INSTINCT consistently outperforms the existing methods in different tasks, such as in various instruction induction tasks and the task of improving the zero-shot chain-of-thought instruction.", "keywords": "instruction optimization;prompt optimization;large language models", "primary_area": "generative models", "supplementary_material": "/attachment/752b27f36e44b6ff7be7c3ce208c106e7e4e2f1b.zip", "author": "Xiaoqiang Lin;Zhaoxuan Wu;Zhongxiang Dai;Wenyang Hu;Yao Shu;See-Kiong Ng;Patrick Jaillet;Bryan Kian Hsiang Low", "authorids": "~Xiaoqiang_Lin1;~Zhaoxuan_Wu1;~Zhongxiang_Dai1;~Wenyang_Hu1;~Yao_Shu1;~See-Kiong_Ng1;~Patrick_Jaillet1;~Bryan_Kian_Hsiang_Low1", "gender": "M;M;M;;M;M;M;M", "homepage": "https://xqlin98.github.io/;https://zhaoxuanwu.github.io/;https://daizhongxiang.github.io/;https://scholar.google.com/citations?user=EecZzYsAAAAJ;https://yao.notion.site;https://www.comp.nus.edu.sg/~ngsk/;http://web.mit.edu/jaillet/www/;http://www.comp.nus.edu.sg/~lowkh", "dblp": "269/4573;298/5083;172/4968;258/0545;44/1338;00/5480;https://dblp.uni-trier.de/pers/hd/j/Jaillet:Patrick;97/4877", "google_scholar": "nqKwA60AAAAJ;Th_mPm8AAAAJ;1v8xOIYAAAAJ;EecZzYsAAAAJ;https://scholar.google.com.au/citations?hl=en;https://scholar.google.com.tw/citations?user=_wsommYAAAAJ;ND0FM6EAAAAJ;https://scholar.google.com.tw/citations?user=2P-Q09UAAAAJ", "orcid": ";0009-0002-5659-6387;;0009-0008-6189-7890;;0000-0001-6565-7511;0000-0002-8585-6566;", "linkedin": ";zhaoxuanwu/;;;yao-shu-a5640514b;seekiong/?originalSubdomain=sg;patrick-jaillet-1260445/;", "or_profile": "~Xiaoqiang_Lin1;~Zhaoxuan_Wu1;~Zhongxiang_Dai1;~Wenyang_Hu1;~Yao_Shu1;~See-Kiong_Ng1;~Patrick_Jaillet1;~Bryan_Kian_Hsiang_Low1", "aff": "National University of Singapore;National University of Singapore;Massachusetts Institute of Technology;National University of Singapore;Guangming Lab;National University of Singapore;Massachusetts Institute 
of Technology;National University of Singapore", "aff_domain": "u.nus.edu;u.nus.edu;mit.edu;u.nus.edu;gml.ac.cn;nus.edu.sg;mit.edu;nus.edu.sg", "position": "PhD student;PhD student;Postdoc;PhD student;Researcher;Full Professor;Full Professor;Associate Professor", "bibtex": "@misc{\nlin2024use,\ntitle={Use Your {INSTINCT}: {INST}ruction optimization usIng Neural bandits Coupled with Transformers},\nauthor={Xiaoqiang Lin and Zhaoxuan Wu and Zhongxiang Dai and Wenyang Hu and Yao Shu and See-Kiong Ng and Patrick Jaillet and Bryan Kian Hsiang Low},\nyear={2024},\nurl={https://openreview.net/forum?id=6ujgouOiAA}\n}", "github": "", "project": "", "reviewers": "16Xs;TRUy;fbJ6;zDza", "site": "https://openreview.net/forum?id=6ujgouOiAA", "pdf_size": 1879662, "rating": "3;5;6;8", "confidence": "5;5;4;3", "soundness": "2;2;3;3", "contribution": "2;2;2;3", "presentation": "2;3;3;3", "wc_summary": "120;37;208;86", "wc_strengths": "21;20;190;127", "wc_weaknesses": "117;125;259;96", "wc_questions": "10;4;17;142", "wc_review": "268;186;674;451", "wc_reply_reviewers": "0;0;98;36", "wc_reply_authors": "1246;1309;2406;1646", "reply_reviewers": "0;0;1;1", "reply_authors": "5;5;6;5", "rating_avg": [ 5.5, 1.8027756377319946 ], "confidence_avg": [ 4.25, 0.82915619758885 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 112.75, 62.407431448506195 ], "wc_strengths_avg": [ 89.5, 72.50689622373861 ], "wc_weaknesses_avg": [ 149.25, 64.24319030060695 ], "wc_questions_avg": [ 43.25, 57.198666942508375 ], "wc_review_avg": [ 394.75, 187.60780234307953 ], "wc_reply_reviewers_avg": [ 33.5, 40.03436024217197 ], "wc_reply_authors_avg": [ 1651.75, 461.2582655085977 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 5.25, 0.4330127018922193 ], "replies_avg": [ 30, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": -0.9198662110077999, "gs_citation": 32, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=3800541950041619856&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "aff_unique_index": "0;0;1;0;2;0;1;0", "aff_unique_norm": "National University of Singapore;Massachusetts Institute of Technology;Guangming Lab", "aff_unique_dep": ";;", "aff_unique_url": "https://www.nus.edu.sg;https://web.mit.edu;", "aff_unique_abbr": "NUS;MIT;", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;1;0;2;0;1;0", "aff_country_unique": "Singapore;United States;China" }, { "title": "ImplicitSLIM and How it Improves Embedding-based Collaborative Filtering", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19379", "id": "6vF0ZJGor4", "author_site": "Ilya Shenbin, Sergey Nikolenko", "tldr": "", "abstract": "We present ImplicitSLIM, a novel unsupervised learning approach for sparse high-dimensional data, with applications to collaborative filtering. Sparse linear methods (SLIM) and their variations show outstanding performance, but they are memory-intensive and hard to scale. ImplicitSLIM improves embedding-based models by extracting embeddings from SLIM-like models in a computationally cheap and memory-efficient way, without explicit learning of heavy SLIM-like models. We show that ImplicitSLIM improves performance and speeds up convergence for both state of the art and classical collaborative filtering methods. 
The source code for ImplicitSLIM, related models, and applications is available at https://github.com/ilya-shenbin/ImplicitSLIM.", "keywords": "collaborative filtering;representation learning", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/25b252b964ba36bd97eaafd7c4f8c92e5a674a88.zip", "author": "Ilya Shenbin;Sergey Nikolenko", "authorids": "~Ilya_Shenbin1;~Sergey_Nikolenko1", "gender": "Not Specified;M", "homepage": ";http://logic.pdmi.ras.ru/~sergey/", "dblp": "https://dblp.uni-trier.de/pid/234/8529;50/1870.html", "google_scholar": "SluT_kMAAAAJ;https://scholar.google.ru/citations?hl=ru", "orcid": "0000-0002-6778-225X;0000-0001-7787-2251", "linkedin": ";", "or_profile": "~Ilya_Shenbin1;~Sergey_Nikolenko1", "aff": "St. Petersburg Department of Steklov Mathematical Institute;Steklov Institute of Mathematics at St. Petersburg", "aff_domain": "pdmi.ras.ru;pdmi.ras.ru", "position": "Researcher;Assistant Professor", "bibtex": "@inproceedings{\nshenbin2024implicitslim,\ntitle={Implicit{SLIM} and How it Improves Embedding-based Collaborative Filtering},\nauthor={Ilya Shenbin and Sergey Nikolenko},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=6vF0ZJGor4}\n}", "github": "", "project": "", "reviewers": "EMBd;uknn;dkLJ;Fj6S", "pdf_size": 371124, "rating": "3;3;6;8", "confidence": "1;4;4;4", "soundness": "2;3;4;3", "contribution": "2;2;3;3", "presentation": "2;3;2;3", "wc_summary": "33;15;62;120", "wc_strengths": "11;41;73;22", "wc_weaknesses": "12;266;95;23", "wc_questions": "18;6;5;45", "wc_review": "74;328;235;210", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;804;376;420", "reply_reviewers": "0;0;0;0", "reply_authors": "0;1;1;1", "rating_avg": [ 5.0, 2.1213203435596424 ], "confidence_avg": [ 3.25, 1.299038105676658 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 57.5, 39.790074139161895 ], "wc_strengths_avg": [ 36.75, 23.519938350259338 ], "wc_weaknesses_avg": [ 99.0, 101.5504800579495 ], "wc_questions_avg": [ 18.5, 16.132265804901678 ], "wc_review_avg": [ 211.75, 90.87457015029013 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 400.0, 284.68930433017675 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0.75, 0.4330127018922193 ], "replies_avg": [ 9, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.5443310539518175, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=15121309870541548515&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=6vF0ZJGor4", "pdf": "https://openreview.net/pdf?id=6vF0ZJGor4", "email": "pdmi.ras.ru;pdmi.ras.ru", "author_num": 2, "aff_unique_index": "0;1", "aff_unique_norm": "Steklov Mathematical Institute;Steklov Institute of Mathematics", "aff_unique_dep": "Department of Steklov Mathematical Institute;Mathematics", "aff_unique_url": "http://www.mi.ras.ru;http://www.pdmi.ras.ru", "aff_unique_abbr": "SMI;PDMI", "aff_campus_unique_index": "0;0", "aff_campus_unique": "St. 
Petersburg", "aff_country_unique_index": "0;0", "aff_country_unique": "Russian Federation" }, { "id": "6vtGG0WMne", "title": "Regulating Imbalanced Deep Models with User-Specified Metrics", "track": "main", "status": "Reject", "tldr": "", "abstract": "Deep learning models implemented in real-world applications still face challenges from imbalanced data. Existing methods address the imbalance problem by balancing the models between the minority class and the majority class. However, practical applications may require an imbalanced optimization strategy that selectively unbalances the models and makes them more suitable for the applications than the balanced models. In this work, we first give a formal definition to accurately quantify the degree of imbalance of a model. Then, we propose a bias adjustment method that can efficiently optimize the model to a specified imbalance state according to application metrics or requirements so that this method has wide applicability. Finally, we introduce a training strategy that is advantageous to select the optimal representation parameters of the model during traditional training process. Extensive experiments verify the effectiveness and efficiency of our method, and compared with state-of-the-art algorithms, our method has significant improvement in different metrics including accuracy, F1 value and G-means.", "keywords": "Imbalance learning;Deep learning;Imbalance metrics;Classification", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Yuqi Liu;Bin Cao;JING FAN", "authorids": "~Yuqi_Liu1;~Bin_Cao3;~JING_FAN2", "gender": "M;M;F", "homepage": ";http://www.cs.zjut.edu.cn/staffs-en/bincao.html;http://www.cs.zjut.edu.cn/staffs/jingfan.html", "dblp": "35/9071;17/1169-4;", "google_scholar": ";m4CUeVAAAAAJ;", "orcid": "0000-0003-0092-7001;;", "linkedin": ";;", "or_profile": "~Yuqi_Liu1;~Bin_Cao3;~JING_FAN2", "aff": ";Zhejiang University of Technology;Zhejiang University of Technology", "aff_domain": ";zjut.edu.cn;zjut.edu.cn", "position": ";Associate Professor;Full Professor", "bibtex": "@misc{\nliu2024regulating,\ntitle={Regulating Imbalanced Deep Models with User-Specified Metrics},\nauthor={Yuqi Liu and Bin Cao and JING FAN},\nyear={2024},\nurl={https://openreview.net/forum?id=6vtGG0WMne}\n}", "github": "", "project": "", "reviewers": "b3Zi;TH73;HH3t;tgc4", "site": "https://openreview.net/forum?id=6vtGG0WMne", "pdf_size": 274889, "rating": "3;3;6;6", "confidence": "4;3;4;4", "soundness": "2;2;3;3", "contribution": "2;2;4;3", "presentation": "2;2;3;2", "wc_summary": "85;102;94;262", "wc_strengths": "88;46;44;99", "wc_weaknesses": "197;350;45;89", "wc_questions": "96;2;46;34", "wc_review": "466;500;229;484", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.5, 1.5 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.75, 0.82915619758885 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 135.75, 73.1381398450904 ], "wc_strengths_avg": [ 69.25, 24.57005290999594 ], "wc_weaknesses_avg": [ 170.25, 117.5954399626108 ], "wc_questions_avg": [ 44.5, 33.80458548777074 ], "wc_review_avg": [ 419.75, 110.78441903083664 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 6, 0 ], "authors#_avg": [ 3, 0 ], 
"corr_rating_confidence": 0.5773502691896258, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:Gw9ETUy433wJ:scholar.google.com/&scioq=Regulating+Imbalanced+Deep+Models+with+User-Specified+Metrics&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "Zhejiang University of Technology", "aff_unique_dep": "", "aff_unique_url": "https://www.zjut.edu.cn", "aff_unique_abbr": "ZJUT", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "China" }, { "id": "6werMQy1uz", "title": "Rethinking the Buyer\u2019s Inspection Paradox in Information Markets with Language Agents", "track": "main", "status": "Reject", "tldr": "", "abstract": "This work addresses the long-standing buyer's inspection paradox for information markets. The paradox is that buyers need to access information to determine its value, while sellers need to limit access to prevent theft. To study this, we introduce an open-source simulated digital marketplace where intelligent agents, powered by language models, buy and sell information on behalf of external participants. The central mechanism enabling this marketplace is the agents' dual capabilities: they not only have the capacity to assess the quality of privileged information but also come equipped with the ability to forget. This feature allows vendors to grant temporary access to proprietary information, significantly reducing the risk of unauthorized retention while enabling agents to accurately gauge the information's relevance to specific queries or tasks. To perform well, agents must make rational decisions, strategically explore the marketplace through generated sub-queries, and synthesize answers from purchased information. 
Concretely, our experiments (a) uncover biases in language models leading to irrational behavior and evaluate techniques to mitigate these biases, (b) investigate how price affects demand in the context of informational goods, and (c) show that inspection and higher budgets both lead to higher quality outcomes.", "keywords": "Agents;Economics;Language Models", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "Martin Weiss;Nasim Rahaman;Manuel Wuthrich;Yoshua Bengio;Li Erran Li;Bernhard Sch\u00f6lkopf;Christopher Pal", "authorids": "~Martin_Weiss4;~Nasim_Rahaman1;~Manuel_Wuthrich1;~Yoshua_Bengio1;~Li_Erran_Li1;~Bernhard_Sch\u00f6lkopf1;~Christopher_Pal1", "gender": "M;M;M;M;;;", "homepage": "https://www.martincsweiss.com/;;;http://yoshuabengio.org;http://www.cs.columbia.edu/~lierranli/;;https://scholar.google.ca/citations?user=1ScWJOoAAAAJ&hl=en&oi=ao", "dblp": "12/3210;222/3165;https://dblp.uni-trier.de/pers/hd/w/W=uuml=thrich:Manuel;56/953;l/ErranLLi.html;;45/1217", "google_scholar": "t7lQYWwAAAAJ;https://scholar.google.de/citations?user=iH9DuY0AAAAJ;;kukA0LcAAAAJ;GkMfzy4AAAAJ;;https://scholar.google.ca/citations?user=1ScWJOoAAAAJ", "orcid": ";;;;;;", "linkedin": "martin-clyde-weiss/;https://de.linkedin.com/in/nasim-rahaman/de;;yoshuabengio/?originalSubdomain=ca;;;", "or_profile": "~Martin_Weiss4;~Nasim_Rahaman1;~Manuel_Wuthrich1;~Yoshua_Bengio1;~Li_Erran_Li1;~Bernhard_Sch\u00f6lkopf1;~Christopher_Pal1", "aff": "Montreal Institute for Learning Algorithms, University of Montreal, University of Montreal;Max Planck Institute for Intelligent Systems, Max-Planck Institute;Max Planck Institute for Intelligent Systems;University of Montreal;Columbia University;;Polytechnique Montreal", "aff_domain": "mila.umontreal.ca;tuebingen.mpg.de;mpg.tuebingen.de;umontreal.ca;columbia.edu;;polymtl.ca", "position": "PhD student;PhD student;Postdoc;Full Professor;Adjunct Professor;;Full Professor", "bibtex": "@misc{\nweiss2024rethinking,\ntitle={Rethinking the Buyer{\\textquoteright}s Inspection Paradox in Information Markets with Language Agents},\nauthor={Martin Weiss and Nasim Rahaman and Manuel Wuthrich and Yoshua Bengio and Li Erran Li and Bernhard Sch{\\\"o}lkopf and Christopher Pal},\nyear={2024},\nurl={https://openreview.net/forum?id=6werMQy1uz}\n}", "github": "", "project": "", "reviewers": "ovK6;mENG;STDL;UxN6", "site": "https://openreview.net/forum?id=6werMQy1uz", "pdf_size": 1759772, "rating": "5;5;6;6", "confidence": "3;2;4;4", "soundness": "2;2;2;3", "contribution": "3;2;3;3", "presentation": "4;3;2;3", "wc_summary": "133;41;42;60", "wc_strengths": "87;43;177;63", "wc_weaknesses": "245;144;365;103", "wc_questions": "113;8;5;2", "wc_review": "578;236;589;228", "wc_reply_reviewers": "0;0;114;0", "wc_reply_authors": "426;314;715;319", "reply_reviewers": "0;0;1;0", "reply_authors": "1;1;1;1", "rating_avg": [ 5.5, 0.5 ], "confidence_avg": [ 3.25, 0.82915619758885 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 69.0, 37.71604433129222 ], "wc_strengths_avg": [ 92.5, 51.212791370906544 ], "wc_weaknesses_avg": [ 214.25, 101.22098349650629 ], "wc_questions_avg": [ 32.0, 46.8134596029817 ], "wc_review_avg": [ 407.75, 175.81577716462195 ], "wc_reply_reviewers_avg": [ 28.5, 49.363448015713004 ], "wc_reply_authors_avg": [ 443.5, 163.00996902030255 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], 
"reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": 0.9045340337332909, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10665352199526562800&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 0, "aff_unique_index": "0;1;1;0;2;3", "aff_unique_norm": "University of Montreal;Max Planck Institute for Intelligent Systems;Columbia University;Polytechnique Montreal", "aff_unique_dep": "Montreal Institute for Learning Algorithms;Intelligent Systems;;", "aff_unique_url": "https://www.umontreal.ca;https://www.mpi-is.mpg.de;https://www.columbia.edu;https://www.polymtl.ca", "aff_unique_abbr": "UM;MPI-IS;Columbia;PolyMTL", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Montreal;", "aff_country_unique_index": "0;1;1;0;2;0", "aff_country_unique": "Canada;Germany;United States" }, { "title": "Chain of Hindsight aligns Language Models with Feedback", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19378", "id": "6xfe4IVcOu", "author_site": "Hao Liu, Carmelo Sferrazza, Pieter Abbeel", "tldr": "", "abstract": "Learning from human preferences is important for language models to match human needs and to align with human and social values. \nPrior works have achieved remarkable successes by learning from human feedback to understand and follow instructions. Nonetheless, these methods are either founded on hand-picked model generations that are favored by human annotators, rendering them inefficient in terms of data utilization and challenging to apply in general, or they depend on reinforcement learning, which often suffers from imperfect reward functions and relies on extremely challenging optimizations. In this work, we propose a novel technique, Chain of Hindsight, that is easy to optimize and can learn from any form of feedback, regardless of its polarity. Our idea is inspired by how humans learn from extensive feedback presented in the form of languages. We convert all types of feedback into sequences of sentences, which are then used to fine-tune the model, allowing us to take advantage of the language comprehension capabilities of language models.\nWe condition the model on a sequence of model generations paired with feedback. By doing so, the model is trained to generate outputs based on feedback, while learning to identify and correct negative attributes or errors. Applying our method to large language models, we observed that Chain of Hindsight significantly surpasses previous methods in aligning language models with human preferences. 
We report significant improvements on summarization and dialogue benchmarks, with our approach markedly preferred in human evaluations.", "keywords": "Reinforcement Learning;Reinforcement Learning from Human Feedback;RLHF", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/db2a0718e6995981e24187ef60a5d65b25d77f54.pdf", "author": "Hao Liu;Carmelo Sferrazza;Pieter Abbeel", "authorids": "~Hao_Liu1;~Carmelo_Sferrazza1;~Pieter_Abbeel2", "gender": ";M;M", "homepage": "https://sferrazza.cc;https://people.eecs.berkeley.edu/~pabbeel/;https://haoliu.ai", "dblp": "190/8406;;09/3214-55", "google_scholar": "x0_lwNYAAAAJ;https://scholar.google.com.tw/citations?user=vtwH6GkAAAAJ;wtK4Yh4AAAAJ", "orcid": "0000-0002-7432-7634;;", "linkedin": "csferrazza/;;", "or_profile": "~Carmelo_Sferrazza1;~Pieter_Abbeel2;~Hao_Liu10", "aff": "University of California, Berkeley;Covariant;University of California, Berkeley", "aff_domain": "berkeley.edu;covariant.ai;berkeley.edu", "position": "Postdoc;Founder;PhD student", "bibtex": "@inproceedings{\nliu2024chain,\ntitle={Chain of Hindsight aligns Language Models with Feedback},\nauthor={Hao Liu and Carmelo Sferrazza and Pieter Abbeel},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=6xfe4IVcOu}\n}", "github": "", "project": "", "reviewers": "us9M;KdNj;WQPV;aon5", "pdf_size": 1966600, "rating": "6;6;8;8", "confidence": "4;3;3;4", "soundness": "4;3;4;3", "contribution": "3;4;4;4", "presentation": "4;3;4;4", "wc_summary": "40;219;150;103", "wc_strengths": "50;54;95;68", "wc_weaknesses": "294;224;47;97", "wc_questions": "30;115;14;2", "wc_review": "414;612;306;270", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "634;537;207;194", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 7.0, 1.0 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 3.5, 0.5 ], "contribution_avg": [ 3.75, 0.4330127018922193 ], "presentation_avg": [ 3.75, 0.4330127018922193 ], "wc_summary_avg": [ 128.0, 65.44845299928792 ], "wc_strengths_avg": [ 66.75, 17.62632973707232 ], "wc_weaknesses_avg": [ 165.5, 98.32217450809354 ], "wc_questions_avg": [ 40.25, 44.285296657016985 ], "wc_review_avg": [ 400.5, 133.11179511974137 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 393.0, 195.5850198762676 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 10, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 155, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12944415322991485426&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=6xfe4IVcOu", "pdf": "https://openreview.net/pdf?id=6xfe4IVcOu", "email": "berkeley.edu;covariant.ai;berkeley.edu", "author_num": 3, "aff_unique_index": "0;1;0", "aff_unique_norm": "University of California, Berkeley;Covariant", "aff_unique_dep": ";", "aff_unique_url": "https://www.berkeley.edu;", "aff_unique_abbr": "UC Berkeley;", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Berkeley;", "aff_country_unique_index": "0;0", "aff_country_unique": "United States;" }, { "id": "6yJuDK1DsK", "title": "FEATHER: Lifelong Test-Time Adaptation with Lightweight Adapters", "track": "main", "status": "Reject", "tldr": "", "abstract": "Lifelong/continual test-time adaptation (TTA) refers to the problem where a pre-trained source domain model needs to be continually adapted at inference time to handle 
non-stationary test distributions. Continuously updating the source model over long horizons can result in significant drift in the source model, forgetting the source domain knowledge. Moreover, most of the existing approaches for lifelong TTA require adapting all the parameters, which can incur significant computational cost and memory consumption, limiting their applicability on edge devices for faster inference. We present FEATHER (liFelong tEst-time Adaptation wiTH lightwEight adapteRs), a novel lightweight approach that introduces only a small number of additional parameters to a pre-trained source model which can be unsupervisedly and efficiently adapted during test-time for the new test distribution(s), keeping the rest of the source model frozen. FEATHER disentangles the source domain knowledge from the target domain knowledge, making it robust against error accumulation over time. Another distinguishing aspect of FEATHER is that, unlike some recent approaches for lifelong TTA that require access to the source data for warm-starting the adaptation at test time, FEATHER does not have such a requirement. FEATHER is also orthogonal to the existing lifelong TTA approaches and can be augmented with these approaches, resulting in a significant reduction in the number of additional parameters needed to handle the lifelong TTA setting. Through extensive experiments on CIFAR-10C, CIFAR-100C, ImageNetC, and ImageNet3DCC Robustbench benchmark datasets, we demonstrate that, with substantially (85% to 94%) fewer trainable parameters, FEATHER achieves better/similar performance compared to existing SOTA lifelong TTA methods, resulting in faster adaptation and inference at test-time. The source code for FEATHER will be released upon publication.", "keywords": "test-time adaptation;source free test-time domain adaptation;parameter efficient test-time adaptation", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "/attachment/78bc76b1914db6734493d73e557dff6dd6f6cf57.zip", "author": "Dhanajit Brahma;Abhinav Joshi;Ashutosh Modi;Piyush Rai", "authorids": "~Dhanajit_Brahma1;~Abhinav_Joshi1;~Ashutosh_Modi1;~Piyush_Rai1", "gender": "M;M;M;M", "homepage": "https://sites.google.com/view/dhanajit/;https://www.cse.iitk.ac.in/users/ajoshi/;https://ashutosh-modi.github.io/;http://cse.iitk.ac.in/users/piyush/", "dblp": "235/5479;308/0603;139/0873;02/525", "google_scholar": "3PfwL2IAAAAJ;;AWu6f60AAAAJ;https://scholar.google.com.tw/citations?user=D50grEgAAAAJ", "orcid": ";0000-0001-6756-1126;;", "linkedin": ";;dr-ashutosh-modi-3907835/;", "or_profile": "~Dhanajit_Brahma1;~Abhinav_Joshi1;~Ashutosh_Modi1;~Piyush_Rai1", "aff": "Indian Institute of Technology, Kanpur;Indian Institute of Technology, Kanpur;IIT Kanpur;IIT Kanpur, IIT Kanpur", "aff_domain": "iitk.ac.in;iitk.ac.in;iitk.ac.in;cse.iitk.ac.in", "position": "PhD student;PhD student;Assistant Professor;Associate Professor", "bibtex": "@misc{\nbrahma2024feather,\ntitle={{FEATHER}: Lifelong Test-Time Adaptation with Lightweight Adapters},\nauthor={Dhanajit Brahma and Abhinav Joshi and Ashutosh Modi and Piyush Rai},\nyear={2024},\nurl={https://openreview.net/forum?id=6yJuDK1DsK}\n}", "github": "", "project": "", "reviewers": "bPzr;F1KC;M9Xj;CBjP", "site": "https://openreview.net/forum?id=6yJuDK1DsK", "pdf_size": 719544, "rating": "3;5;5;5", "confidence": "4;4;4;4", "soundness": "2;3;2;2", "contribution": "2;1;2;2", "presentation": "2;2;2;3", "wc_summary": "84;113;95;100", "wc_strengths": "21;68;22;137", 
"wc_weaknesses": "119;453;305;110", "wc_questions": "36;134;4;194", "wc_review": "260;768;426;541", "wc_reply_reviewers": "223;0;0;0", "wc_reply_authors": "968;1134;819;371", "reply_reviewers": "2;0;0;0", "reply_authors": "4;3;2;2", "rating_avg": [ 4.5, 0.8660254037844386 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 98.0, 10.41633332799983 ], "wc_strengths_avg": [ 62.0, 47.281074437876306 ], "wc_weaknesses_avg": [ 246.75, 142.26098375872422 ], "wc_questions_avg": [ 92.0, 75.90783885739337 ], "wc_review_avg": [ 498.75, 184.78010580146338 ], "wc_reply_reviewers_avg": [ 55.75, 96.5618325219649 ], "wc_reply_authors_avg": [ 823.0, 283.7542951216774 ], "reply_reviewers_avg": [ 0.5, 0.8660254037844386 ], "reply_authors_avg": [ 2.75, 0.82915619758885 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:41xGd55N9ZkJ:scholar.google.com/&scioq=FEATHER:+Lifelong+Test-Time+Adaptation+with+Lightweight+Adapters&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "Indian Institute of Technology Kanpur", "aff_unique_dep": "", "aff_unique_url": "https://www.iitk.ac.in", "aff_unique_abbr": "IIT Kanpur", "aff_campus_unique_index": "0;0;0;0", "aff_campus_unique": "Kanpur", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "India" }, { "id": "6yXAKleluj", "title": "Probabilistic Sampling-Enhanced Temporal-Spatial GCN: A Scalable Framework for Transaction Anomaly Detection in Ethereum Networks", "track": "main", "status": "Reject", "tldr": "", "abstract": "The rapid evolution of the Ethereum network necessitates sophisticated techniques to ensure its robustness against potential threats and to maintain transparency. While Graph Neural Networks (GNNs) have pioneered anomaly detection in such platforms, capturing the intricacies of both spatial and temporal transactional patterns has remained a challenge. This study presents a fusion of Graph Convolutional Networks (GCNs) with Temporal Random Walks (TRW) enhanced by probabilistic sampling to bridge this gap. Our approach, unlike traditional GCNs, leverages the strengths of TRW to discern complex temporal sequences in Ethereum transactions, thereby providing a more nuanced transaction anomaly detection mechanism. Preliminary evaluations demonstrate that our TRW-GCN framework substantially advances the performance metrics over conventional GCNs in detecting anomalies and transaction bursts. This research not only underscores the potential of temporal cues in Ethereum transactional data but also offers a scalable and effective methodology for ensuring the security and transparency of decentralized platforms. By harnessing both spatial relationships and time-based transactional sequences as node features, our model introduces an additional layer of granularity, making the detection process more robust and less prone to false positives. 
This work lays the foundation for future research aimed at optimizing and enhancing the transparency of blockchain technologies, and serves as a testament to the significance of considering both time and space dimensions in the ever-evolving landscape of the decentralized platforms.", "keywords": "Probabilistic Sampling;Temporal Random Walk;Graph Convolutional Networks;Transaction Anomaly Detection;Ethereum Networks", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/af09f14e2fba3fa490917fd9f40136d38e98ab03.zip", "author": "Stefan Behfar;Jon Crowcroft", "authorids": "~Stefan_Behfar1;~Jon_Crowcroft1", "gender": "Not Specified;M", "homepage": "https://scholar.google.com/citations?user=ucIHQQcAAAAJ&hl=en;https://www.cst.cam.ac.uk/people/jac22", "dblp": ";c/JonCrowcroft", "google_scholar": "ucIHQQcAAAAJ;https://scholar.google.com/citations?hl=en", "orcid": ";0000-0002-7013-0121", "linkedin": ";", "or_profile": "~Stefan_Behfar1;~Jon_Crowcroft1", "aff": ";university of cambridge", "aff_domain": ";cst.cam.ac.uk", "position": ";Full Professor", "bibtex": "@misc{\nbehfar2024probabilistic,\ntitle={Probabilistic Sampling-Enhanced Temporal-Spatial {GCN}: A Scalable Framework for Transaction Anomaly Detection in Ethereum Networks},\nauthor={Stefan Behfar and Jon Crowcroft},\nyear={2024},\nurl={https://openreview.net/forum?id=6yXAKleluj}\n}", "github": "", "project": "", "reviewers": "fmda;Ja7Q;RjEZ;XLac", "site": "https://openreview.net/forum?id=6yXAKleluj", "pdf_size": 1760287, "rating": "1;5;5;5", "confidence": "5;3;4;4", "soundness": "1;3;3;2", "contribution": "2;2;2;3", "presentation": "2;2;3;3", "wc_summary": "51;46;164;86", "wc_strengths": "36;18;86;29", "wc_weaknesses": "165;269;160;53", "wc_questions": "8;49;1;24", "wc_review": "260;382;411;192", "wc_reply_reviewers": "258;29;0;8", "wc_reply_authors": "1259;1413;1360;1389", "reply_reviewers": "1;1;0;1", "reply_authors": "2;2;2;2", "rating_avg": [ 4.0, 1.7320508075688772 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.25, 0.82915619758885 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 86.75, 47.187789734209844 ], "wc_strengths_avg": [ 42.25, 26.06122598804592 ], "wc_weaknesses_avg": [ 161.75, 76.3916716664847 ], "wc_questions_avg": [ 20.5, 18.445866745696716 ], "wc_review_avg": [ 311.25, 89.1666277258482 ], "wc_reply_reviewers_avg": [ 73.75, 106.90270108841965 ], "wc_reply_authors_avg": [ 1355.25, 58.6531115969136 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 2.0, 0.0 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.816496580927726, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:-9znvuTjFb0J:scholar.google.com/&scioq=Probabilistic+Sampling-Enhanced+Temporal-Spatial+GCN:+A+Scalable+Framework+for+Transaction+Anomaly+Detection+in+Ethereum+Networks&hl=en&as_sdt=0,33", "gs_version_total": 2, "aff_unique_index": "0", "aff_unique_norm": "University of Cambridge", "aff_unique_dep": "", "aff_unique_url": "https://www.cam.ac.uk", "aff_unique_abbr": "Cambridge", "aff_campus_unique_index": "0", "aff_campus_unique": "Cambridge", "aff_country_unique_index": "0", "aff_country_unique": "United Kingdom" }, { "title": "Towards Optimal Regret in Adversarial Linear MDPs with Bandit Feedback", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19377", 
"id": "6yv8UHVJn4", "author_site": "Haolin Liu, Chen-Yu Wei, Julian Zimmert", "tldr": "", "abstract": "We study online reinforcement learning in linear Markov decision processes with adversarial losses and bandit feedback. We introduce two algorithms that achieve improved regret performance compared to existing approaches. The first algorithm, although computationally inefficient, achieves a regret of $\\widetilde{O}(\\sqrt{K})$ without relying on simulators, where $K$ is the number of episodes. This is the first rate-optimal result in the considered setting. The second algorithm is computationally efficient and achieves a regret of $\\widetilde{O}(K^{\\frac{3}{4}})$ . These results significantly improve over the prior state-of-the-art: a computationally inefficient algorithm by Kong et al. (2023) with $\\widetilde{O}(K^{\\frac{4}{5}}+1/\\lambda_{\\min})$ regret, and a computationally efficient algorithm by Sherman et al. (2023b) with $\\widetilde{O}(K^{\\frac{6}{7}})$ regret.", "keywords": "adversarial MDPs;policy optimization;bandit feedback", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/97cfc74718dacde70485e3eecc6104b316b73157.pdf", "author": "Haolin Liu;Chen-Yu Wei;Julian Zimmert", "authorids": "~Haolin_Liu8;~Chen-Yu_Wei1;~Julian_Zimmert1", "gender": "M;M;", "homepage": "https://liuhl2000.github.io/;https://bahh723.github.io/;", "dblp": ";183/1729;190/7636", "google_scholar": ";2L2cR-kAAAAJ;", "orcid": "0000-0002-8247-9742;;", "linkedin": ";;", "or_profile": "~Haolin_Liu8;~Chen-Yu_Wei1;~Julian_Zimmert1", "aff": "University of Virginia, Charlottesville;University of Virginia, Charlottesville;Google", "aff_domain": "virginia.edu;virginia.edu;google.com", "position": "PhD student;Assistant Professor;Postdoc", "bibtex": "@inproceedings{\nliu2024towards,\ntitle={Towards Optimal Regret in Adversarial Linear {MDP}s with Bandit Feedback},\nauthor={Haolin Liu and Chen-Yu Wei and Julian Zimmert},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=6yv8UHVJn4}\n}", "github": "", "project": "", "reviewers": "vRkG;eGft;B4ir;QJAu", "pdf_size": 516977, "rating": "6;8;8;8", "confidence": "4;3;3;3", "soundness": "3;4;3;3", "contribution": "3;4;4;2", "presentation": "4;3;3;4", "wc_summary": "64;51;41;68", "wc_strengths": "29;112;152;70", "wc_weaknesses": "10;69;84;20", "wc_questions": "105;25;23;31", "wc_review": "208;257;300;189", "wc_reply_reviewers": "0;0;10;9", "wc_reply_authors": "560;260;371;386", "reply_reviewers": "0;0;1;1", "reply_authors": "1;1;1;1", "rating_avg": [ 7.5, 0.8660254037844386 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 3.25, 0.82915619758885 ], "presentation_avg": [ 3.5, 0.5 ], "wc_summary_avg": [ 56.0, 10.700467279516348 ], "wc_strengths_avg": [ 90.75, 45.95310109230932 ], "wc_weaknesses_avg": [ 45.75, 31.403622402519108 ], "wc_questions_avg": [ 46.0, 34.19064199455752 ], "wc_review_avg": [ 238.5, 43.31570154112709 ], "wc_reply_reviewers_avg": [ 4.75, 4.763139720814412 ], "wc_reply_authors_avg": [ 394.25, 107.36008336434915 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -1.0, "gs_citation": 10, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=13159267592321160767&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 3, "openreview": 
"https://openreview.net/forum?id=6yv8UHVJn4", "pdf": "https://openreview.net/pdf?id=6yv8UHVJn4", "email": "virginia.edu;virginia.edu;google.com", "author_num": 3, "aff_unique_index": "0;0;1", "aff_unique_norm": "University of Virginia;Google", "aff_unique_dep": ";Google", "aff_unique_url": "https://www.virginia.edu;https://www.google.com", "aff_unique_abbr": "UVA;Google", "aff_campus_unique_index": "0;0;1", "aff_campus_unique": "Charlottesville;Mountain View", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "70A6oo3Il2", "title": "AdaFlood: Adaptive Flood Regularization", "track": "main", "status": "Reject", "tldr": "", "abstract": "Although neural networks are conventionally optimized towards zero training loss, it has been recently learned that targeting a non-zero training loss threshold, referred to as a flood level, often enables better test time generalization. \nCurrent approaches, however, apply the same constant flood level to all training samples, which inherently assumes all the samples have the same difficulty.\nWe present AdaFlood, a novel flood regularization method that adapts the flood level of each training sample according to the difficulty of the sample. \nIntuitively, since training samples are not equal in difficulty, the target training loss should be conditioned on the instance. \nExperiments on datasets covering four diverse input modalities — text, images, asynchronous event sequences, and tabular — demonstrate the versatility of AdaFlood across data domains and noise levels.", "keywords": "Flood;Overfitting;Regularization", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/782078da05d714c872ff19ac77ca1124a583d641.pdf", "author": "Wonho Bae;Yi Ren;Mohamed Osama Ahmed;Frederick Tung;Danica J. Sutherland;Gabriel L. Oliveira", "authorids": "~Wonho_Bae1;~Yi_Ren6;~Mohamed_Osama_Ahmed2;~Frederick_Tung1;~Danica_J._Sutherland1;~Gabriel_L._Oliveira1", "gender": "M;M;M;M;M;F", "homepage": "https://won-bae.github.io/;https://joshua-ren.github.io/;;;https://sites.google.com/view/gabriel-leivas-oliveira/home;http://www.djsutherland.ml", "dblp": "259/5393;;https://dblp.org/pers/hd/a/Ahmed:Mohamed_Osama;10/7697;117/2073;92/10966", "google_scholar": "https://scholar.google.ca/citations?user=EEwA__kAAAAJ;5QNce38AAAAJ;https://scholar.google.ca/citations?user=jyVyVj4AAAAJ;https://scholar.google.ca/citations?user=T4EeZ9gAAAAJ;5anRZEcAAAAJ;https://scholar.google.co.uk/citations?user=uO_NqicAAAAJ", "orcid": ";;0000-0001-6758-1178;;0000-0003-0099-9873;0000-0002-1525-3532", "linkedin": "wonho-bae/;;mohamed-osama-ahmed-91439a154/;;;", "or_profile": "~Wonho_Bae1;~Yi_Ren6;~Mohamed_Osama_Ahmed2;~Frederick_Tung1;~Gabriel_L._Oliveira1;~Danica_J._Sutherland2", "aff": "University of British Columbia;University of British Columbia;;Borealis AI;Borealis AI;University of British Columbia", "aff_domain": "cs.ubc.ca;ubc.ca;;borealisai.com;borealisai.com;cs.ubc.ca", "position": "PhD student;PhD student;;Researcher;Senior Machine Learning Researcher;Assistant Professor", "bibtex": "@misc{\nbae2024adaflood,\ntitle={AdaFlood: Adaptive Flood Regularization},\nauthor={Wonho Bae and Yi Ren and Mohamed Osama Ahmed and Frederick Tung and Danica J. Sutherland and Gabriel L. 
Oliveira},\nyear={2024},\nurl={https://openreview.net/forum?id=70A6oo3Il2}\n}", "github": "", "project": "", "reviewers": "o6wC;vFax;R2kv", "site": "https://openreview.net/forum?id=70A6oo3Il2", "pdf_size": 942269, "rating": "3;5;5", "confidence": "4;3;3", "soundness": "3;2;2", "contribution": "2;2;2", "presentation": "3;3;3", "wc_summary": "72;191;38", "wc_strengths": "65;38;25", "wc_weaknesses": "161;548;37", "wc_questions": "1;9;3", "wc_review": "299;786;103", "wc_reply_reviewers": "54;0;0", "wc_reply_authors": "1537;2134;417", "reply_reviewers": "1;0;0", "reply_authors": "3;3;1", "rating_avg": [ 4.333333333333333, 0.9428090415820634 ], "confidence_avg": [ 3.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 100.33333333333333, 65.59640911581127 ], "wc_strengths_avg": [ 42.666666666666664, 16.659998666133067 ], "wc_weaknesses_avg": [ 248.66666666666666, 217.63016539278027 ], "wc_questions_avg": [ 4.333333333333333, 3.39934634239519 ], "wc_review_avg": [ 396.0, 287.14572374783273 ], "wc_reply_reviewers_avg": [ 18.0, 25.45584412271571 ], "wc_reply_authors_avg": [ 1362.6666666666667, 711.719201808004 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 2.3333333333333335, 0.9428090415820634 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.9999999999999998, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=13033532297663653967&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "aff_unique_index": "0;0;1;1;0", "aff_unique_norm": "University of British Columbia;Borealis AI", "aff_unique_dep": ";", "aff_unique_url": "https://www.ubc.ca;https://www.borealisai.com", "aff_unique_abbr": "UBC;Borealis AI", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "Canada" }, { "title": "Continuous Invariance Learning", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19376", "id": "70IgE3tRbu", "author_site": "LIN Yong, Fan Zhou, Lu Tan, Lintao Ma, Jianmeng Liu, Yansu HE, Yuan Yuan, Yu Liu, James Zhang, Yujiu Yang, Hao Wang", "tldr": "", "abstract": "Invariance learning methods aim to learn invariant features in the hope that they generalize under distributional shift. Although many tasks are naturally characterized by continuous domains, current invariance learning techniques generally assume categorically indexed domains. For example, auto-scaling in cloud computing often needs a CPU utilization prediction model that generalizes across different times (e.g., time of a day and date of a year), where `time' is a continuous domain index. In this paper, we start by theoretically showing that existing invariance learning methods can fail for continuous domain problems. Specifically, the naive solution of splitting continuous domains into discrete ones ignores the underlying relationship among domains, and therefore potentially leads to suboptimal performance. To address this challenge, we then propose Continuous Invariance Learning (CIL), which extracts invariant features across continuously indexed domains. CIL is a novel adversarial procedure which measures and controls the conditional independence between the labels and continuous domain indices given the extracted features. 
Our theoretical analysis demonstrates that CIL learns features that satisfy the invariant constraint with infinite samples. Empirical results on both synthetic and real-world datasets (including data collected from production systems) show that CIL consistently outperforms strong baselines among all the tasks.", "keywords": "Causality; Domain Generalization; Invariance Learning", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "LIN Yong;Fan Zhou;Lu Tan;Lintao Ma;Jianmeng Liu;Yansu HE;Yuan Yuan;Yu Liu;James Y. Zhang;Yujiu Yang;Hao Wang", "authorids": "~LIN_Yong1;~Fan_Zhou10;~Lu_Tan1;~Lintao_Ma1;~Jianmeng_Liu1;~Yansu_HE1;~Yuan_Yuan5;~Yu_Liu28;~James_Y._Zhang1;~Yujiu_Yang2;~Hao_Wang3", "gender": ";M;;;M;F;F;M;M;M;", "homepage": ";;;;https://www.jmliu.site/;;https://yyuanad.github.io/;;https://scholar.google.com/citations?user=Ywakh_sAAAAJ;https://sites.google.com/view/iigroup-thu;", "dblp": ";;67/10146;;239/4809;;64/5845-2;97/2274-71.html;151/3086;30/3847;", "google_scholar": ";https://scholar.google.com/citations?view_op=list_works;yeJ3AbsAAAAJ;;;;9tI89HMAAAAJ;zbRvnkwAAAAJ;Ywakh_sAAAAJ;4gH3sxsAAAAJ;", "orcid": ";;;;;0000-0001-6433-0007;0000-0002-6609-0542;0009-0008-1719-8371;0000-0001-6519-676X;0000-0002-6427-1024;", "linkedin": ";https://www.linkedin.com/mwlite/in/moutozf;;;jianmeng-liu/;;yuan-yuan-96451747/;;jamesymzhang/;;", "or_profile": "~LIN_Yong1;~Fan_Zhou10;~Lu_Tan1;~Lintao_Ma1;~Jianmeng_Liu1;~Yansu_HE1;~Yuan_Yuan5;~Yu_Liu28;~James_Y._Zhang1;~Yujiu_Yang2;~Hao_Wang3", "aff": ";AntGroup;Tsinghua University;;Hong Kong University of Science and Technology;The Chinese University of Hong Kong;Boston College;Ant Group;Ant Group;Tsinghua University;", "aff_domain": ";antgroup.com;tsinghua.edu.cn;;ust.hk;cuhk.edu.hk;bc.edu;antgroup.com;alipay.com;tsinghua.edu.cn;", "position": ";Researcher;MS student;;Undergrad student;PhD student;Assistant Professor;Researcher;managing director;Full Professor;", "bibtex": "@inproceedings{\nyong2024continuous,\ntitle={Continuous Invariance Learning},\nauthor={LIN Yong and Fan Zhou and Lu Tan and Lintao Ma and Jianmeng Liu and Yansu HE and Yuan Yuan and Yu Liu and James Y. 
Zhang and Yujiu Yang and Hao Wang},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=70IgE3tRbu}\n}", "github": "", "project": "", "reviewers": "dGY4;Zzch;9c4M;MYYo", "pdf_size": 1901073, "rating": "5;5;8;8", "confidence": "4;3;4;4", "soundness": "3;3;3;4", "contribution": "2;3;3;3", "presentation": "3;2;2;4", "wc_summary": "106;38;71;152", "wc_strengths": "32;75;63;69", "wc_weaknesses": "344;152;251;200", "wc_questions": "10;210;148;92", "wc_review": "492;475;533;513", "wc_reply_reviewers": "0;0;98;0", "wc_reply_authors": "943;1676;2380;1006", "reply_reviewers": "0;0;1;0", "reply_authors": "3;4;6;2", "rating_avg": [ 6.5, 1.5 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.82915619758885 ], "wc_summary_avg": [ 91.75, 42.28696607703135 ], "wc_strengths_avg": [ 59.75, 16.57369904396722 ], "wc_weaknesses_avg": [ 236.75, 71.13148037261702 ], "wc_questions_avg": [ 115.0, 73.60027173862879 ], "wc_review_avg": [ 503.25, 21.821720830401986 ], "wc_reply_reviewers_avg": [ 24.5, 42.4352447854375 ], "wc_reply_authors_avg": [ 1501.25, 583.0211724285834 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 3.75, 1.479019945774904 ], "replies_avg": [ 25, 0 ], "authors#_avg": [ 11, 0 ], "corr_rating_confidence": 0.5773502691896258, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=13991504235650354242&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=70IgE3tRbu", "pdf": "https://openreview.net/pdf?id=70IgE3tRbu", "email": ";antgroup.com;tsinghua.edu.cn;;ust.hk;cuhk.edu.hk;bc.edu;antgroup.com;alipay.com;tsinghua.edu.cn;", "author_num": 11, "aff_unique_index": "0;1;2;3;4;0;0;1", "aff_unique_norm": "Ant Group;Tsinghua University;Hong Kong University of Science and Technology;Chinese University of Hong Kong;Boston College", "aff_unique_dep": ";;;;", "aff_unique_url": "https://www.antgroup.com;https://www.tsinghua.edu.cn;https://www.ust.hk;https://www.cuhk.edu.hk;https://www.bostoncollege.edu", "aff_unique_abbr": "AntGroup;THU;HKUST;CUHK;BC", "aff_campus_unique_index": "1;1", "aff_campus_unique": ";Hong Kong SAR", "aff_country_unique_index": "0;0;0;0;1;0;0;0", "aff_country_unique": "China;United States" }, { "id": "70PPJo3DwI", "title": "Towards Out-of-federation Generalization in Federated Learning", "track": "main", "status": "Desk Reject", "tldr": "", "abstract": "Federated Learning (FL) is widely employed to tackle distributed healthcare data. Existing methods primarily focus on addressing in-federation data heterogeneity. However, we observe that they can suffer from significant performance degradation when applied to unseen clients for out-of-federation (OOF) generalization. The recent attempts to address generalization to unseen clients generally fail to scale up to large-scale distributed settings due to high communication overhead and convergence difficulty. And the communication efficient methods often yield poor OOF robustness. To achieve OOF-resiliency in a scalable manner, we propose Topology-aware Federated Learning (TFL) that leverages client topology - a graph representing client relationships - to effectively train robust models against OOF data. 
We formulate a novel optimization problem for TFL, consisting of two key modules: Client Topology Learning, which infers the client relationships in a privacy-preserving manner, and Learning on Client Topology, which leverages the learned topology to identify influential clients and harness this information into the FL optimization process to efficiently build robust models. Empirical evaluation on a variety of real-world datasets verifies TFL's superior OOF robustness and communication efficiency.", "keywords": "Federated Learning; Data Heterogeneity; Robustness; Topology-aware", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/1c30298a88f91d186a09f450dab518337f3b8ef2.pdf", "author": "Mengmeng Ma;Tang Li;Weisong Shi;Xi Peng", "authorids": "~Mengmeng_Ma1;~Tang_Li1;~Weisong_Shi1;~Xi_Peng1", "gender": "M;M;M;Not Specified", "homepage": "https://mengmenm.top/;https://tangli0305.github.io/;http://weisongshi.org/;https://deep-real.github.io/dr_xipeng.html", "dblp": "150/6565-2;01/1190-5;s/WeisongShi;149/7762-5", "google_scholar": "ycXTxwoAAAAJ;mQFL3DYAAAAJ;4rPcoCEAAAAJ;DWw4v0kAAAAJ", "orcid": "0000-0002-2804-2718;0000-0002-3134-4151;;0000-0002-7772-001X", "linkedin": ";tang-li-613132180/;;xi-peng-74b540b6/", "or_profile": "~Mengmeng_Ma1;~Tang_Li1;~Weisong_Shi1;~Xi_Peng1", "aff": "University of Delaware;University of Delaware;University of Delaware;University of Delaware", "aff_domain": "udel.edu;udel.edu;udel.edu;udel.edu", "position": "PhD student;PhD student;Full Professor;Assistant Professor", "bibtex": "@misc{\nma2024towards,\ntitle={Towards Out-of-federation Generalization in Federated Learning},\nauthor={Mengmeng Ma and Tang Li and Weisong Shi and Xi Peng},\nyear={2024},\nurl={https://openreview.net/forum?id=70PPJo3DwI}\n}", "github": "", "project": "", "reviewers": "Nx6V;RF1L;L1rQ;Q4J6", "site": "https://openreview.net/forum?id=70PPJo3DwI", "pdf_size": 4228748, "rating": "5;6;6;6", "confidence": "4;4;3;3", "soundness": "2;2;3;3", "contribution": "2;2;3;3", "presentation": "2;3;3;3", "wc_summary": "98;156;91;63", "wc_strengths": "66;34;28;27", "wc_weaknesses": "263;297;137;119", "wc_questions": "3;60;92;60", "wc_review": "430;547;348;269", "wc_reply_reviewers": "0;20;0;136", "wc_reply_authors": "829;586;628;505", "reply_reviewers": "0;1;0;1", "reply_authors": "3;2;2;3", "rating_avg": [ 5.75, 0.4330127018922193 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 102.0, 33.81567683782183 ], "wc_strengths_avg": [ 38.75, 15.958931668504631 ], "wc_weaknesses_avg": [ 204.0, 77.20751258783046 ], "wc_questions_avg": [ 53.75, 32.080952292598795 ], "wc_review_avg": [ 398.5, 102.91379888042225 ], "wc_reply_reviewers_avg": [ 39.0, 56.595052787324086 ], "wc_reply_authors_avg": [ 637.0, 119.34194568549651 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 2.5, 0.5 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:7l2C0DzjiosJ:scholar.google.com/&scioq=Towards+Out-of-federation+Generalization+in+Federated+Learning&hl=en&as_sdt=0,47", "gs_version_total": 0, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "University of Delaware", "aff_unique_dep": "", "aff_unique_url": "https://www.udel.edu", "aff_unique_abbr": "UD", "aff_campus_unique_index": "", "aff_campus_unique": "", 
"aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "id": "70rlVBPX6Y", "title": "Neural Architecture Search for TinyML with Reinforcement Learning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Deploying Deep Neural Networks (DNNs) on microcontrollers (TinyML) is a common trend to process the increasing amount of sensor data generated at the edge, but in practice, resource and latency constraints make it difficult to find optimal DNN candidates. Neural Architecture Search (NAS) is an excellent approach to automate this search and can easily be combined with DNN compression techniques commonly used in TinyML. However, many NAS techniques are not only computationally expensive, especially hyperparameter optimization (HPO), but also often focus on optimizing only a single objective, e.g., maximizing accuracy, without considering additional objectives such as memory consumption or computational complexity of a model, which are key to making deployment at the edge feasible. In this paper we propose a novel NAS strategy for TinyML based on multi-objective Bayesian optimization (MOBOpt) and an ensemble of competing parametric policies trained using Augmented Random Search (ARS) Reinforcement Learning (RL) agents. Our methodology aims at efficiently finding tradeoffs between a DNN's predictive accuracy, memory consumption on a given target system, and computational complexity. Our experiments show that we outperform existing MOBOpt approaches consistently on different data sets and architectures such as ResNet-18 and MobileNetV3.", "keywords": "Hyperparameter Optimization;TinyML;Microcontrollers;Reinforcement Learning;Augmented Random Search;Multi-Objective Optimization", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Mark Deutel;Georgios Kontes;Christopher Mutschler;J\u00fcrgen Teich", "authorids": "~Mark_Deutel1;~Georgios_Kontes1;~Christopher_Mutschler1;~J\u00fcrgen_Teich1", "gender": "M;;M;M", "homepage": "https://markdeutel.github.io/;;https://www.cmutschler.de;", "dblp": "271/4795;;118/7748;https://dblp.uni-trier.de/pid/t/JurgenTeich.html", "google_scholar": "hd-tlcgAAAAJ;;https://scholar.google.de/citations?user=gKDSp8YAAAAJ;", "orcid": "0000-0001-8932-5212;;0000-0001-8108-0230;0000-0001-6285-5862", "linkedin": ";;christopher-mutschler-28431576/;", "or_profile": "~Mark_Deutel1;~Georgios_Kontes1;~Christopher_Mutschler1;~J\u00fcrgen_Teich1", "aff": "Friedrich-Alexander Universit\u00e4t Erlangen-N\u00fcrnberg;;Fraunhofer IIS;Friedrich-Alexander Universit\u00e4t Erlangen-N\u00fcrnberg", "aff_domain": "fau.de;;fraunhofer.de;fau.de", "position": "PhD student;;Principal Researcher;Full Professor", "bibtex": "@misc{\ndeutel2024neural,\ntitle={Neural Architecture Search for Tiny{ML} with Reinforcement Learning},\nauthor={Mark Deutel and Georgios Kontes and Christopher Mutschler and J{\\\"u}rgen Teich},\nyear={2024},\nurl={https://openreview.net/forum?id=70rlVBPX6Y}\n}", "github": "", "project": "", "reviewers": "FN6N;KEWJ;CC3e;4rfG;obe6", "site": "https://openreview.net/forum?id=70rlVBPX6Y", "pdf_size": 722207, "rating": "3;5;5;5;5", "confidence": "4;4;3;4;2", "soundness": "3;2;2;3;3", "contribution": "2;2;3;2;2", "presentation": "3;2;3;2;3", "wc_summary": "204;35;64;99;160", "wc_strengths": "44;22;23;49;15", "wc_weaknesses": "222;106;37;107;22", "wc_questions": "113;3;71;62;24", "wc_review": "583;166;195;317;221", "wc_reply_reviewers": "0;0;17;0;42", "wc_reply_authors": "668;300;273;508;238", "reply_reviewers": 
"0;0;1;0;1", "reply_authors": "1;1;1;1;1", "rating_avg": [ 4.6, 0.7999999999999999 ], "confidence_avg": [ 3.4, 0.8 ], "soundness_avg": [ 2.6, 0.4898979485566356 ], "contribution_avg": [ 2.2, 0.39999999999999997 ], "presentation_avg": [ 2.6, 0.4898979485566356 ], "wc_summary_avg": [ 112.4, 61.91801030394953 ], "wc_strengths_avg": [ 30.6, 13.365627557282897 ], "wc_weaknesses_avg": [ 98.8, 70.73160538260107 ], "wc_questions_avg": [ 54.6, 38.29673615335908 ], "wc_review_avg": [ 296.4, 152.00999967107427 ], "wc_reply_reviewers_avg": [ 11.8, 16.4730082255792 ], "wc_reply_authors_avg": [ 397.4, 164.81941633193586 ], "reply_reviewers_avg": [ 0.4, 0.48989794855663565 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.37500000000000017, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:xzjnoYAjOY8J:scholar.google.com/&scioq=Neural+Architecture+Search+for+TinyML+with+Reinforcement+Learning&hl=en&as_sdt=0,44", "gs_version_total": 0, "aff_unique_index": "0;1;0", "aff_unique_norm": "Friedrich-Alexander University Erlangen-N\u00fcrnberg;Fraunhofer Institute for Integrated Circuits", "aff_unique_dep": ";", "aff_unique_url": "https://www fau.de;https://www.iis.fraunhofer.de/", "aff_unique_abbr": "FAU;Fraunhofer IIS", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Erlangen-N\u00fcrnberg;", "aff_country_unique_index": "0;0;0", "aff_country_unique": "Germany" }, { "id": "70xhiS0AQS", "title": "TaskBench: Benchmarking Large Language Models for Task Automation", "track": "main", "status": "Reject", "tldr": "", "abstract": "Recently, the incredible progress of large language models (LLMs) has ignited the spark of task automation, which decomposes the complex tasks described by user instructions into sub-tasks, and invokes external tools to execute them, and plays a central role in autonomous agents. Therefore, there has been an urgent demand to formulate a systematic and standardized benchmark to foster the development of LLMs in task automation. To this end, we introduce TaskBench to evaluate task automation. Specifically, the process of task automation can be formulated as three critical stages (i.e., task decomposition, tool invocation, and parameter prediction) to fulfill user intent, that renders its data collection more challenging than common NLP tasks. Here, we introduce the concept of Tool Graph to represent the decomposed tasks in user intent, and adopt a back-instruct method to generate user instruction. Moreover, the mechanism of task automation also drives us to formulate more advanced metrics to measure the capability of LLMs. Therefore, we further propose TaskEval to evaluate the capability of LLMs in our curated datasets from different aspects, including task decomposition, tool invocation, and parameter prediction. Experimental results demonstrate that TaskBench can effectively be utilized to reflect the capability of LLMs in task automation. 
The code and datasets of TaskBench are available in the supplementary material.", "keywords": "LLM;Task Automation;Autonomous Agents", "primary_area": "datasets and benchmarks", "supplementary_material": "/attachment/a21af03466ad37a670d3d2faffedd09a5008f3bc.zip", "author": "Yongliang Shen;Kaitao Song;Xu Tan;Wenqi Zhang;Kan Ren;Siyu Yuan;Weiming Lu;Dongsheng Li;Yueting Zhuang", "authorids": "~Yongliang_Shen1;~Kaitao_Song1;~Xu_Tan1;~Wenqi_Zhang2;~Kan_Ren1;~Siyu_Yuan2;~Weiming_Lu1;~Dongsheng_Li2;~Yueting_Zhuang1", "gender": "M;M;M;;M;;;M;M", "homepage": ";;https://tan-xu.github.io/;;https://saying.ren;;;http://recmind.cn;https://person.zju.edu.cn/yzhuang", "dblp": "221/5612-1.html;222/2082;96/10484-3;;28/7458;;;254/0830-2.html;", "google_scholar": "UT3NzFAAAAAJ;https://scholar.google.com.hk/citations?user=LLk9dR8AAAAJ;tob-U1oAAAAJ;;USnQVWgAAAAJ;;;VNg5rA8AAAAJ;1RD7UJAAAAAJ", "orcid": ";;0000-0001-5631-0639;;;;;0000-0003-3103-8442;", "linkedin": ";;;;;;;;", "or_profile": "~Yongliang_Shen1;~Kaitao_Song1;~Xu_Tan1;~Wenqi_Zhang2;~Kan_Ren1;~Siyu_Yuan2;~Weiming_Lu1;~Dongsheng_Li2;~Yueting_Zhuang1", "aff": "Zhejiang University;Microsoft;Microsoft;;ShanghaiTech University;;;Microsoft Research Asia;Zhejiang University", "aff_domain": "zju.edu.cn;microsoft.com;microsoft.com;;shanghaitech.edu.cn;;;microsoft.com;zju.edu.cn", "position": "Assistant Professor;Researcher;Principal Researcher;;Assistant Professor;;;Principal Researcher;Full Professor", "bibtex": "@misc{\nshen2024taskbench,\ntitle={TaskBench: Benchmarking Large Language Models for Task Automation},\nauthor={Yongliang Shen and Kaitao Song and Xu Tan and Wenqi Zhang and Kan Ren and Siyu Yuan and Weiming Lu and Dongsheng Li and Yueting Zhuang},\nyear={2024},\nurl={https://openreview.net/forum?id=70xhiS0AQS}\n}", "github": "", "project": "", "reviewers": "CSek;peHw;LVvj;BEYM", "site": "https://openreview.net/forum?id=70xhiS0AQS", "pdf_size": 840721, "rating": "3;5;5;6", "confidence": "4;4;4;4", "soundness": "1;2;3;3", "contribution": "2;3;3;2", "presentation": "3;3;3;3", "wc_summary": "68;70;204;41", "wc_strengths": "68;82;135;26", "wc_weaknesses": "251;227;115;207", "wc_questions": "49;40;32;13", "wc_review": "436;419;486;287", "wc_reply_reviewers": "171;43;0;23", "wc_reply_authors": "1597;628;368;1037", "reply_reviewers": "2;1;0;1", "reply_authors": "6;3;1;4", "rating_avg": [ 4.75, 1.0897247358851685 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.25, 0.82915619758885 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 95.75, 63.53886605849998 ], "wc_strengths_avg": [ 77.75, 38.95109112720721 ], "wc_weaknesses_avg": [ 200.0, 51.487862647424 ], "wc_questions_avg": [ 33.5, 13.275918047351754 ], "wc_review_avg": [ 407.0, 73.5289058806127 ], "wc_reply_reviewers_avg": [ 59.25, 66.28866796067032 ], "wc_reply_authors_avg": [ 907.5, 464.04768073981364 ], "reply_reviewers_avg": [ 1.0, 0.7071067811865476 ], "reply_authors_avg": [ 3.5, 1.8027756377319946 ], "replies_avg": [ 32, 0 ], "authors#_avg": [ 9, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 48, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6584401630894271152&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "aff_unique_index": "0;1;1;2;1;0", "aff_unique_norm": "Zhejiang University;Microsoft;ShanghaiTech University", "aff_unique_dep": ";Microsoft Corporation;", "aff_unique_url": "https://www.zju.edu.cn;https://www.microsoft.com;https://www.shanghaitech.edu.cn", "aff_unique_abbr": "ZJU;Microsoft;ShanghaiTech", 
"aff_campus_unique_index": "1", "aff_campus_unique": ";Asia", "aff_country_unique_index": "0;1;1;0;0;0", "aff_country_unique": "China;United States" }, { "id": "71kocBuhNO", "title": "LogicBench: Towards Systematic Evaluation of Logical Reasoning Ability of Large Language Models", "track": "main", "status": "Reject", "tldr": "", "abstract": "Recently developed large language models (LLMs) have been shown to perform remarkably well on a wide range of language understanding tasks. But, can they really \"reason\" over the natural language? This question has been receiving significant research attention and a number of reasoning skills such as commonsense, numerical, and qualitative have been studied. However, the crucial skill pertaining to 'logical reasoning' has remained underexplored. Existing work investigating this reasoning ability has focused only on a couple of inference rules (such as modus ponens and modus tollens) of propositional and first-order logic. To enable systematic evaluation of logical reasoning, we introduce LogicBench, a natural language question-answering dataset encompassing 25 different reasoning patterns spanning over propositional, first-order, and non-monotonic logics. Key steps of our dataset construction consist of (1) controlled generation of sentences and their negations containing different ontologies, (2) (context, question, answer) triplets creation using heuristically designed templates, and (3) semantic variations of triplets adding more diversity. We present a comprehensive evaluation with a range of LLMs such as GPT-4, GPT-3, ChatGPT, and FLAN-T5 using chain-of-thought prompting in both zero-shot and few-shot settings. Experimental results show that existing LLMs do not fare well on LogicBench; especially, they struggle on instances requiring complex reasoning steps. 
Furthermore, we also show that LLMs trained using our data exhibit a better understanding of logical reasoning leading to performance improvements on several existing logical reasoning datasets such as LogicNLI, FOLIO, LogiQA, and ReClor.", "keywords": "Logical Reasoning;Large Language Models;Prompting", "primary_area": "datasets and benchmarks", "supplementary_material": "", "author": "Mihir Parmar;Neeraj Varshney;Nisarg Patel;Man Luo;Santosh Mashetty;Arindam Mitra;Chitta Baral", "authorids": "~Mihir_Parmar1;~Neeraj_Varshney1;~Nisarg_Patel1;~Man_Luo2;~Santosh_Mashetty1;~Arindam_Mitra1;~Chitta_Baral1", "gender": "M;M;;;M;M;M", "homepage": ";https://nrjvarshney.github.io/;;;;https://ari9dam.github.io/;http://chitta.orissalinks.com", "dblp": "253/6105;139/3970;304/0895;;;04/2864;b/ChittaBaral", "google_scholar": "2UPwJC4AAAAJ;Ju9nR0IAAAAJ;https://scholar.google.com/citations?hl=en;;eQN-aNAAAAAJ;https://scholar.google.com/;9Yd716IAAAAJ", "orcid": ";;0000-0001-5964-4204;;;;0000-0002-7549-723X", "linkedin": "mihir-parmar-b44003157/;neerajvarshney97/;https://linkedin.com/in/nisarg-p-patel;;santoshmashetty/;;chitta-baral-8a8438b", "or_profile": "~Mihir_Parmar1;~Neeraj_Varshney1;~Nisarg_Patel1;~Man_Luo2;~Santosh_Mashetty1;~Arindam_Mitra1;~Chitta_Baral1", "aff": "Arizona State University;Arizona State University;Arizona State University;;Arizona State University;Microsoft Research;Arizona State University", "aff_domain": "asu.edu;asu.edu;asu.edu;;asu.edu;research.microsoft.com;asu.edu", "position": "PhD student;PhD student;MS student;;PhD student;Researcher;Full Professor", "bibtex": "@misc{\nparmar2024logicbench,\ntitle={LogicBench: Towards Systematic Evaluation of Logical Reasoning Ability of Large Language Models},\nauthor={Mihir Parmar and Neeraj Varshney and Nisarg Patel and Man Luo and Santosh Mashetty and Arindam Mitra and Chitta Baral},\nyear={2024},\nurl={https://openreview.net/forum?id=71kocBuhNO}\n}", "github": "", "project": "", "reviewers": "8r5S;sePi;5vLY;Z2AS;1d9G", "site": "https://openreview.net/forum?id=71kocBuhNO", "pdf_size": 1400306, "rating": "5;5;5;6;6", "confidence": "2;2;4;5;5", "soundness": "3;3;1;4;3", "contribution": "2;3;2;3;3", "presentation": "3;3;3;3;3", "wc_summary": "102;92;112;74;66", "wc_strengths": "52;87;196;94;57", "wc_weaknesses": "74;123;290;86;219", "wc_questions": "58;1;199;538;100", "wc_review": "286;303;797;792;442", "wc_reply_reviewers": "0;32;632;0;0", "wc_reply_authors": "325;389;2371;592;646", "reply_reviewers": "0;1;2;0;0", "reply_authors": "1;1;5;2;1", "rating_avg": [ 5.4, 0.48989794855663565 ], "confidence_avg": [ 3.6, 1.3564659966250538 ], "soundness_avg": [ 2.8, 0.9797958971132712 ], "contribution_avg": [ 2.6, 0.4898979485566356 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 89.2, 17.092688495377196 ], "wc_strengths_avg": [ 97.2, 52.02845375369135 ], "wc_weaknesses_avg": [ 158.4, 83.19759611911873 ], "wc_questions_avg": [ 179.2, 190.7075247597745 ], "wc_review_avg": [ 524.0, 227.4036059520605 ], "wc_reply_reviewers_avg": [ 132.8, 249.90750288856879 ], "wc_reply_authors_avg": [ 864.6, 762.7189783924351 ], "reply_reviewers_avg": [ 0.6, 0.7999999999999999 ], "reply_authors_avg": [ 2.0, 1.5491933384829668 ], "replies_avg": [ 21, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": 0.8427009716003842, "gs_citation": 43, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12451407874556115043&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 6, "aff_unique_index": "0;0;0;0;1;0", "aff_unique_norm": "Arizona State 
University;Microsoft", "aff_unique_dep": ";Microsoft Research", "aff_unique_url": "https://www.asu.edu;https://www.microsoft.com/en-us/research", "aff_unique_abbr": "ASU;MSR", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "71mqtQdKB9", "title": "Discrete Diffusion Language Modeling by Estimating the Ratios of the Data Distribution", "track": "main", "status": "Reject", "tldr": "", "abstract": "Despite their groundbreaking performance for many generative modeling tasks, diffusion models have fallen short on discrete data domains such as natural language. Crucially, standard diffusion models rely on the well-established theory of score matching, but efforts to generalize this to discrete structures have not yielded the same empirical gains. In this work, we bridge this gap by proposing score entropy, a novel discrete score matching loss that is more stable than existing methods, forms an ELBO for maximum likelihood training, and can be efficiently optimized with a denoising variant. Combined with architectural improvements, we scale to the GPT-2 language modeling experiments, achieving highly competitive performance. When comparing similarly sized-architectures, our score entropy discrete diffusion model attains comparable zero-shot perplexities despite reporting an upper bound (within $15$ percent of and sometimes outperforming GPT-2), can trade off speed for generation quality ($4\\times$ lower generative perplexity when matching function evaluations and $16\\times$ fewer function evaluations when matching generative perplexity compared to standard autoregressive sampling), and enables arbitrary infilling beyond standard autoregressive left to right prompting.", "keywords": "Diffusion Models;Discrete Diffusion Models;Language Modeling;Transformers", "primary_area": "generative models", "supplementary_material": "", "author": "Aaron Lou;Chenlin Meng;Stefano Ermon", "authorids": "~Aaron_Lou1;~Chenlin_Meng1;~Stefano_Ermon1", "gender": "M;F;M", "homepage": "https://aaronlou.com;https://chenlin9.github.io/;http://cs.stanford.edu/~ermon/", "dblp": "232/3858;227/2517;47/8135", "google_scholar": ";nEFU7wIAAAAJ;", "orcid": ";;", "linkedin": ";;", "or_profile": "~Aaron_Lou1;~Chenlin_Meng1;~Stefano_Ermon1", "aff": "Stanford University;Stanford University;Stanford University", "aff_domain": "stanford.edu;stanford.edu;stanford.edu", "position": "PhD student;PhD student;Associate Professor", "bibtex": "@misc{\nlou2024discrete,\ntitle={Discrete Diffusion Language Modeling by Estimating the Ratios of the Data Distribution},\nauthor={Aaron Lou and Chenlin Meng and Stefano Ermon},\nyear={2024},\nurl={https://openreview.net/forum?id=71mqtQdKB9}\n}", "github": "", "project": "", "reviewers": "XAVS;DQWg;dGxc;4UNx;LEE7", "site": "https://openreview.net/forum?id=71mqtQdKB9", "pdf_size": 2383382, "rating": "5;6;6;8;8", "confidence": "3;3;4;4;4", "soundness": "3;2;3;3;4", "contribution": "2;3;3;3;4", "presentation": "2;2;3;3;3", "wc_summary": "84;94;71;219;178", "wc_strengths": "78;139;18;155;35", "wc_weaknesses": "136;188;135;895;233", "wc_questions": "108;135;128;325;109", "wc_review": "406;556;352;1594;555", "wc_reply_reviewers": "0;22;361;876;0", "wc_reply_authors": "599;790;1957;1690;222", "reply_reviewers": "0;1;4;2;0", "reply_authors": "2;3;4;4;1", "rating_avg": [ 6.6, 1.2 ], "confidence_avg": [ 3.6, 0.4898979485566356 ], "soundness_avg": [ 3.0, 0.6324555320336759 ], "contribution_avg": [ 3.0, 
0.6324555320336759 ], "presentation_avg": [ 2.6, 0.4898979485566356 ], "wc_summary_avg": [ 129.2, 58.506068061355826 ], "wc_strengths_avg": [ 85.0, 54.50504563799576 ], "wc_weaknesses_avg": [ 317.4, 291.0894020743455 ], "wc_questions_avg": [ 161.0, 82.67284923117141 ], "wc_review_avg": [ 692.6, 457.87841180820044 ], "wc_reply_reviewers_avg": [ 251.8, 340.9295528404659 ], "wc_reply_authors_avg": [ 1051.6, 661.6375442793433 ], "reply_reviewers_avg": [ 1.4, 1.4966629547095764 ], "reply_authors_avg": [ 2.8, 1.16619037896906 ], "replies_avg": [ 29, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.748455199183749, "gs_citation": 56, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=9661892450312922778&as_sdt=80000005&sciodt=0,23&hl=en", "gs_version_total": 0, "aff_unique_index": "0;0;0", "aff_unique_norm": "Stanford University", "aff_unique_dep": "", "aff_unique_url": "https://www.stanford.edu", "aff_unique_abbr": "Stanford", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Stanford", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "71oyMJiUm2", "title": "TransFace: Unit-Based Audio-Visual Speech Synthesizer for Talking Head Translation", "track": "main", "status": "Desk Reject", "tldr": "", "abstract": "Direct speech-to-speech translation achieves high-quality results through the introduction of discrete units obtained from self-supervised learning. This approach circumvents delays and cascading errors associated with model cascading. However, talking head translation, converting audio-visual speech (i.e., talking head video) from one language into another, still confronts several challenges compared to audio speech: (1) Existing methods invariably rely on cascading, synthesizing via both audio and text, resulting in delays and cascading errors. (2) Talking head translation has a limited set of reference frames. If the generated translation exceeds the length of the original speech, the video sequence needs to be supplemented by repeating frames, leading to jarring video transitions. In this work, we propose a model for talking head translation, \\textbf{TransFace}, which can directly translate audio-visual speech into audio-visual speech in other languages. It consists of a speech-to-unit translation model to convert audio speech into discrete units and a unit-based audio-visual speech synthesizer, Unit2Lip, to re-synthesize synchronized audio-visual speech from discrete units in parallel. Furthermore, we introduce a Bounded Duration Predictor, ensuring isometric talking head translation and preventing duplicate reference frames. Experiments demonstrate that our proposed Unit2Lip model significantly improves synchronization (1.601 and 0.982 on LSE-C for the original and generated audio speech, respectively) and boosts inference speed by a factor of $\\times$4.35 on LRS2. 
Additionally, TransFace achieves impressive BLEU scores of 61.93 and 47.55 for Es-En and Fr-En on LRS3-T and 100\\% isochronous translations.", "keywords": "Speech-To-Speech Translation;Talking Head Generation", "primary_area": "generative models", "supplementary_material": "/attachment/7fba415b085f897824957ea167e5279f8b4847b3.pdf", "author": "Xize Cheng;Rongjie Huang;Linjun Li;Tao Jin;Zehan Wang;Aoxiong Yin;Minglei Li;Xinyu Duan;changpeng yang;Zhou Zhao", "authorids": "~Xize_Cheng1;~Rongjie_Huang1;~Linjun_Li2;~Tao_Jin2;~Zehan_Wang2;~Aoxiong_Yin1;~Minglei_Li1;~Xinyu_Duan1;~changpeng_yang1;~Zhou_Zhao3", "gender": "M;M;;M;M;;M;M;M;", "homepage": "https://exgc.github.io/;;;https://hugddygff.github.io/;https://github.com/12zehan17;;;;https://www.researchgate.net/profile/Changpeng-Yang-2;", "dblp": "334/2167;212/8936-1;;88/4850-4.html;126/7826-1;;136/7341-1.html;31/5936;;", "google_scholar": "https://scholar.google.com/citations?hl=zh-CN;iRHBUsgAAAAJ;;;euXK0lkAAAAJ;;KqU6kVcAAAAJ;Z1XYinwAAAAJ;;", "orcid": "0000-0001-9708-3225;;;0000-0003-3564-1628;0009-0007-7509-7563;;0000-0002-1427-3507;;;", "linkedin": ";;;;;;;;;", "or_profile": "~Xize_Cheng1;~Rongjie_Huang1;~Linjun_Li2;~Tao_Jin2;~Zehan_Wang2;~Aoxiong_Yin1;~Minglei_Li1;~Xinyu_Duan1;~changpeng_yang1;~Zhou_Zhao3", "aff": "Zhejiang University;Zhejiang University;;Zhejiang University;Zhejiang University;;Huawei Cloud Computing Technologies Ltd.;Huawei Technologies Ltd.;Huawei Technologies Ltd.;", "aff_domain": "zju.edu.cn;zju.edu.cn;;zju.edu.cn;zju.edu.cn;;huawei.com;huawei.com;huawei.com;", "position": "PhD student;MS student;;Assistant Professor;PhD student;;Researcher;Researcher;Director;", "bibtex": "@misc{\ncheng2024transface,\ntitle={TransFace: Unit-Based Audio-Visual Speech Synthesizer for Talking Head Translation},\nauthor={Xize Cheng and Rongjie Huang and Linjun Li and Tao Jin and Zehan Wang and Aoxiong Yin and Minglei Li and Xinyu Duan and changpeng yang and Zhou Zhao},\nyear={2024},\nurl={https://openreview.net/forum?id=71oyMJiUm2}\n}", "github": "", "project": "", "reviewers": "hwnr;Qjzu;hZGE;d3Xc", "site": "https://openreview.net/forum?id=71oyMJiUm2", "pdf_size": 2356840, "rating": "5;6;6;8", "confidence": "3;4;3;3", "soundness": "2;3;3;3", "contribution": "2;3;3;3", "presentation": "2;3;3;3", "wc_summary": "61;68;104;196", "wc_strengths": "45;64;38;124", "wc_weaknesses": "132;96;98;259", "wc_questions": "23;206;57;28", "wc_review": "261;434;297;607", "wc_reply_reviewers": "634;20;23;172", "wc_reply_authors": "3361;1141;885;661", "reply_reviewers": "3;1;1;1", "reply_authors": "10;5;3;2", "rating_avg": [ 6.25, 1.0897247358851685 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 107.25, 53.774413060488165 ], "wc_strengths_avg": [ 67.75, 33.840619084171614 ], "wc_weaknesses_avg": [ 146.25, 66.64973743384141 ], "wc_questions_avg": [ 78.5, 74.74790966976936 ], "wc_review_avg": [ 399.75, 135.95472592006502 ], "wc_reply_reviewers_avg": [ 212.25, 251.13181299867207 ], "wc_reply_authors_avg": [ 1512.0, 1080.9454195286642 ], "reply_reviewers_avg": [ 1.5, 0.8660254037844386 ], "reply_authors_avg": [ 5.0, 3.082207001484488 ], "replies_avg": [ 33, 0 ], "authors#_avg": [ 10, 0 ], "corr_rating_confidence": -0.13245323570650439, "gs_citation": 9, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=17335056964216082744&as_sdt=5,28&sciodt=0,28&hl=en", "gs_version_total": 5, 
"aff_unique_index": "0;0;0;0;1;1;1", "aff_unique_norm": "Zhejiang University;Huawei", "aff_unique_dep": ";Cloud Computing Technologies", "aff_unique_url": "https://www.zju.edu.cn;https://www.huawei.com/en/cloud", "aff_unique_abbr": "ZJU;Huawei Cloud", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0;0", "aff_country_unique": "China" }, { "id": "71yRyuNYPu", "title": "LLMSelect: Knowledge-based Feature Selection with Large Language Models", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "How can we leverage the implicit prior knowledge and reasoning capabilities of large language models (LLMs) for standard supervised learning tasks? In this work, we demonstrate that pretrained LLMs can be used to augment traditional machine learning models by selecting high-signal features without looking at the training data. Providing only the candidate feature names and a minimal description of the prediction task, we prompt the LLM to directly output a set of numerical feature importance scores in text and use them for feature selection. In a series of real-world prediction tasks, we show that LLM-based feature selection can lead to strong downstream predictive performance, competitive with that achieved with standard selection methods such as the LASSO and sequential feature selection. We investigate the sensitivity of this approach to various prompt-design and sampling strategies and to the scale of the pretrained LLM, and find that the simple setting of zero-shot prompting with zero-temperature sampling can be sufficient for strong downstream performance, given a large enough LLM. We also demonstrate that the LLM-generated feature importance scores exhibit nontrivial rank correlation with commonly used feature importance measures such as Shapley values, which illustrate the capabilities of LLMs to effectively distill prior knowledge into meaningful numerical scores.", "keywords": "Large Language Models;Feature Selection;Machine Learning with Prior Knowledge", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Daniel P Jeong;Zachary Chase Lipton;Pradeep Kumar Ravikumar", "authorids": "~Daniel_P_Jeong1;~Zachary_Chase_Lipton1;~Pradeep_Kumar_Ravikumar1", "gender": ";Unspecified;M", "homepage": "http://djeong.com;http://zacklipton.com;http://www.cs.cmu.edu/~pradeepr/", "dblp": "145/9964;;94/3594", "google_scholar": ";MN9Kfg8AAAAJ;https://scholar.google.com.tw/citations?user=Q4DTPw4AAAAJ", "orcid": ";;", "linkedin": ";;", "or_profile": "~Daniel_P_Jeong1;~Zachary_Chase_Lipton1;~Pradeep_Kumar_Ravikumar1", "aff": "Machine Learning Department, Carnegie Mellon University;Carnegie Mellon University;Carnegie Mellon University", "aff_domain": "cs.cmu.edu;cmu.edu;cmu.edu", "position": "PhD student;Assistant Professor;Full Professor", "bibtex": "@misc{\njeong2024llmselect,\ntitle={{LLMS}elect: Knowledge-based Feature Selection with Large Language Models},\nauthor={Daniel P Jeong and Zachary Chase Lipton and Pradeep Kumar Ravikumar},\nyear={2024},\nurl={https://openreview.net/forum?id=71yRyuNYPu}\n}", "github": "", "project": "", "reviewers": "", "site": "https://openreview.net/forum?id=71yRyuNYPu", "pdf_size": 0, "rating": "", "confidence": "", "soundness": "", "contribution": "", "presentation": "", "wc_summary": "", "wc_strengths": "", "wc_weaknesses": "", "wc_questions": "", "wc_review": "", "wc_reply_reviewers": "", "wc_reply_authors": "", 
"reply_reviewers": "", "reply_authors": "", "rating_avg": [ 0, 0 ], "confidence_avg": [ 0, 0 ], "soundness_avg": [ 0, 0 ], "contribution_avg": [ 0, 0 ], "presentation_avg": [ 0, 0 ], "wc_summary_avg": [ 0, 0 ], "wc_strengths_avg": [ 0, 0 ], "wc_weaknesses_avg": [ 0, 0 ], "wc_questions_avg": [ 0, 0 ], "wc_review_avg": [ 0, 0 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 0, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:19KcixoO1aMJ:scholar.google.com/&scioq=LLMSelect:+Knowledge-based+Feature+Selection+with+Large+Language+Models&hl=en&as_sdt=0,21", "gs_version_total": 0, "aff_unique_index": "0;0;0", "aff_unique_norm": "Carnegie Mellon University", "aff_unique_dep": "Machine Learning Department", "aff_unique_url": "https://www.cmu.edu", "aff_unique_abbr": "CMU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "72MSbSZtHv", "title": "RedMotion: Motion Prediction via Redundancy Reduction", "track": "main", "status": "Reject", "tldr": "", "abstract": "Predicting the future motion of traffic agents is vital for self-driving vehicles to ensure their safe operation.\nWe introduce RedMotion, a transformer model for motion prediction that incorporates two types of redundancy reduction.\nThe first type of redundancy reduction is induced by an internal transformer decoder and reduces a variable-sized set of road environment tokens, such as road graphs with agent data, to a fixed-sized embedding.\nThe second type of redundancy reduction is a self-supervised learning objective and applies the redundancy reduction principle to embeddings generated from augmented views of road environments.\nOur experiments reveal that our representation learning approach can outperform PreTraM, Traj-MAE, and GraphDINO in a semi-supervised setting.\nOur RedMotion model achieves results that are competitive with those of Scene Transformer or MTR++.\nWe provide an anonymized open source implementation that is accessible via Colab: https://colab.research.google.com/drive/16pwsmOTYdPpbNWf2nm1olXcx1ZmsXHB8", "keywords": "Motion prediction;self-supervised learning;trajectory forecasting;self-driving", "primary_area": "applications to robotics, autonomy, planning", "supplementary_material": "", "author": "Royden Wagner;Omer Sahin Tas;Marvin Klemp;Carlos Fernandez", "authorids": "~Royden_Wagner1;~Omer_Sahin_Tas1;~Marvin_Klemp1;~Carlos_Fernandez1", "gender": "M;;M;", "homepage": ";https://www.omersahintas.com;https://www.linkedin.com/in/marvin-klemp-371428201/;https://www.mrt.kit.edu", "dblp": "318/1159;122/3330.html;;79/11147.html", "google_scholar": "tvltjqQAAAAJ;https://scholar.google.de/citations?user=opaVrnQAAAAJ;ZOCUUfoAAAAJ;OIF2_EMAAAAJ", "orcid": ";;;0000-0002-0417-6762", "linkedin": "royden-wagner-35843919b;;;", "or_profile": "~Royden_Wagner1;~Omer_Sahin_Tas1;~Marvin_Klemp1;~Carlos_Fernandez1", "aff": "Karlsruhe Institute of Technology;FZI Research Center for Information Technology;Karlsruhe Institute of Technology;Karlsruher Institut f\u00fcr Technologie", "aff_domain": "kit.edu;fzi.de;kit.edu;kit.edu", "position": "PhD student;Research Scientist;PhD student;Postdoc", "bibtex": "@misc{\nwagner2024redmotion,\ntitle={RedMotion: Motion Prediction via Redundancy Reduction},\nauthor={Royden Wagner and Omer Sahin Tas and Marvin Klemp 
and Carlos Fernandez},\nyear={2024},\nurl={https://openreview.net/forum?id=72MSbSZtHv}\n}", "github": "", "project": "", "reviewers": "NoCd;4aEu;1Zub", "site": "https://openreview.net/forum?id=72MSbSZtHv", "pdf_size": 2670915, "rating": "3;5;8", "confidence": "5;2;4", "soundness": "1;2;3", "contribution": "1;2;3", "presentation": "2;3;4", "wc_summary": "24;111;95", "wc_strengths": "16;120;90", "wc_weaknesses": "206;623;155", "wc_questions": "62;111;17", "wc_review": "308;965;357", "wc_reply_reviewers": "136;248;0", "wc_reply_authors": "438;1189;200", "reply_reviewers": "1;1;0", "reply_authors": "2;3;1", "rating_avg": [ 5.333333333333333, 2.0548046676563256 ], "confidence_avg": [ 3.6666666666666665, 1.247219128924647 ], "soundness_avg": [ 2.0, 0.816496580927726 ], "contribution_avg": [ 2.0, 0.816496580927726 ], "presentation_avg": [ 3.0, 0.816496580927726 ], "wc_summary_avg": [ 76.66666666666667, 37.80946383586463 ], "wc_strengths_avg": [ 75.33333333333333, 43.70608907489004 ], "wc_weaknesses_avg": [ 328.0, 209.63301266737545 ], "wc_questions_avg": [ 63.333333333333336, 38.38691906829142 ], "wc_review_avg": [ 543.3333333333334, 298.8336586724386 ], "wc_reply_reviewers_avg": [ 128.0, 101.40348448976823 ], "wc_reply_authors_avg": [ 609.0, 421.4743962172158 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 2.0, 0.816496580927726 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.21677749238103003, "gs_citation": 7, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=4906014090893876145&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "aff_unique_index": "0;1;0;2", "aff_unique_norm": "Karlsruhe Institute of Technology;FZI Research Center for Information Technology;Karlsruher Institut f\u00fcr Technologie", "aff_unique_dep": ";;", "aff_unique_url": "https://www.kit.edu;https://www.fzi.de;https://www.kit.edu", "aff_unique_abbr": "KIT;FZI;KIT", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "Germany" }, { "id": "73dhbcXxtV", "title": "LOLAMEME: LOGIC, LANGUAGE, MEMORY, MECHANISTIC FRAMEWORK", "track": "main", "status": "Reject", "tldr": "", "abstract": "The performance of Large Language Models has achieved superhuman breadth with unprecedented depth. At the same time, the language models are mostly black box models and the underlying mechanisms for performance have been evaluated using synthetic or mechanistic schemes. We extend current mechanistic schemes to incorporate Logic, memory, and nuances of Language such as latent structure. The proposed framework is called LOLAMEME and we provide two instantiations of LOLAMEME: LoLa and MeMe languages. We then consider two generative language model architectures: transformer-based GPT-2 and convolution-based Hyena. We propose the hybrid architecture THEX and use the LOLAMEME framework to compare the three architectures. THEX outperforms GPT-2 and Hyena on select tasks.", "keywords": "LOGIC;LANGUAGE;MEMORY;MECHANISTIC;FRAMEWORK;LLM;GENERATIVE;AI", "primary_area": "generative models", "supplementary_material": "", "author": "Jay Desai;Xiaobo Guo;Srinivasan H.
Sengamedu", "authorids": "~Jay_Desai1;~Xiaobo_Guo1;~Srinivasan_H._Sengamedu1", "gender": "M;M;", "homepage": ";;", "dblp": ";14/2107;38/2372", "google_scholar": "https://scholar.google.com/citations?hl=en;z9rwAaIAAAAJ;X9fVMRUAAAAJ", "orcid": ";0000-0002-6817-626X;0000-0003-1847-8398", "linkedin": "djaym7/;;srinivasan-h-sengamedu", "or_profile": "~Jay_Desai1;~Xiaobo_Guo1;~Srinivasan_H._Sengamedu1", "aff": "Amazon;Dartmouth College;Amazon", "aff_domain": "amazon.com;dartmouth.edu;amazon.com", "position": "Researcher;PhD student;Applied Science Manager", "bibtex": "@misc{\ndesai2024lolameme,\ntitle={{LOLAMEME}: {LOGIC}, {LANGUAGE}, {MEMORY}, {MECHANISTIC} {FRAMEWORK}},\nauthor={Jay Desai and Xiaobo Guo and Srinivasan H. Sengamedu},\nyear={2024},\nurl={https://openreview.net/forum?id=73dhbcXxtV}\n}", "github": "", "project": "", "reviewers": "JYqN;5Z2e;iHzK", "site": "https://openreview.net/forum?id=73dhbcXxtV", "pdf_size": 283801, "rating": "3;3;3", "confidence": "3;3;3", "soundness": "2;1;2", "contribution": "2;1;2", "presentation": "1;1;2", "wc_summary": "55;36;107", "wc_strengths": "56;1;21", "wc_weaknesses": "120;77;291", "wc_questions": "31;1;4", "wc_review": "262;115;423", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "263;207;654", "reply_reviewers": "0;0;0", "reply_authors": "1;1;1", "rating_avg": [ 3.0, 0.0 ], "confidence_avg": [ 3.0, 0.0 ], "soundness_avg": [ 1.6666666666666667, 0.4714045207910317 ], "contribution_avg": [ 1.6666666666666667, 0.4714045207910317 ], "presentation_avg": [ 1.3333333333333333, 0.4714045207910317 ], "wc_summary_avg": [ 66.0, 30.011109054259666 ], "wc_strengths_avg": [ 26.0, 22.73030282830976 ], "wc_weaknesses_avg": [ 162.66666666666666, 92.42774956088073 ], "wc_questions_avg": [ 12.0, 13.490737563232042 ], "wc_review_avg": [ 266.6666666666667, 125.78376507147318 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 374.6666666666667, 198.83717515148473 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 8, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:o2kYI_rQgecJ:scholar.google.com/&scioq=LOLAMEME:+LOGIC,+LANGUAGE,+MEMORY,+MECHANISTIC+FRAMEWORK&hl=en&as_sdt=0,44", "gs_version_total": 3, "aff_unique_index": "0;1;0", "aff_unique_norm": "Amazon;Dartmouth College", "aff_unique_dep": "Amazon.com, Inc.;", "aff_unique_url": "https://www.amazon.com;https://www.dartmouth.edu", "aff_unique_abbr": "Amazon;Dartmouth", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "73lu1yw6At", "title": "Complexity of Formal Explainability for Sequential Models", "track": "main", "status": "Reject", "tldr": "", "abstract": "This work contributes to formal explainability in AI (FXAI) for sequential\n models, including\n Recurrent Neural Networks (RNN), Transformers, and automata models from\n formal\nlanguage theory (e.g. finite-state automata). We study two common notions\n of explainability in FXAI: (1) abductive explanations (a.k.a. minimum sufficient \n reasons), and (2) counterfactual (a.k.a. contrastive) explanations.\n To account for various forms of sequential data (e.g. texts, time series,\n and videos), our models take a sequence of rational numbers as\n input. \n We first observe that\n simple RNN and Transformers suffer from NP-hard complexity (or sometimes \nundecidability) for both types of explanations. 
The works on extraction of \nautomata from RNN hinge on the assumption that automata are more interpretable\n than RNN. Interestingly, it turns out that generating abductive explanations\n for DFA is computationally intractable (PSPACE-complete), for features that\n are represented by regular languages. On the positive side, \n we show that deterministic finite automata (DFA) admit polynomial-time \n complexity for counterfactual explanations. \n However, DFA are a highly inexpressive model\n for classifying sequences of numbers. To address this limitation,\nwe provide two expressive extensions of finite automata, while preserving \n PTIME explainability and admitting automata learning algorithms: (1) \n deterministic interval automata, and (2) \n deterministic register automata with a fixed number of registers.", "keywords": "Logic-based explanation;sequential models;Computational Complexity;RNN;Automata;Transformers", "primary_area": "neurosymbolic & hybrid AI systems (physics-informed, logic & formal reasoning, etc.)", "supplementary_material": "", "author": "Anthony Widjaja Lin;Micha Schrader;Marvin K\u00fcnnemann;Pravriti Jaipuriyar", "authorids": "~Anthony_Widjaja_Lin1;~Micha_Schrader1;~Marvin_K\u00fcnnemann1;~Pravriti_Jaipuriyar1", "gender": "M;M;;", "homepage": "https://anthonywlin.github.io/;https://github.com/MichaSchrader;;https://github.com/jaipuriyarp", "dblp": "38/2655;309/6099;;", "google_scholar": "https://scholar.google.co.uk/citations?user=__5nnYUAAAAJ;;;", "orcid": "0000-0003-4715-5096;;;0000-0002-8306-9251", "linkedin": ";;;pravriti-jaipuriyar-08a271102", "or_profile": "~Anthony_Widjaja_Lin1;~Micha_Schrader1;~Marvin_K\u00fcnnemann1;~Pravriti_Jaipuriyar1", "aff": "Universit\u00e4t Kaiserslautern;Universit\u00e4t Kaiserslautern;;Universit\u00e4t Kaiserslautern", "aff_domain": "uni-kl.de;uni-kl.de;;uni-kl.de", "position": "Full Professor;MS student;;MS student", "bibtex": "@misc{\nlin2024complexity,\ntitle={Complexity of Formal Explainability for Sequential Models},\nauthor={Anthony Widjaja Lin and Micha Schrader and Marvin K{\\\"u}nnemann and Pravriti Jaipuriyar},\nyear={2024},\nurl={https://openreview.net/forum?id=73lu1yw6At}\n}", "github": "", "project": "", "reviewers": "XaKE;ynBt;rsdT;hXKh;56Yr", "site": "https://openreview.net/forum?id=73lu1yw6At", "pdf_size": 412897, "rating": "5;6;6;6;6", "confidence": "4;4;3;4;4", "soundness": "3;4;3;4;3", "contribution": "2;2;2;2;2", "presentation": "2;4;3;4;3", "wc_summary": "94;51;140;59;337", "wc_strengths": "71;99;68;4;115", "wc_weaknesses": "248;104;260;217;193", "wc_questions": "113;46;35;31;346", "wc_review": "526;300;503;311;991", "wc_reply_reviewers": "263;86;0;0;238", "wc_reply_authors": "918;691;374;799;992", "reply_reviewers": "1;1;0;0;2", "reply_authors": "2;1;1;1;3", "rating_avg": [ 5.8, 0.39999999999999997 ], "confidence_avg": [ 3.8, 0.39999999999999997 ], "soundness_avg": [ 3.4, 0.4898979485566356 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 3.2, 0.7483314773547882 ], "wc_summary_avg": [ 136.2, 105.19961977117599 ], "wc_strengths_avg": [ 71.4, 37.992630864418956 ], "wc_weaknesses_avg": [ 204.4, 55.42779086342879 ], "wc_questions_avg": [ 114.2, 119.64848515547533 ], "wc_review_avg": [ 526.2, 250.62114834945592 ], "wc_reply_reviewers_avg": [ 117.4, 113.39770720786201 ], "wc_reply_authors_avg": [ 754.8, 216.30108645127052 ], "reply_reviewers_avg": [ 0.8, 0.7483314773547883 ], "reply_authors_avg": [ 1.6, 0.8 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 
-0.25000000000000006, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=13966694831767173242&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 0, "aff_unique_index": "0;0;0", "aff_unique_norm": "University of Kaiserslautern", "aff_unique_dep": "", "aff_unique_url": "https://www.uni-kl.de", "aff_unique_abbr": "Uni KL", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "Germany" }, { "id": "74IIsh2kM6", "title": "SMILE: Audio-Visual Speech Recognition with Siamese Masked Interaction Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "Audio-Visual Speech Recognition (AVSR) aims to improve the performance of Automatic Speech Recognition (ASR) by incorporating visual cues in addition to audio information. In this task, the crucial aspect is establishing temporal correspondence while aligning the mutually complementary nature of audio and visual modalities. To this end, we propose the Siamese Masked Interaction LEarning (SMILE) framework, which combines the multimodal early fusion strategy and representation alignment methods between audio and visual modalities. SMILE facilitates global interactions among audio-visual features and enables single-modal and cross-modal local alignment. In addition, we propose an adaptive dynamic multimodal fusion strategy that effectively captures the complementary relationship between the audio and visual modalities. With extensive experiments, our model SMILE, when tested with different model scales, achieves state-of-the-art performance on LRS2 and LRS3 datasets under both low-resource and high-resource settings.", "keywords": "Audio-Visual Speech Recognition;Siamese Masked Interaction Learning", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/2139c645b74e489b635c4b12a2c34acb8a7c9311.zip", "author": "Tianrui Pan;Jie Liu;Jie Tang;Gangshan Wu", "authorids": "~Tianrui_Pan1;~Jie_Liu10;~Jie_Tang4;~Gangshan_Wu1", "gender": "F;M;M;M", "homepage": "https://github.com/pantianrui;https://njulj.github.io/;http://mcg.nju.edu.cn/member/tangj/index.html;http://mcg.nju.edu.cn/member/gswu/en/index.html", "dblp": ";03/2134-40;181/2702-6;78/1123", "google_scholar": ";oab9IRYAAAAJ;sJvNOBwAAAAJ;", "orcid": ";;;0000-0003-1391-1762", "linkedin": ";;;", "or_profile": "~Tianrui_Pan1;~Jie_Liu10;~Jie_Tang4;~Gangshan_Wu1", "aff": "Nanjing University;Nanjing University;Nanjing University;Nanjing University", "aff_domain": "nju.edu.cn;nju.edu.cn;nju.edu.cn;nju.edu.cn", "position": "PhD student;Researcher;Associate Professor;Full Professor", "bibtex": "@misc{\npan2024smile,\ntitle={{SMILE}: Audio-Visual Speech Recognition with Siamese Masked Interaction Learning},\nauthor={Tianrui Pan and Jie Liu and Jie Tang and Gangshan Wu},\nyear={2024},\nurl={https://openreview.net/forum?id=74IIsh2kM6}\n}", "github": "", "project": "", "reviewers": "reNT;brXn;BvrV;iBsX", "site": "https://openreview.net/forum?id=74IIsh2kM6", "pdf_size": 1556514, "rating": "5;5;5;5", "confidence": "4;4;4;4", "soundness": "2;2;3;3", "contribution": "2;3;3;2", "presentation": "3;3;3;3", "wc_summary": "55;70;81;61", "wc_strengths": "67;46;55;35", "wc_weaknesses": "112;140;91;85", "wc_questions": "310;38;4;141", "wc_review": "544;294;231;322", "wc_reply_reviewers": "83;30;18;0", "wc_reply_authors": "963;381;102;415", "reply_reviewers": "1;1;1;0", "reply_authors": "3;2;2;1", "rating_avg": [ 5.0, 0.0 ], "confidence_avg": 
[ 4.0, 0.0 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 66.75, 9.807522622966516 ], "wc_strengths_avg": [ 50.75, 11.755317945508747 ], "wc_weaknesses_avg": [ 107.0, 21.529050141610984 ], "wc_questions_avg": [ 123.25, 119.03649650422345 ], "wc_review_avg": [ 347.75, 118.0007944888508 ], "wc_reply_reviewers_avg": [ 32.75, 30.914195768287424 ], "wc_reply_authors_avg": [ 465.25, 311.98106913721546 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 2.0, 0.7071067811865476 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:9Ew6tnKk17IJ:scholar.google.com/&scioq=SMILE:+Audio-Visual+Speech+Recognition+with+Siamese+Masked+Interaction+Learning&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "Nanjing University", "aff_unique_dep": "", "aff_unique_url": "https://www.nju.edu.cn", "aff_unique_abbr": "Nanjing U", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "China" }, { "id": "74YdSRFORA", "title": "Out of Sight: A Framework for Egocentric Active Speaker Detection", "track": "main", "status": "Reject", "tldr": "", "abstract": "Current methods for Active Speaker Detection (ASD) have achieved remarkable performance in commercial movies and social media videos. However, the recent release of the Ego4D dataset has shown the limitations of contemporary ASD\nmethods when applied in the egocentric domain. In addition to the inherent challenges of egocentric data, egocentric video brings a novel prediction target to the ASD task, namely the camera wearer\u2019s speech activity. We propose a comprehensive approach to ASD in the egocentric domain that can model all the prediction targets (visible speakers, camera wearer, and global speech activity). Moreover, our proposal is fully instantiated inside a multimodal transformer module, thereby allowing it to operate in an end-to-end fashion over diverse modality encoders. Through extensive experimentation, we show that this flexible attention mechanism allows us to correctly model and estimate the speech activity of all the visible and unseen persons in a scene. 
Our proposal (ASD-Mixer) achieves state-\nof-the-art performance in the challenging Ego4D Dataset, outperforming previous state-of-the-art by at least 4.41%.", "keywords": "Audiovisual;multimodal;active speaker", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Juan C Leon Alcazar;Chen Zhao;Bernard Ghanem", "authorids": "~Juan_C_Leon_Alcazar1;~Chen_Zhao3;~Bernard_Ghanem1", "gender": "M;;M", "homepage": ";;https://ivul.kaust.edu.sa", "dblp": ";;37/2516", "google_scholar": "wHJ_cBIAAAAJ;;rVsGTeEAAAAJ", "orcid": ";;0000-0002-5534-587X", "linkedin": ";;bernardghanem/", "or_profile": "~Juan_C_Leon_Alcazar1;~Chen_Zhao3;~Bernard_Ghanem1", "aff": "King Abdullah University of Science and Technology;;King Abdullah University of Science and Technology", "aff_domain": "kaust.edu.sa;;kaust.edu.sa", "position": "Postdoc;;Full Professor", "bibtex": "@misc{\nalcazar2024out,\ntitle={Out of Sight: A Framework for Egocentric Active Speaker Detection},\nauthor={Juan C Leon Alcazar and Chen Zhao and Bernard Ghanem},\nyear={2024},\nurl={https://openreview.net/forum?id=74YdSRFORA}\n}", "github": "", "project": "", "reviewers": "1nZN;2WYw;dygL;kwFT", "site": "https://openreview.net/forum?id=74YdSRFORA", "pdf_size": 3385847, "rating": "1;3;6;6", "confidence": "4;4;3;4", "soundness": "1;3;3;3", "contribution": "1;2;2;2", "presentation": "2;2;4;4", "wc_summary": "110;114;154;88", "wc_strengths": "34;26;38;42", "wc_weaknesses": "331;288;160;32", "wc_questions": "39;54;75;2", "wc_review": "514;482;427;164", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "37;519;519;100", "reply_reviewers": "0;0;0;0", "reply_authors": "1;6;3;2", "rating_avg": [ 4.0, 2.1213203435596424 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.8660254037844386 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 3.0, 1.0 ], "wc_summary_avg": [ 116.5, 23.806511714234826 ], "wc_strengths_avg": [ 35.0, 5.916079783099616 ], "wc_weaknesses_avg": [ 202.75, 116.93881947411647 ], "wc_questions_avg": [ 42.5, 26.650515942472857 ], "wc_review_avg": [ 396.75, 137.9336344043758 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 293.75, 226.34859730071224 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 3.0, 1.8708286933869707 ], "replies_avg": [ 21, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.5443310539518174, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:B4p96g2SaAcJ:scholar.google.com/&scioq=Out+of+Sight:+A+Framework+for+Egocentric+Active+Speaker+Detection&hl=en&as_sdt=0,14", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "King Abdullah University of Science and Technology", "aff_unique_dep": "", "aff_unique_url": "https://www.kaust.edu.sa", "aff_unique_abbr": "KAUST", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "Saudi Arabia" }, { "id": "760br3YEtY", "title": "($\texttt{PEEP}$) $\textbf{P}$redicting $\textbf{E}$nzym$\textbf{e}$ $\textbf{P}$romiscuity with its Molecule Mate \u2013 an Attentive Metric Learning Solution", "track": "main", "status": "Reject", "tldr": "", "abstract": "Annotating the functions of proteins (e.g., enzymes) is a fundamental challenge, due to their diverse functionalities and rapidly increased number of protein sequences in databases.
Traditional approaches have limited capability and suffer from false positive predictions. Recent machine learning (ML) methods reach satisfactory prediction accuracy but still fail to generalize, especially for less-studied proteins and those with previously uncharacterized functions or promiscuity. To address these pain points, we propose a novel ML algorithm, PEEP, to predict enzyme promiscuity, which integrates biology priors of protein functionality to regularize the model learning. To be specific, at the input level, PEEP fuses the corresponding molecule into protein embeddings to gain their reaction information; at the model level, a tailored self-attention is leveraged to capture important residues which we found are aligned with the active site in protein pocket structure; at the objective level, we embed functionality label hierarchy into metric learning objectives by imposing a larger distance margin between proteins that have less functionality in common. PEEP is extensively validated on three public benchmarks, achieving up to 4.6%, 3.1%, 3.7% improvements on F-1 scores compared to existing methods. Moreover, it demonstrates impressive generalization to unseen protein sequences with unseen functionalities. Codes are included in the supplement.", "keywords": "Protein Engineering; Metric Learning;", "primary_area": "applications to physical sciences (physics, chemistry, biology, etc.)", "supplementary_material": "/attachment/c73442cde6e6b9893134513ccd4a1ebfa1e36ae5.zip", "author": "Xuxi Chen;Daniel Jesus Diaz;Chengyue Gong;Alex Dimakis;Adam Klivans;Zhangyang Wang;Tianlong Chen", "authorids": "~Xuxi_Chen1;~Daniel_Jesus_Diaz1;~Chengyue_Gong1;~Alex_Dimakis1;~Adam_Klivans1;~Zhangyang_Wang1;~Tianlong_Chen1", "gender": "Unspecified;M;M;M;M;M;M", "homepage": ";;;https://people.eecs.berkeley.edu/~alexdimakis/;http://www.cs.utexas.edu/~klivans;https://vita-group.github.io;https://tianlong-chen.github.io", "dblp": "267/9662;;209/4862;19/5000.html;k/AdamRKlivans;119/4026;", "google_scholar": "afsDlKYAAAAJ;lVD0CNEAAAAJ;AscakBgAAAAJ;JSFmVQEAAAAJ;;pxFyKAIAAAAJ;LE3ctn0AAAAJ", "orcid": ";0000-0002-7891-2128;;;;;0000-0001-7774-8197", "linkedin": ";aiproteins/;;alex-dimakis-b1b20320/;;;tianlong-chen-783862167/", "or_profile": "~Xuxi_Chen1;~Daniel_Jesus_Diaz1;~Chengyue_Gong1;~Alex_Dimakis1;~Adam_Klivans1;~Zhangyang_Wang1;~Tianlong_Chen1", "aff": "University of Texas at Austin;University of Texas at Austin;University of Texas at Austin;University of Texas at Austin;University of Texas, Austin;University of Texas at Austin;Harvard University", "aff_domain": "utexas.edu;utexas.edu;cs.utexas.edu;utexas.edu;cs.utexas.edu;utexas.edu;harvard.edu", "position": "PhD student;Postdoc;grad student;Full Professor;Professor;Associate Professor;Postdoc", "bibtex": "@misc{\nchen2024textttpeep,\ntitle={(\\${\\textbackslash}texttt\\{{PEEP}\\}\\$) \\${\\textbackslash}textbf\\{P\\}\\$redicting \\${\\textbackslash}textbf\\{E\\}\\$nzym\\${\\textbackslash}textbf\\{e\\}\\$ \\${\\textbackslash}textbf\\{P\\}\\$romiscuity with its Molecule Mate {\\textendash} an Attentive Metric Learning Solution},\nauthor={Xuxi Chen and Daniel Jesus Diaz and Chengyue Gong and Alex Dimakis and Adam Klivans and Zhangyang Wang and Tianlong Chen},\nyear={2024},\nurl={https://openreview.net/forum?id=760br3YEtY}\n}", "github": "", "project": "", "reviewers": "QFnk;sx29;nNj8;siYE;fk1t", "site": "https://openreview.net/forum?id=760br3YEtY", "pdf_size": 1786350, "rating": "5;5;6;6;6", "confidence": "2;4;3;4;3", "soundness": "2;3;3;3;3",
"contribution": "2;3;2;3;2", "presentation": "3;3;3;4;3", "wc_summary": "24;103;93;89;85", "wc_strengths": "80;73;47;69;31", "wc_weaknesses": "45;50;39;183;88", "wc_questions": "29;5;17;279;71", "wc_review": "178;231;196;620;275", "wc_reply_reviewers": "0;12;0;0;20", "wc_reply_authors": "345;299;277;1001;454", "reply_reviewers": "0;1;0;0;1", "reply_authors": "2;1;1;3;1", "rating_avg": [ 5.6, 0.48989794855663565 ], "confidence_avg": [ 3.2, 0.7483314773547882 ], "soundness_avg": [ 2.8, 0.39999999999999997 ], "contribution_avg": [ 2.4, 0.4898979485566356 ], "presentation_avg": [ 3.2, 0.39999999999999997 ], "wc_summary_avg": [ 78.8, 28.045677028732964 ], "wc_strengths_avg": [ 60.0, 18.2208671582886 ], "wc_weaknesses_avg": [ 81.0, 53.80334562088124 ], "wc_questions_avg": [ 80.2, 101.85951109248464 ], "wc_review_avg": [ 300.0, 163.3927782981855 ], "wc_reply_reviewers_avg": [ 6.4, 8.2365041127896 ], "wc_reply_authors_avg": [ 475.2, 269.88768034128566 ], "reply_reviewers_avg": [ 0.4, 0.48989794855663565 ], "reply_authors_avg": [ 1.6, 0.8 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": 0.21821789023599236, "gs_citation": -1, "gs_cited_by_link": "", "gs_version_total": -1, "aff_unique_index": "0;0;0;0;0;0;1", "aff_unique_norm": "University of Texas at Austin;Harvard University", "aff_unique_dep": ";", "aff_unique_url": "https://www.utexas.edu;https://www.harvard.edu", "aff_unique_abbr": "UT Austin;Harvard", "aff_campus_unique_index": "0;0;0;0;0;0", "aff_campus_unique": "Austin;", "aff_country_unique_index": "0;0;0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "76gh3RShsM", "title": "Mastering Pixel-Based Reinforcement Learning via Positive Unlabeled Policy-Guided Contrast", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Real-world reinforcement learning has received a significant amount of attention very recently. A fundamental yet challenging problem in this learning paradigm is perceiving real-world environmental information, such that \\textit{pixel-based} reinforcement learning emerges, which aims to learn representation from visual observations for policy optimization. In this article, we profoundly elaborate the frameworks of benchmark methods and demonstrate a long-standing \\textit{paradox} challenging current methods: in different training phases, exploring visual semantic information can improve and prevent the performance of the learned feature representations from improving. In practice, we further disclose that the over-redundancy issue generally halts the rise of sample efficiency among baseline methods. To remedy the uncovered deficiency of existing methods, we introduce a novel plug-and-play method for pixel-based reinforcement learning. Our model involves the \\textit{positive unlabeled policy-guided contrast} to learn jointly anti-redundant and policy-optimization-relevant visual semantic information during training. To sufficiently elucidate the proposed method's innate superiority, we revisit the pixel-based reinforcement learning paradigm from the information theory perspective. The theoretical evidence proves that the proposed model can achieve the tighter lower bound of the mutual information between the policy optimization-related information and the information of the representation derived by the encoder. 
To carry out the evaluation of our model, we conduct extensive benchmark experiments and illustrate the superior performance of our method over existing methods with respect to the pixel observation environments.", "keywords": "Pixel Observation;Reinforcement Learning;Self-Supervised Learning;Contrastive Learning;Visual Control Task", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/72c7b9ced0ccba72249d24204c2a5a1ccca8ca69.zip", "author": "Zehua Zang;Jiangmeng Li;Chuxiong Sun;Jiabao Li;Rui Wang;Lixiang Liu;Fuchun Sun", "authorids": "~Zehua_Zang1;~Jiangmeng_Li1;~Chuxiong_Sun2;~Jiabao_Li2;~Rui_Wang8;~Lixiang_Liu1;~Fuchun_Sun1", "gender": "M;M;;M;F;M;M", "homepage": "https://github.com/ZangZehua;https://jiangmengli.github.io/;;;;https://people.ucas.ac.cn/~liulx;https://www.cs.tsinghua.edu.cn/info/1121/3555.htm", "dblp": "364/6601;293/0997;214/9412;;06/2293;;", "google_scholar": "PWj9Zk8AAAAJ;https://scholar.google.com.sg/citations?user=-kU4VLcAAAAJ;;;;;", "orcid": "0000-0001-8969-3218;0000-0002-3376-1522;0000-0002-4956-6924;0009-0005-4456-3547;0000-0001-5369-9116;;", "linkedin": ";jiangmeng-li-86aaa7125/;;;;;", "or_profile": "~Zehua_Zang1;~Jiangmeng_Li1;~Chuxiong_Sun2;~Jiabao_Li2;~Rui_Wang8;~Lixiang_Liu1;~Fuchun_Sun1", "aff": "Institute of Software Chinese Academy of Sciences;Institute of Software, Chinese Academy of Sciences;Chinese Academy of Sciences, Institute of Software;University of Science and Technology Beijing;;University of Chinese Academy of Sciences;Tsinghua University", "aff_domain": "iscas.ac.cn;iscas.ac.cn;iscas.ac.cn;ustb.edu.cn;;ucas.ac.cn;cs.tsinghua.edu.cn", "position": "PhD student;Assistant Professor;Postdoc;MS student;;Full Professor;Full Professor", "bibtex": "@misc{\nzang2024mastering,\ntitle={Mastering Pixel-Based Reinforcement Learning via Positive Unlabeled Policy-Guided Contrast},\nauthor={Zehua Zang and Jiangmeng Li and Chuxiong Sun and Jiabao Li and Rui Wang and Lixiang Liu and Fuchun Sun},\nyear={2024},\nurl={https://openreview.net/forum?id=76gh3RShsM}\n}", "github": "", "project": "", "reviewers": "LKxU;E7VW;bVmG;kGtJ", "site": "https://openreview.net/forum?id=76gh3RShsM", "pdf_size": 3764375, "rating": "1;5;5;5", "confidence": "4;4;2;3", "soundness": "1;3;3;2", "contribution": "1;2;2;2", "presentation": "1;3;1;2", "wc_summary": "67;86;62;14", "wc_strengths": "8;37;67;14", "wc_weaknesses": "371;267;90;144", "wc_questions": "5;20;35;6", "wc_review": "451;410;254;178", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.0, 1.7320508075688772 ], "confidence_avg": [ 3.25, 0.82915619758885 ], "soundness_avg": [ 2.25, 0.82915619758885 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 1.75, 0.82915619758885 ], "wc_summary_avg": [ 57.25, 26.52710877574109 ], "wc_strengths_avg": [ 31.5, 23.178653972998518 ], "wc_weaknesses_avg": [ 218.0, 109.16730279712877 ], "wc_questions_avg": [ 16.5, 12.216791722870616 ], "wc_review_avg": [ 323.25, 111.51092995756066 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.5222329678670935, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:_fwTQk54De0J:scholar.google.com/&scioq=Mastering+Pixel-Based+Reinforcement+Learning+via+Positive+Unlabeled+Policy-Guided+Contrast&hl=en&as_sdt=0,5", 
"gs_version_total": 0, "aff_unique_index": "0;0;0;1;2;3", "aff_unique_norm": "Chinese Academy of Sciences;University of Science and Technology Beijing;University of Chinese Academy of Sciences;Tsinghua University", "aff_unique_dep": "Institute of Software;;;", "aff_unique_url": "http://www.is.cas.cn;http://www.ustb.edu.cn;http://www.ucas.ac.cn;https://www.tsinghua.edu.cn", "aff_unique_abbr": "CAS;USTB;UCAS;THU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "China" }, { "title": "RetroBridge: Modeling Retrosynthesis with Markov Bridges", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19375", "id": "770DetV8He", "author_site": "Ilia Igashov, Arne Schneuing, Marwin Segler, Michael Bronstein, Bruno Correia", "tldr": "", "abstract": "Retrosynthesis planning is a fundamental challenge in chemistry which aims at designing multi-step reaction pathways from commercially available starting materials to a target molecule. Each step in multi-step retrosynthesis planning requires accurate prediction of possible precursor molecules given the target molecule and confidence estimates to guide heuristic search algorithms. We model single-step retrosynthesis as a distribution learning problem in a discrete state space. First, we introduce the Markov Bridge Model, a generative framework aimed to approximate the dependency between two intractable discrete distributions accessible via a finite sample of coupled data points. Our framework is based on the concept of a Markov bridge, a Markov process pinned at its endpoints. Unlike diffusion-based methods, our Markov Bridge Model does not need a tractable noise distribution as a sampling proxy and directly operates on the input product molecules as samples from the intractable prior distribution. We then address the retrosynthesis planning problem with our novel framework and introduce RetroBridge, a template-free retrosynthesis modeling approach that achieves state-of-the-art results on standard evaluation benchmarks.", "keywords": "Retrosynthesis;Reactions;Chemistry;Drug Discovery;Markov Bridge", "primary_area": "applications to physical sciences (physics, chemistry, biology, etc.)", "supplementary_material": "/attachment/5425ef5b68639ce9c53f9c8ea9f651d33a1ddbfe.zip", "author": "Ilia Igashov;Arne Schneuing;Marwin Segler;Michael M. Bronstein;Bruno Correia", "authorids": "~Ilia_Igashov1;~Arne_Schneuing1;~Marwin_Segler2;~Michael_M._Bronstein1;~Bruno_Correia1", "gender": "M;Not Specified;M;M;", "homepage": "https://igashov.github.io;https://people.epfl.ch/arne.schneuing?lang=en;http://www.inf.usi.ch/bronstein/;https://people.epfl.ch/bruno.correia/?lang=en;", "dblp": "278/8797;;07/2668;;185/0993", "google_scholar": "ruubko4AAAAJ;lya44IUAAAAJ;UU3N6-UAAAAJ;https://scholar.google.ch/citations?user=Va246xYAAAAJ;imsL94QAAAAJ", "orcid": "0000-0002-6214-2827;0009-0000-9924-6921;;;", "linkedin": ";;mbronstein/;;", "or_profile": "~Ilia_Igashov1;~Arne_Schneuing1;~Michael_M._Bronstein1;~Bruno_Correia1;~Marwin_Segler1", "aff": "EPFL - EPF Lausanne;Microsoft;University of Oxford;;Microsoft", "aff_domain": "epfl.ch;microsoft.com;ox.ac.uk;;microsoft.com", "position": "PhD student;Intern;Full Professor;;Researcher", "bibtex": "@inproceedings{\nigashov2024retrobridge,\ntitle={RetroBridge: Modeling Retrosynthesis with Markov Bridges},\nauthor={Ilia Igashov and Arne Schneuing and Marwin Segler and Michael M. 
Bronstein and Bruno Correia},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=770DetV8He}\n}", "github": "", "project": "", "reviewers": "CFGE;vNHE;g93h;4mon", "pdf_size": 4535773, "rating": "6;6;8;8", "confidence": "3;5;4;4", "soundness": "3;3;3;4", "contribution": "2;3;4;3", "presentation": "4;2;3;3", "wc_summary": "25;44;58;91", "wc_strengths": "39;59;53;113", "wc_weaknesses": "113;90;47;69", "wc_questions": "189;55;2;36", "wc_review": "366;248;160;309", "wc_reply_reviewers": "84;0;32;18", "wc_reply_authors": "1532;845;214;469", "reply_reviewers": "1;0;1;1", "reply_authors": "3;2;1;2", "rating_avg": [ 7.0, 1.0 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 3.0, 0.7071067811865476 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 54.5, 24.109126902482387 ], "wc_strengths_avg": [ 66.0, 28.089143810376278 ], "wc_weaknesses_avg": [ 79.75, 24.488517717493643 ], "wc_questions_avg": [ 70.5, 71.00176054155277 ], "wc_review_avg": [ 270.75, 76.35239027037726 ], "wc_reply_reviewers_avg": [ 33.5, 31.284980421921315 ], "wc_reply_authors_avg": [ 765.0, 496.46399668052464 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 2.0, 0.7071067811865476 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 28, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=8692592874490665610&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=770DetV8He", "pdf": "https://openreview.net/pdf?id=770DetV8He", "email": "epfl.ch;microsoft.com;ox.ac.uk;;microsoft.com", "author_num": 5, "aff_unique_index": "0;1;2;1", "aff_unique_norm": "EPFL;Microsoft;University of Oxford", "aff_unique_dep": ";Microsoft Corporation;", "aff_unique_url": "https://www.epfl.ch;https://www.microsoft.com;https://www.ox.ac.uk", "aff_unique_abbr": "EPFL;Microsoft;Oxford", "aff_campus_unique_index": "0", "aff_campus_unique": "Lausanne;", "aff_country_unique_index": "0;1;2;1", "aff_country_unique": "Switzerland;United States;United Kingdom" }, { "id": "774elYc5tw", "title": "Unlocking Anticipatory Text Generation: A Constrained Approach for Faithful Decoding with Large Language Models", "track": "main", "status": "Reject", "tldr": "", "abstract": "Large Language Models (LLMs) have demonstrated a powerful ability for text generation. However, achieving optimal results with a given prompt or instruction can be challenging, especially for billion-sized models. Additionally, undesired behaviors such as toxicity or hallucinations can manifest. While much larger models (e.g., ChatGPT) may demonstrate strength in mitigating these issues, there is still no guarantee of complete prevention. In this work, we propose formalizing text generation as a future-constrained generation problem to minimize undesirable behaviors and enforce faithfulness to instructions. The estimation of future constraint satisfaction, accomplished using LLMs, guides the text generation process. 
Our extensive experiments demonstrate the effectiveness of the proposed approach across three distinct text generation tasks: keyword-constrained generation (Lin et al., 2020), toxicity reduction (Gehman et al., 2020), and factual correctness in question-answering (Gao et al., 2023).", "keywords": "LLM decoding;keyword-constrained generation;toxicity reduction;factual correctness", "primary_area": "generative models", "supplementary_material": "", "author": "Lifu Tu;Semih Yavuz;Jin Qu;Jiacheng Xu;Rui Meng;Caiming Xiong;Yingbo Zhou", "authorids": "~Lifu_Tu1;~Semih_Yavuz1;~Jin_Qu1;~Jiacheng_Xu2;~Rui_Meng1;~Caiming_Xiong1;~Yingbo_Zhou1", "gender": "M;M;M;M;M;;M", "homepage": "http://ttic.uchicago.edu/~lifu/;;https://jiacheng-xu.github.io/;http://memray.me;http://cmxiong.com/;;", "dblp": "176/5280.html;;188/6025;;80/7282;72/8614;", "google_scholar": ";;yfbcnfUAAAAJ;s6h8L_UAAAAJ;vaSdahkAAAAJ;H_6RQ7oAAAAJ;krh3p8AAAAAJ", "orcid": ";;;0000-0001-5583-4924;;;", "linkedin": ";jin-qu/;;memray/;caiming-xiong-150a1417;yingbozhou/;semih-yavuz-4303518b", "or_profile": "~Lifu_Tu1;~Jin_Qu1;~Jiacheng_Xu2;~Rui_Meng1;~Caiming_Xiong1;~Yingbo_Zhou1;~Semih_Yavuz2", "aff": "Salesforce AI Research;Salesforce AI Research;SalesForce.com;Salesforce Research;Salesforce Research;Salesforce Research;SalesForce.com", "aff_domain": "salesforce.com;salesforce.com;salesforce.com;salesforce.com;salesforce.com;salesforce.com;salesforce.com", "position": "research scientist;Researcher;Researcher;Researcher;Research Scientist;Research Scientist;Research Scientist", "bibtex": "@misc{\ntu2024unlocking,\ntitle={Unlocking Anticipatory Text Generation: A Constrained Approach for Faithful Decoding with Large Language Models},\nauthor={Lifu Tu and Semih Yavuz and Jin Qu and Jiacheng Xu and Rui Meng and Caiming Xiong and Yingbo Zhou},\nyear={2024},\nurl={https://openreview.net/forum?id=774elYc5tw}\n}", "github": "", "project": "", "reviewers": "Ht7A;eM49;h9Ue;cGVr", "site": "https://openreview.net/forum?id=774elYc5tw", "pdf_size": 702047, "rating": "3;3;5;6", "confidence": "4;3;4;3", "soundness": "2;2;3;3", "contribution": "2;4;3;2", "presentation": "1;1;3;3", "wc_summary": "111;100;34;94", "wc_strengths": "82;40;88;12", "wc_weaknesses": "258;271;90;25", "wc_questions": "1;12;1;45", "wc_review": "452;423;213;176", "wc_reply_reviewers": "0;49;10;6", "wc_reply_authors": "514;276;327;332", "reply_reviewers": "0;1;1;1", "reply_authors": "2;2;2;2", "rating_avg": [ 4.25, 1.299038105676658 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.75, 0.82915619758885 ], "presentation_avg": [ 2.0, 1.0 ], "wc_summary_avg": [ 84.75, 29.92803869283786 ], "wc_strengths_avg": [ 55.5, 31.188940347501386 ], "wc_weaknesses_avg": [ 161.0, 106.12021485089446 ], "wc_questions_avg": [ 14.75, 18.0329559418305 ], "wc_review_avg": [ 316.0, 122.63156200587188 ], "wc_reply_reviewers_avg": [ 16.25, 19.240257274787155 ], "wc_reply_authors_avg": [ 362.25, 90.31161331744661 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 2.0, 0.0 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.19245008972987526, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=2262832977763853226&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 2, "aff_unique_index": "0;0;0;0;0;0;0", "aff_unique_norm": "Salesforce", "aff_unique_dep": "Salesforce AI Research", "aff_unique_url": "https://www.salesforce.com", "aff_unique_abbr": "Salesforce AI", "aff_campus_unique_index": 
"", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0;0", "aff_country_unique": "United States" }, { "title": "Exploring the Common Appearance-Boundary Adaptation for Nighttime Optical Flow", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19374", "id": "776lhoaulC", "author_site": "Hanyu Zhou, Yi Chang, Haoyue Liu, YAN WENDING, Yuxing Duan, Zhiwei Shi, Luxin Yan", "tldr": "", "abstract": "We investigate a challenging task of nighttime optical flow, which suffers from weakened texture and amplified noise. These degradations weaken discriminative visual features, thus causing invalid motion feature matching. Typically, existing methods employ domain adaptation to transfer knowledge from auxiliary domain to nighttime domain in either input visual space or output motion space. However, this direct adaptation is ineffective, since there exists a large domain gap due to the intrinsic heterogeneous nature of the feature representations between auxiliary and nighttime domains. To overcome this issue, we explore a common-latent space as the intermediate bridge to reinforce the feature alignment between auxiliary and nighttime domains. In this work, we exploit two auxiliary daytime and event domains, and propose a novel common appearance-boundary adaptation framework for nighttime optical flow. In appearance adaptation, we employ the intrinsic image decomposition to embed the auxiliary daytime image and the nighttime image into a reflectance-aligned common space. We discover that motion distributions of the two reflectance maps are very similar, benefiting us to consistently transfer motion appearance knowledge from daytime to nighttime domain. In boundary adaptation, we theoretically derive the motion correlation formula between nighttime image and accumulated events within a spatiotemporal gradient-aligned common space. We figure out that the correlation of the two spatiotemporal gradient maps shares significant discrepancy, benefitting us to contrastively transfer boundary knowledge from event to nighttime domain. Moreover, appearance adaptation and boundary adaptation are complementary to each other, since they could jointly transfer global motion and local boundary knowledge to the nighttime domain. 
Extensive experiments have been performed to verify the superiority of the proposed method.", "keywords": "nighttime optical flow;event camera;domain adaptation;common space", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "/attachment/135190ac7fe30de3e806610e290c0c8d4bd76b47.zip", "author": "Hanyu Zhou;Yi Chang;Haoyue Liu;YAN WENDING;Yuxing Duan;Zhiwei Shi;Luxin Yan", "authorids": "~Hanyu_Zhou1;~Yi_Chang2;~Haoyue_Liu1;~YAN_WENDING1;~Yuxing_Duan1;~Zhiwei_Shi2;~Luxin_Yan2", "gender": "M;M;M;M;M;M;M", "homepage": "https://hyzhouboy.github.io/;https://github.com/Liu-haoyue;;;https://alex-code-hust.github.io/Alex.github.io/;http://faculty.hust.edu.cn/yanluxin/en/index.htm;https://owuchangyuo.github.io/", "dblp": "262/5105;200/2303;262/3827;335/6783;;81/9161;02/5438-2", "google_scholar": "bRXguCgAAAAJ;;;Hn5oJJsAAAAJ;;https://scholar.google.com/citations?hl=zh-CN;https://scholar.google.com.hk/citations?user=I1nZ67YAAAAJ", "orcid": "0009-0007-1986-4975;;0000-0001-5993-8405;;;;0000-0001-8542-5937", "linkedin": "hanyu-zhou-0b67b3274/;;;;louis-alex-2530a4287/;;", "or_profile": "~Hanyu_Zhou1;~Haoyue_Liu1;~YAN_WENDING1;~Yuxing_Duan1;~Zhiwei_Shi2;~Luxin_Yan2;~Yi_Chang3", "aff": "Huazhong University of Science and Technology;Huazhong University of Science and Technology;Huawei Technologies Ltd.;Huazhong University of Science and Technology;Huazhong University of Science and Technology;Huazhong University of Science and Technology;Huazhong University of Science and Technology", "aff_domain": "hust.edu.cn;hust.edu.cn;huawei.com;hust.edu.cn;hust.edu.cn;hust.edu.cn;hust.edu.cn", "position": "PhD student;PhD student;Researcher;PhD student;MS student;Full Professor;Associate Professor", "bibtex": "@inproceedings{\nzhou2024exploring,\ntitle={Exploring the Common Appearance-Boundary Adaptation for Nighttime Optical Flow},\nauthor={Hanyu Zhou and Yi Chang and Haoyue Liu and YAN WENDING and Yuxing Duan and Zhiwei Shi and Luxin Yan},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=776lhoaulC}\n}", "github": "", "project": "", "reviewers": "koka;hzUU;R9ad", "pdf_size": 20187515, "rating": "6;8;10", "confidence": "4;2;3", "soundness": "3;3;3", "contribution": "3;3;4", "presentation": "3;4;4", "wc_summary": "97;63;87", "wc_strengths": "50;43;77", "wc_weaknesses": "57;23;43", "wc_questions": "74;13;6", "wc_review": "278;142;213", "wc_reply_reviewers": "0;0;19", "wc_reply_authors": "1335;313;321", "reply_reviewers": "0;0;1", "reply_authors": "4;3;4", "rating_avg": [ 8.0, 1.632993161855452 ], "confidence_avg": [ 3.0, 0.816496580927726 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 3.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 3.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 82.33333333333333, 14.2672897060218 ], "wc_strengths_avg": [ 56.666666666666664, 14.65908895153068 ], "wc_weaknesses_avg": [ 41.0, 13.9522996909709 ], "wc_questions_avg": [ 31.0, 30.539591789456953 ], "wc_review_avg": [ 211.0, 55.53977553669682 ], "wc_reply_reviewers_avg": [ 6.333333333333333, 8.956685895029603 ], "wc_reply_authors_avg": [ 656.3333333333334, 479.9009156991565 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 3.6666666666666665, 0.4714045207910317 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.5, "gs_citation": 3, "gs_cited_by_link": 
"https://scholar.google.com/scholar?cites=8075682768590297256&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=776lhoaulC", "pdf": "https://openreview.net/pdf?id=776lhoaulC", "email": "hust.edu.cn;hust.edu.cn;huawei.com;hust.edu.cn;hust.edu.cn;hust.edu.cn;hust.edu.cn", "author_num": 7, "aff_unique_index": "0;0;1;0;0;0;0", "aff_unique_norm": "Huazhong University of Science and Technology;Huawei", "aff_unique_dep": ";Huawei Technologies", "aff_unique_url": "http://www.hust.edu.cn;https://www.huawei.com", "aff_unique_abbr": "HUST;Huawei", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0;0", "aff_country_unique": "China" }, { "id": "77N93tc3o5", "title": "Deep Independent Vector Analysis", "track": "main", "status": "Reject", "tldr": "", "abstract": "We introduce a deep multivariate latent variable model, Deep Independent Vector Analysis (DeepIVA), for learning linked and identifiable disentangled representations across multiple data modalities by unifying multidataset independent subspace analysis (MISA) and identifiable variational autoencoders (iVAE). DeepIVA aims to leverage hidden linkage information via the MISA loss to attain latent cross-modal alignment while leveraging the identifiability properties of the iVAE to ensure proper unimodal disentanglement. We propose a more strict set of performance measures, and demonstrate that DeepIVA can successfully recover nonlinearly mixed multimodal sources on multiple linked synthetic datasets compared with iVAE and MISA. We then apply DeepIVA on a large multimodal neuroimaging dataset, and show that DeepIVA can reveal linked nonlinear imaging sources associated with phenotype measures including age and sex.", "keywords": "multimodal fusion;nonlinear IVA;MISA;iVAE", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/c0e99dfac4f06706f29dd4a4b13a869df51ec49d.pdf", "author": "Xinhui Li;Rogers F Silva;Vince Calhoun", "authorids": "~Xinhui_Li2;~Rogers_F_Silva1;~Vince_Calhoun1", "gender": "F;M;", "homepage": "https://xinhuili.github.io/;https://trendscenter.org/rogers-silva/;", "dblp": ";154/4305;48/3821.html", "google_scholar": "YKtWorEAAAAJ;cMtwwG8AAAAJ;WNOoGKIAAAAJ", "orcid": "0000-0001-5604-9493;0000-0002-7271-1288;", "linkedin": "xinhui-li/;rogersfsilva;", "or_profile": "~Xinhui_Li2;~Rogers_F_Silva1;~Vince_Calhoun1", "aff": "Georgia Institute of Technology;TReNDS Center (Georgia State University, Georgia Institute of Technology, Emory University);Emory University", "aff_domain": "gatech.edu;gsu.edu;emory.edu", "position": "PhD student;Researcher;Full Professor", "bibtex": "@misc{\nli2024deep,\ntitle={Deep Independent Vector Analysis},\nauthor={Xinhui Li and Rogers F Silva and Vince Calhoun},\nyear={2024},\nurl={https://openreview.net/forum?id=77N93tc3o5}\n}", "github": "", "project": "", "reviewers": "Uwfa;FDhN;queK;dLxh", "site": "https://openreview.net/forum?id=77N93tc3o5", "pdf_size": 17338729, "rating": "3;5;5;5", "confidence": "4;2;3;4", "soundness": "2;2;3;1", "contribution": "2;2;2;1", "presentation": "2;3;3;2", "wc_summary": "55;89;70;44", "wc_strengths": "5;70;138;24", "wc_weaknesses": "130;66;160;207", "wc_questions": "37;100;169;556", "wc_review": "227;325;537;831", "wc_reply_reviewers": "46;19;66;784", "wc_reply_authors": "608;312;1133;1506", "reply_reviewers": "1;1;1;2", "reply_authors": "2;1;3;4", "rating_avg": [ 4.5, 0.8660254037844386 ], 
"confidence_avg": [ 3.25, 0.82915619758885 ], "soundness_avg": [ 2.0, 0.7071067811865476 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 64.5, 16.889345754054535 ], "wc_strengths_avg": [ 59.25, 51.24146270355678 ], "wc_weaknesses_avg": [ 140.75, 51.143792389692806 ], "wc_questions_avg": [ 215.5, 202.055066751616 ], "wc_review_avg": [ 480.0, 231.56208670678367 ], "wc_reply_reviewers_avg": [ 228.75, 321.00730131883296 ], "wc_reply_authors_avg": [ 889.75, 461.5497670890973 ], "reply_reviewers_avg": [ 1.25, 0.4330127018922193 ], "reply_authors_avg": [ 2.5, 1.118033988749895 ], "replies_avg": [ 21, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.5222329678670935, "gs_citation": -1, "gs_cited_by_link": "", "gs_version_total": -1, "aff_unique_index": "0;1;2", "aff_unique_norm": "Georgia Institute of Technology;Georgia State University;Emory University", "aff_unique_dep": ";TReNDS Center;", "aff_unique_url": "https://www.gatech.edu;https://www.gsu.edu;https://www.emory.edu", "aff_unique_abbr": "Georgia Tech;GSU;Emory", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "78Fp8ac3Hi", "title": "Violence Detection and Localization in Video Through Subgroup Analysis", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "In an era of rapid technological advancements, computer systems play a crucial role in early Violence Detection (VD) and localization, which is critical for timely human intervention. However, existing VD methods often fall short, lacking applicability to surveillance data, and failing to address the localization and social dimension of violent events.\nTo address these shortcomings, we propose a novel approach to integrate social subgroups into VD. Our method recognizes and tracks subgroups across frames, providing an additional layer of information in VD. This enables the system to not only detect violence at video-level, but also to identify the groups involved. This adaptable add-on module can enhance the applicability of existing models and algorithms.\nThrough extensive experiments on the SCFD and RWF-2000 surveillance datasets, we find that our approach improves social awareness in VD by localizing the people involved in an act of violence. The system offers a small performance boost on the SCFD dataset and maintains performance on RWF-2000, reaching 91.3% and 87.2% accuracy respectively, demonstrating its practical utility while performing close to state-of-the-art methods. 
Furthermore, our method generalizes well to unseen datasets, marking a promising advance in early VD.", "keywords": "violence detection;violence localization;subgroup analysis;subgroup tracking", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Emmeke A Veltmeijer;Morris E Franken;Charlotte Gerritsen", "authorids": "~Emmeke_A_Veltmeijer1;~Morris_E_Franken1;~Charlotte_Gerritsen1", "gender": "F;;F", "homepage": ";;https://charlottegerritsen.com/", "dblp": "252/8837.html;;", "google_scholar": "Gg3kiW0AAAAJ;;", "orcid": "0000-0002-0749-4520;;", "linkedin": "emmeke-veltmeijer-70730214b/;;", "or_profile": "~Emmeke_A_Veltmeijer1;~Morris_E_Franken1;~Charlotte_Gerritsen1", "aff": "Vrije Universiteit Amsterdam;;Vrije Universiteit Amsterdam", "aff_domain": "vu.nl;;vu.nl", "position": "PhD student;;Associate Professor", "bibtex": "@misc{\nveltmeijer2024violence,\ntitle={Violence Detection and Localization in Video Through Subgroup Analysis},\nauthor={Emmeke A Veltmeijer and Morris E Franken and Charlotte Gerritsen},\nyear={2024},\nurl={https://openreview.net/forum?id=78Fp8ac3Hi}\n}", "github": "", "project": "", "reviewers": "WPpq;n6jP;u3A5;bXAa", "site": "https://openreview.net/forum?id=78Fp8ac3Hi", "pdf_size": 6067759, "rating": "3;3;5;5", "confidence": "4;4;3;4", "soundness": "2;2;2;3", "contribution": "3;2;2;2", "presentation": "2;3;2;3", "wc_summary": "182;68;39;48", "wc_strengths": "37;19;23;34", "wc_weaknesses": "108;180;183;86", "wc_questions": "43;69;105;9", "wc_review": "370;336;350;177", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 84.25, 57.40372374680932 ], "wc_strengths_avg": [ 28.25, 7.46240577829965 ], "wc_weaknesses_avg": [ 139.25, 42.97310205233036 ], "wc_questions_avg": [ 56.5, 35.16745654721137 ], "wc_review_avg": [ 308.25, 76.73452612742194 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:AWz-xtCHgQcJ:scholar.google.com/&scioq=Violence+Detection+and+Localization+in+Video+Through+Subgroup+Analysis&hl=en&as_sdt=0,14", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "Vrije Universiteit Amsterdam", "aff_unique_dep": "", "aff_unique_url": "https://www.vu.nl", "aff_unique_abbr": "VU Amsterdam", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "Netherlands" }, { "title": "Mirage: Model-agnostic Graph Distillation for Graph Classification", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19373", "id": "78iGZdqxYY", "author_site": "Mridul Gupta, Sahil Manchanda, HARIPRASAD KODAMANA, Sayan Ranu", "tldr": "", "abstract": "GNNs, like other deep learning models, are data and computation hungry. There is a pressing need to scale training of GNNs on large datasets to enable their usage in low-resource environments.
Graph distillation is an effort in that direction with the aim to construct a smaller synthetic training set from the original training data without significantly compromising model performance. While initial efforts are promising, this work is motivated by two key observations: (1) Existing graph distillation algorithms themselves rely on training with the full dataset, which undermines the very premise of graph distillation. (2) The distillation process is specific to the target GNN architecture and hyper-parameters and thus not robust to changes in the modeling pipeline. We circumvent these limitations by designing a distillation algorithm called MIRAGE for graph classification. MIRAGE is built on the insight that a message-passing GNN decomposes the input graph into a multiset of computation trees. Furthermore, the frequency distribution of computation trees is often skewed in nature, enabling us to condense this data into a concise distilled summary. By compressing the computation data itself, as opposed to emulating gradient flows on the original training set\u2014a prevalent approach to date\u2014MIRAGE transforms into an unsupervised and architecture-agnostic distillation algorithm. Extensive benchmarking on real-world datasets underscores MIRAGE\u2019s superiority, showcasing enhanced generalization accuracy, data compression, and distillation efficiency when compared to state-of-the-art baselines.", "keywords": "graph distillation;graph classification;frequent pattern mining", "primary_area": "learning on graphs and other geometries & topologies", "supplementary_material": "", "author": "Mridul Gupta;Sahil Manchanda;HARIPRASAD KODAMANA;Sayan Ranu", "authorids": "~Mridul_Gupta2;~Sahil_Manchanda1;~HARIPRASAD_KODAMANA1;~Sayan_Ranu2", "gender": "M;M;M;M", "homepage": "https://web.iitd.ac.in/~aiz218322;https://www.cse.iitd.ac.in/~sahilm;https://web.iitd.ac.in/~kodamana/;https://www.cse.iitd.ac.in/~sayan/index.html", "dblp": ";200/8052;;38/768", "google_scholar": "g_cTs3YAAAAJ;OPyjQHwAAAAJ;https://scholar.google.co.in/citations?user=YBcs36wAAAAJ;K4w5qYUAAAAJ", "orcid": "0009-0003-4343-4263;0000-0001-7437-9891;;0000-0003-4147-9372", "linkedin": "mridul1618/;;;", "or_profile": "~Mridul_Gupta2;~Sahil_Manchanda1;~HARIPRASAD_KODAMANA1;~Sayan_Ranu2", "aff": "Indian Institute of Technology, Delhi;Indian Institute of Technology Delhi;Indian Institute of Technology, Delhi;Indian Institute of Technology Delhi", "aff_domain": "iitd.ac.in;iitd.ac.in;iitd.ac.in;iitd.ac.in", "position": "PhD student;PhD student;Associate Professor;Associate Professor", "bibtex": "@inproceedings{\ngupta2024mirage,\ntitle={Mirage: Model-agnostic Graph Distillation for Graph Classification},\nauthor={Mridul Gupta and Sahil Manchanda and HARIPRASAD KODAMANA and Sayan Ranu},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=78iGZdqxYY}\n}", "github": "", "project": "", "reviewers": "XL6A;yzvf;pdUR;2KBE", "pdf_size": 2107733, "rating": "6;6;6;6", "confidence": "3;4;4;3", "soundness": "3;3;3;3", "contribution": "2;3;4;2", "presentation": "3;3;3;3", "wc_summary": "90;132;63;87", "wc_strengths": "54;73;72;45", "wc_weaknesses": "10;132;164;428", "wc_questions": "67;44;23;5", "wc_review": "221;381;322;565", "wc_reply_reviewers": "0;10;15;11", "wc_reply_authors": "702;1251;1406;2160", "reply_reviewers": "0;1;1;1", "reply_authors": "4;2;3;7", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 3.0, 0.0 ], 
"contribution_avg": [ 2.75, 0.82915619758885 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 93.0, 24.829418035870273 ], "wc_strengths_avg": [ 61.0, 11.937336386313323 ], "wc_weaknesses_avg": [ 183.5, 152.40980939558975 ], "wc_questions_avg": [ 34.75, 23.177305710543667 ], "wc_review_avg": [ 372.25, 125.13068168918444 ], "wc_reply_reviewers_avg": [ 9.0, 5.522680508593631 ], "wc_reply_authors_avg": [ 1379.75, 520.9128405981177 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 4.0, 1.8708286933869707 ], "replies_avg": [ 30, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 16, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14231408030950146569&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=78iGZdqxYY", "pdf": "https://openreview.net/pdf?id=78iGZdqxYY", "email": "iitd.ac.in;iitd.ac.in;iitd.ac.in;iitd.ac.in", "author_num": 4, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "Indian Institute of Technology Delhi", "aff_unique_dep": "", "aff_unique_url": "https://www.iitdelhi.ac.in", "aff_unique_abbr": "IIT Delhi", "aff_campus_unique_index": "0;0;0;0", "aff_campus_unique": "Delhi", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "India" }, { "title": "A Characterization Theorem for Equivariant Networks with Point-wise Activations", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19372", "id": "79FVDdfoSR", "author_site": "Marco Pacini, Xiaowen Dong, Bruno Lepri, Gabriele Santin", "tldr": "", "abstract": "Equivariant neural networks have shown improved performance, expressiveness and sample complexity on symmetrical domains. \nBut for some specific symmetries, representations, and choice of coordinates, the most common point-wise activations, such as ReLU, are not equivariant, hence they cannot be employed in the design of equivariant neural networks. \nThe theorem we present in this paper describes all possibile combinations of representations, choice of coordinates and point-wise activations to obtain an equivariant layer, generalizing and strengthening existing characterizations.\nNotable cases of practical relevance are discussed as corollaries. Indeed, we prove that rotation-equivariant networks can only be invariant, as it happens for any network which is equivariant with respect to connected compact groups. Then, we discuss implications of our findings when applied to important instances of equivariant networks. First, we completely characterize permutation equivariant networks such as Invariant Graph Networks with point-wise nonlinearities and their geometric counterparts, highlighting a plethora of models whose expressive power and performance are still unknown. 
\nSecond, we show that feature spaces of disentangled steerable convolutional neural networks are trivial representations.", "keywords": "Geometric Deep Learning;Equivariant Neural Networks;Characterization Theorem;Point-wise Activations", "primary_area": "learning on graphs and other geometries & topologies", "supplementary_material": "", "author": "Marco Pacini;Xiaowen Dong;Bruno Lepri;Gabriele Santin", "authorids": "~Marco_Pacini1;~Xiaowen_Dong1;~Bruno_Lepri1;gabriele.santin@unive.it", "gender": "M;;M;", "homepage": "https://marco-pacini.github.io/;https://web.media.mit.edu/~xdong/;;", "dblp": "213/0755;91/9827-1;99/6489;", "google_scholar": "https://scholar.google.com/citations?hl=en;_8tUq8kAAAAJ;JfcopG0AAAAJ;", "orcid": ";;0000-0003-1275-2333;", "linkedin": ";;brunolepri/?originalSubdomain=it;", "or_profile": "~Marco_Pacini1;~Xiaowen_Dong1;~Bruno_Lepri1;gabriele.santin@unive.it", "aff": "Fondazione Bruno Kessler;Massachusetts Institute of Technology;Fondazione Bruno Kessler;", "aff_domain": "fbk.eu;mit.edu;fbk.eu;", "position": "PhD student;Research Affiliate;Principal Researcher;", "bibtex": "@inproceedings{\npacini2024a,\ntitle={A Characterization Theorem for Equivariant Networks with Point-wise Activations},\nauthor={Marco Pacini and Xiaowen Dong and Bruno Lepri and Gabriele Santin},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=79FVDdfoSR}\n}", "github": "", "project": "", "reviewers": "3Kou;uXzC;merJ;sg92", "pdf_size": 342950, "rating": "6;6;8;8", "confidence": "3;2;3;3", "soundness": "3;3;3;4", "contribution": "2;2;4;3", "presentation": "2;1;3;2", "wc_summary": "57;68;85;59", "wc_strengths": "54;97;123;68", "wc_weaknesses": "296;135;135;594", "wc_questions": "45;98;73;233", "wc_review": "452;398;416;954", "wc_reply_reviewers": "16;27;17;250", "wc_reply_authors": "738;536;517;1417", "reply_reviewers": "1;1;1;1", "reply_authors": "1;1;1;2", "rating_avg": [ 7.0, 1.0 ], "confidence_avg": [ 2.75, 0.4330127018922193 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.82915619758885 ], "presentation_avg": [ 2.0, 0.7071067811865476 ], "wc_summary_avg": [ 67.25, 11.053845484717073 ], "wc_strengths_avg": [ 85.5, 26.63174797117155 ], "wc_weaknesses_avg": [ 290.0, 187.41798206148738 ], "wc_questions_avg": [ 112.25, 72.19201825686825 ], "wc_review_avg": [ 555.0, 231.18174668429165 ], "wc_reply_reviewers_avg": [ 77.5, 99.68575625434157 ], "wc_reply_authors_avg": [ 802.0, 365.47982160442183 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.5773502691896257, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10859373733821825022&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 10, "openreview": "https://openreview.net/forum?id=79FVDdfoSR", "pdf": "https://openreview.net/pdf?id=79FVDdfoSR", "email": "fbk.eu;mit.edu;fbk.eu;", "author_num": 4, "aff_unique_index": "0;1;0", "aff_unique_norm": "Fondazione Bruno Kessler;Massachusetts Institute of Technology", "aff_unique_dep": ";", "aff_unique_url": "https://www.fbk.eu;https://web.mit.edu", "aff_unique_abbr": "FBK;MIT", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;0", "aff_country_unique": "Italy;United States" }, { "title": "Designing Skill-Compatible AI: Methodologies and Frameworks in Chess", "status": "Poster", "track": "main", "site": 
"https://iclr.cc/virtual/2024/poster/19371", "id": "79rfgv3jw4", "author_site": "KARIM HAMADE, Reid McIlroy-Young, Siddhartha Sen, Jon Kleinberg, Ashton Anderson", "tldr": "", "abstract": "Powerful artificial intelligence systems are often used in settings where they must interact with agents that are computationally much weaker, for example when they work alongside humans or operate in complex environments where some tasks are handled by algorithms, heuristics, or other entities of varying computational power. For AI agents to successfully interact in these settings, however, achieving superhuman performance alone is not sufficient; they also need to account for suboptimal actions or idiosyncratic style from their less-skilled counterparts. We propose a formal evaluation framework for assessing the compatibility of near-optimal AI with interaction partners who may have much lower levels of skill; we use popular collaborative chess variants as model systems to study and develop AI agents that can successfully interact with lower-skill entities. Traditional chess engines designed to output near-optimal moves prove to be inadequate partners when paired with engines of various lower skill levels in this domain, as they are not designed to consider the presence of other agents. We contribute three methodologies to explicitly create skill-compatible AI agents in complex decision-making settings, and two chess game frameworks designed to foster collaboration between powerful AI agents and less-skilled partners. On these frameworks, our agents outperform state-of-the-art chess AI (based on AlphaZero) despite being weaker in conventional chess, demonstrating that skill-compatibility is a tangible trait that is qualitatively and measurably distinct from raw performance. 
Our evaluations further explore and clarify the mechanisms by which our agents achieve skill-compatibility.", "keywords": "Skill-AI compatibility;Agent Systems;Decision-making;Chess;Deep RL", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/d067ff4cd68eb84dc82fae7b1d69cea1c70699ea.zip", "author": "Karim Hamade;Reid McIlroy-Young;Siddhartha Sen;Jon Kleinberg;Ashton Anderson", "authorids": "~Karim_Hamade1;~Reid_McIlroy-Young1;~Siddhartha_Sen1;~Jon_Kleinberg1;~Ashton_Anderson1", "gender": "M;M;;;M", "homepage": ";https://reidmcy.com/;http://sidsen.org;http://www.cs.toronto.edu/~ashton/;http://www.cs.cornell.edu/home/kleinber/", "dblp": ";196/4704;;21/8524;https://dblp.uni-trier.de/pid/k/JonMKleinberg.html", "google_scholar": ";https://scholar.google.ca/citations?user=7Tclf3kAAAAJ;;https://scholar.google.co.uk/citations?user=FMSltawAAAAJ;VX7d5EQAAAAJ", "orcid": ";0000-0001-9104-4145;;;0000-0002-1929-2512", "linkedin": "karim-h-400143200/;;;;", "or_profile": "~Karim_Hamade1;~Reid_McIlroy-Young1;~Siddhartha_Sen1;~Ashton_Anderson1;~Jon_Kleinberg3", "aff": "Department of Computer Science, University of Toronto;Harvard University;Microsoft Research;Department of Computer Science, University of Toronto;", "aff_domain": "cs.toronto.edu;harvard.edu;research.microsoft.com;cs.toronto.edu;", "position": "MS student;Postdoc;Principal Researcher;Assistant Professor;", "bibtex": "@inproceedings{\nhamade2024designing,\ntitle={Designing Skill-Compatible {AI}: Methodologies and Frameworks in Chess},\nauthor={Karim Hamade and Reid McIlroy-Young and Siddhartha Sen and Jon Kleinberg and Ashton Anderson},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=79rfgv3jw4}\n}", "github": "", "project": "", "reviewers": "9rEp;SKaW;XZq8;D1Jx", "pdf_size": 966147, "rating": "5;6;8;8", "confidence": "3;4;4;4", "soundness": "3;3;3;3", "contribution": "3;2;3;4", "presentation": "3;3;3;3", "wc_summary": "104;73;253;139", "wc_strengths": "79;74;217;84", "wc_weaknesses": "82;282;366;65", "wc_questions": "95;16;704;92", "wc_review": "360;445;1540;380", "wc_reply_reviewers": "39;47;379;52", "wc_reply_authors": "825;420;1521;401", "reply_reviewers": "1;1;1;1", "reply_authors": "2;2;3;2", "rating_avg": [ 6.75, 1.299038105676658 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 3.0, 0.7071067811865476 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 142.25, 68.0711943482704 ], "wc_strengths_avg": [ 113.5, 59.860253925288355 ], "wc_weaknesses_avg": [ 198.75, 128.8630571575888 ], "wc_questions_avg": [ 226.75, 277.35300160625627 ], "wc_review_avg": [ 681.25, 496.7944117036745 ], "wc_reply_reviewers_avg": [ 129.25, 144.2677632043971 ], "wc_reply_authors_avg": [ 791.75, 453.8156977232057 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 2.25, 0.4330127018922193 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.7777777777777777, "gs_citation": 6, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=18109915714699930021&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=79rfgv3jw4", "pdf": "https://openreview.net/pdf?id=79rfgv3jw4", "email": "cs.toronto.edu;harvard.edu;research.microsoft.com;cs.toronto.edu;", "author_num": 5, "aff_unique_index": "0;1;2;0", "aff_unique_norm": "University of Toronto;Harvard University;Microsoft", 
"aff_unique_dep": "Department of Computer Science;;Microsoft Research", "aff_unique_url": "https://www.utoronto.ca;https://www.harvard.edu;https://www.microsoft.com/en-us/research", "aff_unique_abbr": "U of T;Harvard;MSR", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Toronto;", "aff_country_unique_index": "0;1;1;0", "aff_country_unique": "Canada;United States" }, { "id": "79tJB1eTmb", "title": "Meta-CoT: Generalizable Chain-of-Thought Prompting in Mixed-task Scenarios with Large Language Models", "track": "main", "status": "Reject", "tldr": "", "abstract": "Large language models (LLMs) have unveiled remarkable reasoning capabilities by exploiting chain-of-thought (CoT) prompting, which generates intermediate reasoning chains to serve as the rationale for deriving the answer. However, current CoT methods either simply employ general prompts such as Let\u2019s think step by step, or heavily rely on handcrafted task-specific demonstrations to attain preferable performances, thereby engendering an inescapable gap between performance and generalization. To bridge this gap, we propose Meta-CoT, a generalizable CoT prompting method in mixed-task scenarios where the type of input questions is unknown. Meta-CoT firstly categorizes the scenario based on the input question and subsequently constructs diverse demonstrations from the corresponding data pool in an automatic pattern. Meta-CoT simultaneously enjoys remarkable performances on ten public benchmark reasoning tasks and superior generalization capabilities. Notably, Meta-CoT achieves the state-of-the-art result on SVAMP (93.7%) without any additional program-aided methods. Our further experiments on five out-of-distribution datasets verify the stability and generality of Meta-CoT.", "keywords": "Chain of Thought Prompting;Large Language Models;In-context Learning;Few-shot Learning;Arithmetic Reasoning;Commonsense Reasoning;Symbolic Reasoning", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Anni Zou;Zhuosheng Zhang;hai zhao;Xiangru Tang", "authorids": "~Anni_Zou1;~Zhuosheng_Zhang1;~hai_zhao1;~Xiangru_Tang2", "gender": "F;M;M;M", "homepage": ";https://bcmi.sjtu.edu.cn/~zhangzs/;http://bcmi.sjtu.edu.cn/~zhaohai/;https://xiangrutang.github.io/", "dblp": ";06/9708;25/1145-1.html;246/8064", "google_scholar": ";https://scholar.google.co.jp/citations?user=63LTQhgAAAAJ;https://scholar.google.com.tw/citations?user=4dU5KS0AAAAJ;", "orcid": "0000-0001-6378-6475;0000-0002-4183-3645;;", "linkedin": ";;;", "or_profile": "~Anni_Zou1;~Zhuosheng_Zhang1;~hai_zhao1;~Xiangru_Tang2", "aff": "Shanghai Jiaotong University;Shanghai Jiaotong University;Shanghai Jiaotong University;Yale University", "aff_domain": "sjtu.edu.cn;sjtu.edu.cn;sjtu.edu.cn;yale.edu", "position": "MS student;Assistant Professor;Full Professor;PhD student", "bibtex": "@misc{\nzou2024metacot,\ntitle={Meta-CoT: Generalizable Chain-of-Thought Prompting in Mixed-task Scenarios with Large Language Models},\nauthor={Anni Zou and Zhuosheng Zhang and hai zhao and Xiangru Tang},\nyear={2024},\nurl={https://openreview.net/forum?id=79tJB1eTmb}\n}", "github": "", "project": "", "reviewers": "JvEc;FQzo;uTXx", "site": "https://openreview.net/forum?id=79tJB1eTmb", "pdf_size": 1538016, "rating": "3;3;3", "confidence": "5;4;4", "soundness": "2;1;2", "contribution": "1;2;2", "presentation": "3;1;2", "wc_summary": "101;76;115", "wc_strengths": "16;20;15", "wc_weaknesses": "56;109;192", "wc_questions": 
"81;57;63", "wc_review": "254;262;385", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 3.0, 0.0 ], "confidence_avg": [ 4.333333333333333, 0.4714045207910317 ], "soundness_avg": [ 1.6666666666666667, 0.4714045207910317 ], "contribution_avg": [ 1.6666666666666667, 0.4714045207910317 ], "presentation_avg": [ 2.0, 0.816496580927726 ], "wc_summary_avg": [ 97.33333333333333, 16.131404843417148 ], "wc_strengths_avg": [ 17.0, 2.160246899469287 ], "wc_weaknesses_avg": [ 119.0, 55.97023018236272 ], "wc_questions_avg": [ 67.0, 10.198039027185569 ], "wc_review_avg": [ 300.3333333333333, 59.95739227892495 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 10, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6122894346217833235&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 0, "aff_unique_index": "0;0;0;1", "aff_unique_norm": "Shanghai Jiao Tong University;Yale University", "aff_unique_dep": ";", "aff_unique_url": "https://www.sjtu.edu.cn;https://www.yale.edu", "aff_unique_abbr": "SJTU;Yale", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;1", "aff_country_unique": "China;United States" }, { "id": "7AB077M4TY", "title": "Dynamic Training Guided by Training Dynamics", "track": "main", "status": "Reject", "tldr": "", "abstract": "This paper centers around a novel concept proposed recently by researchers from the control community where the training process of a deep neural network can be considered a nonlinear dynamical system acting upon the high-dimensional weight space. Koopman operator theory, a data-driven dynamical system analysis framework, can then be deployed to discover the otherwise non-intuitive training dynamics. Different from existing approaches that mainly take advantage of the prediction capability of this framework, we take a deep dive into understanding the underlying relationship between the low-dimensional Koopman modes that describe the training dynamics and the weight evolution itself, and develop two novel strategies for speeding up model convergence in an online fashion, including 1) a gradient acceleration strategy that improves training efficiency by pushing the slowly decaying Koopman modes to decay faster, and 2) a masking strategy that drastically reduces the computational complexity of gradient acceleration by analyzing the contribution of the corresponding Koopman modes in weight reconstruction. 
These strategies offer promising insights into pursuing faster and more efficient training methodologies and improve our understanding of training dynamics to further control and inform the training process.", "keywords": "training dynamics;Deep Neural Networks;Koopman Operator", "primary_area": "optimization", "supplementary_material": "", "author": "Fanqi Wang;Landon Harris;Weisheng Tang;Hairong Qi;Dan Wilson;Igor Mezic", "authorids": "~Fanqi_Wang1;~Landon_Harris1;~Weisheng_Tang1;~Hairong_Qi1;~Dan_Wilson1;~Igor_Mezic1", "gender": "F;;M;F;M;M", "homepage": ";;;http://www.eecs.utk.edu/people/faculty/hqi/;http://volweb.utk.edu/~dwilso81;https://mgroup.me.ucsb.edu/", "dblp": ";;;00/6984-1.html;;", "google_scholar": ";;CKxchGcAAAAJ;https://scholar.google.com.tw/citations?user=GqnNG-kAAAAJ;;5d9ngqsAAAAJ", "orcid": ";;0000-0001-7307-7410;;;", "linkedin": ";;;hairong-qi-6a67602/;;", "or_profile": "~Fanqi_Wang1;~Landon_Harris1;~Weisheng_Tang1;~Hairong_Qi1;~Dan_Wilson1;~Igor_Mezic1", "aff": "University of Tennessee, Knoxville;;University of Tennessee, Knoxville;University of Tennessee, Knoxville;University of Tennessee, Knoxville;University of California, Santa Barbara", "aff_domain": "utk.edu;;utk.edu;vols.utk.edu;utk.edu;ucsb.edu", "position": "PhD student;;Postdoc;Full Professor;Assistant Professor;Full Professor", "bibtex": "@misc{\nwang2024dynamic,\ntitle={Dynamic Training Guided by Training Dynamics},\nauthor={Fanqi Wang and Landon Harris and Weisheng Tang and Hairong Qi and Dan Wilson and Igor Mezic},\nyear={2024},\nurl={https://openreview.net/forum?id=7AB077M4TY}\n}", "github": "", "project": "", "reviewers": "ptUk;xUqE;aC1Y;APZy", "site": "https://openreview.net/forum?id=7AB077M4TY", "pdf_size": 7102041, "rating": "3;3;3;5", "confidence": "3;5;3;2", "soundness": "3;2;1;3", "contribution": "1;2;2;3", "presentation": "1;2;2;3", "wc_summary": "577;94;112;77", "wc_strengths": "2;160;25;9", "wc_weaknesses": "2;526;156;145", "wc_questions": "2;13;239;37", "wc_review": "583;793;532;268", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "1195;645;1203;604", "reply_reviewers": "0;0;0;0", "reply_authors": "2;1;2;1", "rating_avg": [ 3.5, 0.8660254037844386 ], "confidence_avg": [ 3.25, 1.0897247358851685 ], "soundness_avg": [ 2.25, 0.82915619758885 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 2.0, 0.7071067811865476 ], "wc_summary_avg": [ 215.0, 209.36690282850344 ], "wc_strengths_avg": [ 49.0, 64.62584622269948 ], "wc_weaknesses_avg": [ 207.25, 193.798058555807 ], "wc_questions_avg": [ 72.75, 96.81522349300238 ], "wc_review_avg": [ 544.0, 186.97727134601146 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 911.75, 287.6294273887844 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.6622661785325219, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:Tz7f2UO3ynEJ:scholar.google.com/&scioq=Dynamic+Training+Guided+by+Training+Dynamics&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;0;0;1", "aff_unique_norm": "University of Tennessee;University of California, Santa Barbara", "aff_unique_dep": ";", "aff_unique_url": "https://www.utk.edu;https://www.ucsb.edu", "aff_unique_abbr": "UT;UCSB", "aff_campus_unique_index": "0;0;0;0;1", "aff_campus_unique": "Knoxville;Santa Barbara", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "7AS7vaVU8d", "title": "Learning 
Personalized Story Evaluation", "track": "main", "status": "Reject", "tldr": "", "abstract": "While large language models (LLMs) have shown impressive results for more objective tasks such as QA and retrieval, it remains nontrivial to evaluate their performance on open-ended text generation for reasons including (1) data contamination; (2) multi-dimensional evaluation criteria; and (3) subjectiveness stemming from reviewers\u2019 personal preferences. To address such issues, we propose to model personalization in an uncontaminated open-ended generation assessment. We create two new datasets Per-MPST and Per-DOC for personalized story evaluation, by re-purposing existing datasets with proper anonymization and new personalized labels. We further develop a personalized story evaluation model PERSE to infer reviewer preferences and provide a personalized evaluation. Specifically, given a few exemplary reviews from a particular reviewer, PERSE predicts either a detailed review or fine-grained comparison in several aspects (such as interestingness and surprise) for that reviewer on a new text input. Experimental results show that PERSE outperforms GPT-4 by 15.8% on Kendall correlation of story ratings, and by 13.7% on pairwise preference prediction accuracy. Both datasets and code will be released.", "keywords": "Open-ended Text Evaluation;Personalization;Automatic Story Evaluation", "primary_area": "generative models", "supplementary_material": "/attachment/4f28ad392c850a96d2f67fdb3dc50bf94641d766.zip", "author": "Danqing Wang;Kevin Yang;Hanlin Zhu;Xiaomeng Yang;Andrew Cohen;Lei Li;Yuandong Tian", "authorids": "~Danqing_Wang1;~Kevin_Yang2;~Hanlin_Zhu2;~Xiaomeng_Yang1;~Andrew_Cohen4;~Lei_Li11;~Yuandong_Tian1", "gender": "F;M;M;M;M;M;M", "homepage": ";https://hanlinzhu.com/;;;https://www.cs.cmu.edu/~leili;http://yuandong-tian.com;https://people.eecs.berkeley.edu/~yangk/", "dblp": "226/6524.html;;;;13/7007-5.html;t/YuandongTian;13/10565", "google_scholar": "https://scholar.google.com/citations?hl=en-US;yDVn5LEAAAAJ;t8v3JXsAAAAJ;;BYXqAlwAAAAJ;0mgEF28AAAAJ;sRpY9TIAAAAJ", "orcid": ";;0009-0007-3917-6811;;0000-0003-3095-9776;0000-0003-4202-4847;", "linkedin": ";;xiaomeng-yang-356a976b;andrew-cohen-17a7aa15b;;yuandongtian;", "or_profile": "~Danqing_Wang1;~Hanlin_Zhu2;~Xiaomeng_Yang1;~Andrew_Cohen4;~Lei_Li11;~Yuandong_Tian1;~Kevin_Yang1", "aff": "Carnegie Mellon University;Electrical Engineering & Computer Science Department, University of California Berkeley;Moonshot AI;Meta Platforms;School of Computer Science, Carnegie Mellon University;Meta AI (FAIR);Scaled Cognition", "aff_domain": "andrew.cmu.edu;eecs.berkeley.edu;msh.team;meta.com;cs.cmu.edu;meta.com;scaledcognition.com", "position": "PhD student;PhD student;Member of Technical Staff;Researcher;Assistant Professor;Research Scientist;Researcher", "bibtex": "@misc{\nwang2024learning,\ntitle={Learning Personalized Story Evaluation},\nauthor={Danqing Wang and Kevin Yang and Hanlin Zhu and Xiaomeng Yang and Andrew Cohen and Lei Li and Yuandong Tian},\nyear={2024},\nurl={https://openreview.net/forum?id=7AS7vaVU8d}\n}", "github": "", "project": "", "reviewers": "hjpK;7x1E;jhUM;9dNi", "site": "https://openreview.net/forum?id=7AS7vaVU8d", "pdf_size": 1974189, "rating": "5;5;5;8", "confidence": "4;3;4;5", "soundness": "2;2;2;3", "contribution": "2;2;3;4", "presentation": "1;1;3;3", "wc_summary": "47;55;127;117", "wc_strengths": "12;50;86;41", "wc_weaknesses": "61;230;47;63", "wc_questions": "2;171;22;397", "wc_review": "122;506;282;618", 
"wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "287;451;261;1219", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;1;2", "rating_avg": [ 5.75, 1.299038105676658 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.82915619758885 ], "presentation_avg": [ 2.0, 1.0 ], "wc_summary_avg": [ 86.5, 35.787567673704785 ], "wc_strengths_avg": [ 47.25, 26.413774815425377 ], "wc_weaknesses_avg": [ 100.25, 75.16440314404153 ], "wc_questions_avg": [ 148.0, 157.89395175243413 ], "wc_review_avg": [ 382.0, 192.79004123657424 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 554.5, 390.5032010112081 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": 0.816496580927726, "gs_citation": 18, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=15846584602882506993&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 2, "aff_unique_index": "0;1;2;3;0;3;4", "aff_unique_norm": "Carnegie Mellon University;University of California, Berkeley;Moonshot AI;Meta;Scaled Cognition", "aff_unique_dep": ";Electrical Engineering & Computer Science Department;;Meta Platforms, Inc.;", "aff_unique_url": "https://www.cmu.edu;https://www.berkeley.edu;https://moonshot.ai;https://www.meta.com;", "aff_unique_abbr": "CMU;UC Berkeley;Moonshot AI;Meta;", "aff_campus_unique_index": "1;2", "aff_campus_unique": ";Berkeley;Pittsburgh", "aff_country_unique_index": "0;0;0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "7AiPfnM73h", "title": "Projected Off-Policy Q-Learning (POP-QL) for Stabilizing Offline Reinforcement Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "A key problem in off-policy Reinforcement Learning (RL) is the mismatch, or distribution shift, between the dataset and the distribution over states and actions visited by the learned policy. This problem is exacerbated in the fully offline setting. The main approach to correct this shift has been through importance sampling, which leads to high-variance gradients. Other approaches, such as conservatism or behavior-regularization, regularize the policy at the cost of performance. In this paper, we propose a new approach for stable off-policy Q-Learning that builds on a theoretical result by Kolter (2011). Our method, Projected Off-Policy Q-Learning (POP-QL), is a novel actor-critic algorithm that simultaneously reweights off-policy samples and constrains the policy to prevent divergence and reduce value-approximation error. 
In our experiments, POP-QL not only shows competitive performance on standard benchmarks, but also out-performs competing methods in tasks where the data-collection policy is significantly sub-optimal.", "keywords": "TD learning;Off-policy RL;offline RL", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/2851abdae8899cd5ecd6e5e79858f1ab4a01d3ca.zip", "author": "Melrose Roderick;Gaurav Manek;Felix Berkenkamp;J Zico Kolter", "authorids": "~Melrose_Roderick1;~Gaurav_Manek1;~Felix_Berkenkamp1;~J_Zico_Kolter1", "gender": "M;;M;M", "homepage": "https://melroderick.github.io/;https://www.gauravmanek.com/;https://berkenkamp.me;http://www.zicokolter.com", "dblp": "181/3909;200/8866;168/8558;67/2526", "google_scholar": "PYrd2GMAAAAJ;C8Mdr2UAAAAJ;https://scholar.google.ch/citations?user=N_tCEl8AAAAJ;UXh1I6UAAAAJ", "orcid": ";;;", "linkedin": "https://linkedin.com/in/melrose-roderick-4b74b199;https://sg.linkedin.com/in/gauravmanek;berkenkamp/;", "or_profile": "~Melrose_Roderick1;~Gaurav_Manek1;~Felix_Berkenkamp1;~Zico_Kolter1", "aff": "Mila, University of Montreal;Carnegie Mellon University;Bosch;Carnegie Mellon University", "aff_domain": "mila.umontreal.ca;cmu.edu;bosch.com;cmu.edu", "position": "Postdoc;PhD student;Research Scientist;Full Professor", "bibtex": "@misc{\nroderick2024projected,\ntitle={Projected Off-Policy Q-Learning ({POP}-{QL}) for Stabilizing Offline Reinforcement Learning},\nauthor={Melrose Roderick and Gaurav Manek and Felix Berkenkamp and J Zico Kolter},\nyear={2024},\nurl={https://openreview.net/forum?id=7AiPfnM73h}\n}", "github": "", "project": "", "reviewers": "Mmg3;5Wu7;JhFx;Urdi", "site": "https://openreview.net/forum?id=7AiPfnM73h", "pdf_size": 1100123, "rating": "3;3;5;5", "confidence": "4;4;3;3", "soundness": "2;2;3;2", "contribution": "2;2;2;2", "presentation": "2;3;3;3", "wc_summary": "74;96;139;96", "wc_strengths": "25;36;38;38", "wc_weaknesses": "87;409;143;136", "wc_questions": "239;1;126;46", "wc_review": "425;542;446;316", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "413;200;268;70", "reply_reviewers": "0;0;0;0", "reply_authors": "2;1;1;1", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 101.25, 23.573024837725004 ], "wc_strengths_avg": [ 34.25, 5.402545696243577 ], "wc_weaknesses_avg": [ 193.75, 126.13360971604673 ], "wc_questions_avg": [ 103.0, 90.38528641322104 ], "wc_review_avg": [ 432.25, 80.31305933657364 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 237.75, 123.68584195452607 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -1.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:IiVP5kxbhnUJ:scholar.google.com/&scioq=Projected+Off-Policy+Q-Learning+(POP-QL)+for+Stabilizing+Offline+Reinforcement+Learning&hl=en&as_sdt=0,5", "gs_version_total": 3, "aff_unique_index": "0;1;2;1", "aff_unique_norm": "University of Montreal;Carnegie Mellon University;Robert Bosch GmbH", "aff_unique_dep": "Mila;;", "aff_unique_url": "https://www.mila.quebec;https://www.cmu.edu;https://www.bosch.com", "aff_unique_abbr": "Mila;CMU;Bosch", "aff_campus_unique_index": "0", "aff_campus_unique": "Montreal;", "aff_country_unique_index": "0;1;2;1", "aff_country_unique": "Canada;United States;Germany" }, { "id": "7ArYyAmDGQ", 
"title": "Prediction Risk and Estimation Risk of the Ridgeless Least Squares Estimator under General Assumptions on Regression Errors", "track": "main", "status": "Reject", "tldr": "", "abstract": "In recent years, there has been a significant growth in research focusing on minimum $\\ell_2$ norm (ridgeless) interpolation least squares estimators. However, the majority of these analyses have been limited to a simple regression error structure, assuming independent and identically distributed errors with zero mean and common variance. In this paper, we explore prediction risk as well as estimation risk under more general regression error assumptions, highlighting the benefits of overparameterization in a \\emph{finite} sample. We find that including a large number of \\emph{unimportant} parameters relative to the sample size can effectively reduce both risks. Notably, we establish that the estimation difficulties associated with the variance components of both risks \ncan be summarized through the trace of the variance-covariance matrix of the regression errors.", "keywords": "prediction risk;estimation risk;generalization;statistical learning;overparameterization;interpolation;ridgeless regression;benign overfitting;double descent;nonspherical errors", "primary_area": "learning theory", "supplementary_material": "/attachment/97aff42c3175e3ee375dc9ad0230bf08fb7b77ae.zip", "author": "Sungyoon Lee;Sokbae Lee", "authorids": "~Sungyoon_Lee1;~Sokbae_Lee1", "gender": "M;M", "homepage": "https://sites.google.com/view/sungyoon-lee/home;https://sites.google.com/site/sokbae/", "dblp": ";270/3314", "google_scholar": "https://scholar.google.co.kr/citations?user=PAoFkGEAAAAJ;nlNC3hQAAAAJ", "orcid": ";0000-0003-4080-7733", "linkedin": ";", "or_profile": "~Sungyoon_Lee1;~Sokbae_Lee1", "aff": "Hanyang University;Columbia University", "aff_domain": "hanyang.ac.kr;columbia.edu", "position": "Assistant Professor;Professor", "bibtex": "@misc{\nlee2024prediction,\ntitle={Prediction Risk and Estimation Risk of the Ridgeless Least Squares Estimator under General Assumptions on Regression Errors},\nauthor={Sungyoon Lee and Sokbae Lee},\nyear={2024},\nurl={https://openreview.net/forum?id=7ArYyAmDGQ}\n}", "github": "", "project": "", "reviewers": "zjX2;jNnY;xuqE", "site": "https://openreview.net/forum?id=7ArYyAmDGQ", "pdf_size": 387900, "rating": "5;5;6", "confidence": "3;3;3", "soundness": "3;3;3", "contribution": "2;3;2", "presentation": "3;2;3", "wc_summary": "80;162;101", "wc_strengths": "34;7;51", "wc_weaknesses": "121;36;148", "wc_questions": "164;2;2", "wc_review": "399;207;302", "wc_reply_reviewers": "27;0;153", "wc_reply_authors": "448;361;626", "reply_reviewers": "1;0;2", "reply_authors": "1;1;3", "rating_avg": [ 5.333333333333333, 0.4714045207910317 ], "confidence_avg": [ 3.0, 0.0 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 114.33333333333333, 34.77866523539332 ], "wc_strengths_avg": [ 30.666666666666668, 18.116904322268255 ], "wc_weaknesses_avg": [ 101.66666666666667, 47.72374205314956 ], "wc_questions_avg": [ 56.0, 76.36753236814714 ], "wc_review_avg": [ 302.6666666666667, 78.38508928503062 ], "wc_reply_reviewers_avg": [ 60.0, 66.6783323126786 ], "wc_reply_authors_avg": [ 478.3333333333333, 110.2915328673159 ], "reply_reviewers_avg": [ 1.0, 0.816496580927726 ], "reply_authors_avg": [ 1.6666666666666667, 0.9428090415820634 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 
2, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:DoXQ8vjLUiAJ:scholar.google.com/&scioq=Prediction+Risk+and+Estimation+Risk+of+the+Ridgeless+Least+Squares+Estimator+under+General+Assumptions+on+Regression+Errors&hl=en&as_sdt=0,5", "gs_version_total": 6, "aff_unique_index": "0;1", "aff_unique_norm": "Hanyang University;Columbia University", "aff_unique_dep": ";", "aff_unique_url": "https://www.hanyang.ac.kr;https://www.columbia.edu", "aff_unique_abbr": "HYU;Columbia", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1", "aff_country_unique": "South Korea;United States" }, { "id": "7B5Korw050", "title": "Lung Nodule Segmentation Network with Self-Supervised Learning and Attention Mechanisms", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Pulmonary nodule detection is one of the most important tasks for early lung cancer diagnosis. Especially, end-to-end methods for multi-tasking, including pulmonary nodule detection, false positive detection, and segmentation have been widely used based on supervised learning, leading to significant improvement in performance when detecting pulmonary nodules. However, those methods with confined environments were not able to exploit the representative features comprehensively. Therefore, some self-supervised methods have been proposed to handle the raw dataset. However, they were merely applied to each task, missing rich features of the end-to-end framework. In this paper, we propose a novel adaptation of self-supervised learning to a multi-tasking framework. Additionally, we employed other attention methods, such as Convolutional Block Attention Module(CBAM), and Quartet Attention Mechanism(QAM) to further enhance the performance without significantly in- creasing the number of parameters to learn.", "keywords": "Pulmonary Nodule Detection and Segmentation;3D Segmentation", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/9beadd02dd7401a3d837cc988ab2988cfe93c3b7.zip", "author": "Eunah Jung;Seungmin Chou;Changwon Lim", "authorids": "~Eunah_Jung1;~Seungmin_Chou1;clim@cau.ac.kr", "gender": "F;M;", "homepage": "https://github.com/JUNGEUNAH;;", "dblp": ";;", "google_scholar": ";;", "orcid": ";;", "linkedin": ";seugnmin-chu-000685216/;", "or_profile": "~Eunah_Jung1;~Seungmin_Chou1;clim@cau.ac.kr", "aff": "Chung-Ang University;Chung-Ang University;", "aff_domain": "cau.ac.kr;cau.ac.kr;", "position": "MS student;Undergrad student;", "bibtex": "@misc{\njung2024lung,\ntitle={Lung Nodule Segmentation Network with Self-Supervised Learning and Attention Mechanisms},\nauthor={Eunah Jung and Seungmin Chou and Changwon Lim},\nyear={2024},\nurl={https://openreview.net/forum?id=7B5Korw050}\n}", "github": "", "project": "", "reviewers": "", "site": "https://openreview.net/forum?id=7B5Korw050", "pdf_size": 319035, "rating": "", "confidence": "", "soundness": "", "contribution": "", "presentation": "", "wc_summary": "", "wc_strengths": "", "wc_weaknesses": "", "wc_questions": "", "wc_review": "", "wc_reply_reviewers": "", "wc_reply_authors": "", "reply_reviewers": "", "reply_authors": "", "rating_avg": [ 0, 0 ], "confidence_avg": [ 0, 0 ], "soundness_avg": [ 0, 0 ], "contribution_avg": [ 0, 0 ], "presentation_avg": [ 0, 0 ], "wc_summary_avg": [ 0, 0 ], "wc_strengths_avg": [ 0, 0 ], "wc_weaknesses_avg": [ 0, 0 ], "wc_questions_avg": [ 0, 0 ], 
"wc_review_avg": [ 0, 0 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 0, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:7fWtsvgK5YEJ:scholar.google.com/&scioq=Lung+Nodule+Segmentation+Network+with+Self-Supervised+Learning+and+Attention+Mechanisms&hl=en&as_sdt=0,23", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "Chung-Ang University", "aff_unique_dep": "", "aff_unique_url": "http://www.cau.ac.kr", "aff_unique_abbr": "CAU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "South Korea" }, { "id": "7CLvyZ6Xn7", "title": "Cross-domain Adaptation for Few-shot 3D Shape Generation", "track": "main", "status": "Desk Reject", "tldr": "", "abstract": "Realistic and diverse 3D shape generation is helpful for a wide variety of applications such as virtual reality, gaming, and animation. Modern generative models learn from large-scale datasets and generate new samples following similar distributions. However, when training data is limited, deep neural generative networks overfit and tend to replicate training samples. Prior works focus on few-shot image generation to produce high-quality and diverse results using a few target images. Unfortunately, abundant 3D shape data is typically hard to obtain as well. In this work, we make the first attempt to realize few-shot 3D shape generation by adapting generative models pre-trained on large source domains to target domains. To relieve overfitting and keep considerable diversity, we propose to maintain the probability distributions of the pairwise relative distances between adapted samples at feature-level and shape-level during domain adaptation. Our approach only needs the silhouettes of few-shot target samples as training data to learn target geometry distributions and achieve generated shapes with diverse topology and textures. Moreover, we introduce several metrics to evaluate generation quality and diversity. 
The effectiveness of our approach is demonstrated qualitatively and quantitatively under a series of few-shot 3D shape adaptation setups.", "keywords": "Few-shot;3D shape generation;Domain adaptation", "primary_area": "generative models", "supplementary_material": "/attachment/508ef1649b323ebae12785e156b6cce1e9d8d954.zip", "author": "JingYuan Zhu;Huimin Ma;Jiansheng Chen;Jian Yuan", "authorids": "~JingYuan_Zhu1;~Huimin_Ma1;~Jiansheng_Chen3;~Jian_Yuan1", "gender": "M;F;M;", "homepage": ";http://server.3dimagelab.cn:5000;http://scce.ustb.edu.cn/shiziduiwu/jiaoshixinxi/2021-11-15/210.html;http://bdktzweb.tsinghua.edu.cn/yuanjian/zh_CN/index.htm", "dblp": "302/9530;69/7694-1;;64/4192", "google_scholar": "a3ErJwkAAAAJ;32hwVLEAAAAJ;A1gA9XIAAAAJ;", "orcid": ";;;", "linkedin": ";;;", "or_profile": "~JingYuan_Zhu1;~Huimin_Ma1;~Jiansheng_Chen3;~Jian_Yuan1", "aff": "Electronic Engineering, Tsinghua University, Tsinghua University;University of Science and Technology Beijing;University of Science and Technology Beijing;Tsinghua University", "aff_domain": "mails.tsinghua.edu.cn;ustb.edu.cn;ustb.edu.cn;tsinghua.edu.cn", "position": "PhD student;Full Professor;Full Professor;Professor", "bibtex": "@misc{\nzhu2024crossdomain,\ntitle={Cross-domain Adaptation for Few-shot 3D Shape Generation},\nauthor={JingYuan Zhu and Huimin Ma and Jiansheng Chen and Jian Yuan},\nyear={2024},\nurl={https://openreview.net/forum?id=7CLvyZ6Xn7}\n}", "github": "", "project": "", "reviewers": "4te8;KzHF;DPcy;xeiS", "site": "https://openreview.net/forum?id=7CLvyZ6Xn7", "pdf_size": 48874117, "rating": "3;5;6;6", "confidence": "5;3;3;4", "soundness": "2;3;2;3", "contribution": "2;2;3;3", "presentation": "3;3;3;3", "wc_summary": "50;100;86;92", "wc_strengths": "11;30;119;85", "wc_weaknesses": "61;298;223;88", "wc_questions": "16;2;69;62", "wc_review": "138;430;497;327", "wc_reply_reviewers": "0;264;185;0", "wc_reply_authors": "685;1480;872;345", "reply_reviewers": "0;1;1;0", "reply_authors": "2;3;3;2", "rating_avg": [ 5.0, 1.224744871391589 ], "confidence_avg": [ 3.75, 0.82915619758885 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 82.0, 19.131126469708992 ], "wc_strengths_avg": [ 61.25, 43.01380592321493 ], "wc_weaknesses_avg": [ 167.5, 97.1763860204731 ], "wc_questions_avg": [ 37.25, 28.78693279944913 ], "wc_review_avg": [ 348.0, 135.52306076826926 ], "wc_reply_reviewers_avg": [ 112.25, 115.67276040624257 ], "wc_reply_authors_avg": [ 845.5, 412.1750235033656 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 2.5, 0.5 ], "replies_avg": [ 21, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.7385489458759963, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:PCzSa-ZAer8J:scholar.google.com/&scioq=Cross-domain+Adaptation+for+Few-shot+3D+Shape+Generation&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1;1;0", "aff_unique_norm": "Tsinghua University;University of Science and Technology Beijing", "aff_unique_dep": "Electronic Engineering;", "aff_unique_url": "https://www.tsinghua.edu.cn;http://www.ustb.edu.cn", "aff_unique_abbr": "THU;USTB", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "China" }, { "title": "Elastic Feature Consolidation For Cold Start Exemplar-Free Incremental Learning", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19370", "id": "7D9X2cFnt1", "author_site": "Simone 
Magistri, Tomaso Trinci, Albin Soutif--Cormerais, Joost van de Weijer, Andrew Bagdanov", "tldr": "", "abstract": "Exemplar-Free Class Incremental Learning (EFCIL) aims to learn from a sequence of tasks without having access to previous task data. In this paper, we consider the challenging Cold Start scenario in which insufficient data is available in the first task to learn a high-quality backbone. This is especially challenging for EFCIL since it requires high plasticity, which results in feature drift which is difficult to compensate for in the exemplar-free setting. To address this problem, we propose a simple and effective approach that consolidates feature representations by regularizing drift in directions highly relevant to previous tasks and employs prototypes to reduce task-recency bias. Our method, called Elastic Feature Consolidation (EFC), exploits a tractable second-order approximation of feature drift based on an Empirical Feature Matrix (EFM). The EFM induces a pseudo-metric in feature space which we use to regularize feature drift in important directions and to update Gaussian prototypes used in a novel asymmetric cross entropy loss which effectively balances prototype rehearsal with data from new tasks. Experimental results on CIFAR-100, Tiny-ImageNet, ImageNet-Subset and ImageNet-1K demonstrate that Elastic Feature Consolidation is better able to learn new tasks by maintaining model plasticity and significantly outperform the state-of-the-art.", "keywords": "Computer vision;continual learning;class-incremental learning;exemplar free;lifelong learning", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "/attachment/75279702f6513c9c1950c5b24c1637c0100a3626.zip", "author": "Simone Magistri;Tomaso Trinci;Albin Soutif;Joost van de Weijer;Andrew D. Bagdanov", "authorids": "~Simone_Magistri1;~Tomaso_Trinci1;~Albin_Soutif1;~Joost_van_de_Weijer5;~Andrew_D._Bagdanov2", "gender": "M;M;M;M;M", "homepage": "https://webgol.dinfo.unifi.it/simone-magistri/;https://webgol.dinfo.unifi.it/tomaso-trinci/;;http://www.micc.unifi.it/bagdanov;http://lamp.cvc.uab.es/", "dblp": "283/0920;364/8212;295/9611;64/3935;67/3379", "google_scholar": "fAS993EAAAAJ;kfN-d6IAAAAJ;BtPOFGoAAAAJ;_Fk4YUcAAAAJ;https://scholar.google.es/citations?user=Gsw2iUEAAAAJ", "orcid": "0000-0002-0520-8463;0000-0002-4052-1930;;;0000-0002-9656-9706", "linkedin": ";;albin-soutif-b2252210b/;;", "or_profile": "~Simone_Magistri1;~Tomaso_Trinci1;~Albin_Soutif1;~Andrew_D._Bagdanov2;~Joost_van_de_Weijer1", "aff": "University of Florence;University of Florence;Computer Vision Center, Universitat Aut\u00f2noma de Barcelona;Universit\u00e0 degli Studi di Firenze;Computer Vision Center, Universitat Aut\u00f3noma de Barcelona", "aff_domain": "unifi.it;unifi.it;cvc.uab.es;unifi.it;cvc.uab.es", "position": "PhD student;PhD student;PhD student;Associate Professor;Researcher", "bibtex": "@inproceedings{\nmagistri2024elastic,\ntitle={Elastic Feature Consolidation For Cold Start Exemplar-Free Incremental Learning},\nauthor={Simone Magistri and Tomaso Trinci and Albin Soutif and Joost van de Weijer and Andrew D. 
Bagdanov},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=7D9X2cFnt1}\n}", "github": "", "project": "", "reviewers": "RQMN;4Tis;Hr2j;sY5k", "pdf_size": 1200954, "rating": "6;6;8;8", "confidence": "5;5;4;5", "soundness": "3;3;3;4", "contribution": "3;3;3;3", "presentation": "3;3;3;4", "wc_summary": "198;133;56;197", "wc_strengths": "82;106;75;159", "wc_weaknesses": "462;99;6;339", "wc_questions": "9;9;3;65", "wc_review": "751;347;140;760", "wc_reply_reviewers": "38;0;35;88", "wc_reply_authors": "1401;763;258;723", "reply_reviewers": "1;0;1;1", "reply_authors": "2;1;1;1", "rating_avg": [ 7.0, 1.0 ], "confidence_avg": [ 4.75, 0.4330127018922193 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 146.0, 58.25375524376089 ], "wc_strengths_avg": [ 105.5, 32.95830699535399 ], "wc_weaknesses_avg": [ 226.5, 182.3410266506142 ], "wc_questions_avg": [ 21.5, 25.233905761891084 ], "wc_review_avg": [ 499.5, 266.27476410655214 ], "wc_reply_reviewers_avg": [ 40.25, 31.355820831226854 ], "wc_reply_authors_avg": [ 786.25, 406.6653261589928 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 23, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=9154825138737762782&as_sdt=1005&sciodt=0,4&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=7D9X2cFnt1", "pdf": "https://openreview.net/pdf?id=7D9X2cFnt1", "email": "unifi.it;unifi.it;cvc.uab.es;unifi.it;cvc.uab.es", "author_num": 5, "aff_unique_index": "0;0;1;0;2", "aff_unique_norm": "University of Florence;Universitat Aut\u00f2noma de Barcelona;Universitat Aut\u00f3noma de Barcelona", "aff_unique_dep": ";Computer Vision Center;Computer Vision Center", "aff_unique_url": "https://www.unifi.it;https://www.uab.cat;https://www.uab.cat", "aff_unique_abbr": "UNIFI;UAB;UAB", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;1;0;1", "aff_country_unique": "Italy;Spain" }, { "title": "Real3D-Portrait: One-shot Realistic 3D Talking Portrait Synthesis", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19369", "id": "7ERQPyR2eb", "author_site": "Zhenhui Ye, Tianyun Zhong, Yi Ren, Jiaqi Yang, Weichuang Li, Jiawei Huang, Ziyue Jiang, Jinzheng He, Rongjie Huang, Jinglin Liu, Chen Zhang, Xiang Yin, Zejun MA, Zhou Zhao", "tldr": "", "abstract": "One-shot 3D talking portrait generation aims to reconstruct a 3D avatar from an unseen image, and then animate it with a reference video or audio to generate a talking portrait video. The existing methods fail to simultaneously achieve the goals of accurate 3D avatar reconstruction and stable talking face animation. Besides, while the existing works mainly focus on synthesizing the head part, it is also vital to generate natural torso and background segments to obtain a realistic talking portrait video. 
To address these limitations, we present Real3D-Portrait, a framework that (1) improves the one-shot 3D reconstruction power with a large image-to-plane model that distills 3D prior knowledge from a 3D face generative model; (2) facilitates accurate motion-conditioned animation with an efficient motion adapter; (3) synthesizes realistic video with natural torso movement and switchable background using a head-torso-background super-resolution model; and (4) supports one-shot audio-driven talking face generation with a generalizable audio-to-motion model. Extensive experiments show that Real3D-Portrait generalizes well to unseen identities and generates more realistic talking portrait videos compared to previous methods. Video samples are available at https://real3dportrait.github.io.", "keywords": "One-shot Talking Face Generation;Neural Radiance Field", "primary_area": "generative models", "supplementary_material": "/attachment/d5e2a3d21b399033bef1d6ec656016a274654cde.zip", "author": "Zhenhui Ye;Tianyun Zhong;Yi Ren;Jiaqi Yang;Weichuang Li;Jiawei Huang;Ziyue Jiang;Jinzheng He;Rongjie Huang;Jinglin Liu;Chen Zhang;Xiang Yin;Zejun MA;Zhou Zhao", "authorids": "~Zhenhui_Ye1;~Tianyun_Zhong3;~Yi_Ren2;~Jiaqi_Yang8;~Weichuang_Li1;~Jiawei_Huang5;~Ziyue_Jiang1;~Jinzheng_He1;~Rongjie_Huang1;~Jinglin_Liu1;~Chen_Zhang3;~Xiang_Yin2;~Zejun_MA1;~Zhou_Zhao3", "gender": "M;M;M;M;M;M;M;;M;M;F;M;M;M", "homepage": "https://yerfor.github.io;;https://rayeren.github.io/;https://omnihuman-lab.github.io/;https://www.waytron.net/;;;;;;https://actuy.github.io/;;;https://dblp.uni-trier.de/pid/75/7785.html?", "dblp": "265/6375;;75/6568-6;;318/0593;13/4208-8;258/6865;272/8857;212/8936-1;;94/4084-20;18/1022-6.html;;75/7785", "google_scholar": ";https://scholar.google.co.jp/scholar?hl=zh-CN;4FA6C0AAAAAJ;https://scholar.google.com/citations?hl=zh-CN;742-_K0AAAAJ;https://scholar.google.com/citations?hl=zh-CN;wDgSBssAAAAJ;https://scholar.google.com/citations?hl=zh-CN;iRHBUsgAAAAJ;Ri8x0jEAAAAJ;eBBFeVcAAAAJ;e6_J-lEAAAAJ;https://scholar.google.com/citations?hl=zh-CN;https://scholar.google.com.hk/citations?user=IIoFY90AAAAJ", "orcid": ";;;0009-0006-6034-4069;;;;;;;;;;0000-0001-6121-0384", "linkedin": ";;;;;;;;;;;;zejun-ma-58614365/;", "or_profile": "~Zhenhui_Ye1;~Tianyun_Zhong3;~Yi_Ren2;~Jiaqi_Yang8;~Weichuang_Li1;~Jiawei_Huang5;~Ziyue_Jiang1;~Jinzheng_He1;~Rongjie_Huang1;~Jinglin_Liu1;~Chen_Zhang3;~Xiang_Yin2;~Zejun_MA1;~Zhou_Zhao2", "aff": "Zhejiang University;Zhejiang University;ByteDance;Tsinghua University;Hongkong University of Science and Technology(Guangzhou);Zhejiang University;Zhejiang University;Zhejiang University;Zhejiang University;ByteDance;Bytedance;ByteDance Inc.;ByteDance Inc.;Zhejiang University", "aff_domain": "zju.edu.cn;zju.edu.cn;bytedance.com;tsinghua.edu.cn;hkust-gz.edu.cn;zju.edu.cn;zju.edu.cn;zju.edu.cn;zju.edu.cn;bytedance.com;bytedance.com;bytedance.com;bytedance.com;zju.edu.cn", "position": "PhD student;MS student;Researcher;MS student;PhD student;MS student;PhD student;MS student;MS student;Research Scientist;Research Scientist;Researcher;Principal Researcher;Associate Professor", "bibtex": "@inproceedings{\nye2024realdportrait,\ntitle={Real3D-Portrait: One-shot Realistic 3D Talking Portrait Synthesis},\nauthor={Zhenhui Ye and Tianyun Zhong and Yi Ren and Jiaqi Yang and Weichuang Li and Jiawei Huang and Ziyue Jiang and Jinzheng He and Rongjie Huang and Jinglin Liu and Chen Zhang and Xiang Yin and Zejun MA and Zhou Zhao},\nbooktitle={The Twelfth International Conference on Learning 
Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=7ERQPyR2eb}\n}", "github": "", "project": "", "reviewers": "Kntd;8dWt;yTCz;MF4S", "pdf_size": 4764610, "rating": "8;8;8;10", "confidence": "4;3;5;4", "soundness": "3;2;3;4", "contribution": "3;1;2;3", "presentation": "3;3;4;3", "wc_summary": "228;85;116;122", "wc_strengths": "35;43;189;158", "wc_weaknesses": "10;64;381;278", "wc_questions": "341;30;22;91", "wc_review": "614;222;708;649", "wc_reply_reviewers": "221;99;88;0", "wc_reply_authors": "1880;1002;1576;945", "reply_reviewers": "4;2;4;0", "reply_authors": "5;4;6;4", "rating_avg": [ 8.5, 0.8660254037844386 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 2.25, 0.82915619758885 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 137.75, 53.9646875280493 ], "wc_strengths_avg": [ 106.25, 68.19594929319483 ], "wc_weaknesses_avg": [ 183.25, 151.92000362032644 ], "wc_questions_avg": [ 121.0, 129.79021534769097 ], "wc_review_avg": [ 548.25, 191.3326618745477 ], "wc_reply_reviewers_avg": [ 102.0, 78.69243928103894 ], "wc_reply_authors_avg": [ 1350.75, 392.77943874393424 ], "reply_reviewers_avg": [ 2.5, 1.6583123951777 ], "reply_authors_avg": [ 4.75, 0.82915619758885 ], "replies_avg": [ 38, 0 ], "authors#_avg": [ 14, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 47, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=4610920972123504276&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=7ERQPyR2eb", "pdf": "https://openreview.net/pdf?id=7ERQPyR2eb", "email": "zju.edu.cn;zju.edu.cn;bytedance.com;tsinghua.edu.cn;hkust-gz.edu.cn;zju.edu.cn;zju.edu.cn;zju.edu.cn;zju.edu.cn;bytedance.com;bytedance.com;bytedance.com;bytedance.com;zju.edu.cn", "author_num": 14, "aff_unique_index": "0;0;1;2;3;0;0;0;0;1;1;1;1;0", "aff_unique_norm": "Zhejiang University;ByteDance;Tsinghua University;Hong Kong University of Science and Technology", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.zju.edu.cn;https://www.bytedance.com;https://www.tsinghua.edu.cn;https://www.ust.hk", "aff_unique_abbr": "ZJU;ByteDance;THU;HKUST", "aff_campus_unique_index": "1", "aff_campus_unique": ";Guangzhou", "aff_country_unique_index": "0;0;0;0;0;0;0;0;0;0;0;0;0;0", "aff_country_unique": "China" }, { "id": "7ErllmwXym", "title": "Interpreting and improving diffusion models using the Euclidean distance function", "track": "main", "status": "Reject", "tldr": "", "abstract": "Denoising is intuitively related to projection. Indeed, under the manifold hypothesis, adding random noise is approximately equivalent to orthogonal perturbation. Hence, learning to denoise is approximately learning to project. In this paper, we use this observation to reinterpret denoising diffusion models as approximate gradient descent applied to the Euclidean distance function. We then provide straight-forward convergence analysis of the DDIM sampler under simple assumptions on the projection-error of the denoiser. Finally, we propose a new sampler based on two simple modifications to DDIM using insights from our theoretical results. 
In as few as 5-10 function evaluations, our sampler achieves state-of-the-art FID scores on pretrained CIFAR-10 and CelebA models and can generate high quality samples on latent diffusion models.", "keywords": "Diffusion models;distance functions;projection;training-free sampler", "primary_area": "generative models", "supplementary_material": "/attachment/3c87d9fda1783f5522157a8aa1542c4aca19463e.zip", "author": "Frank Permenter;Chenyang Yuan", "authorids": "~Frank_Permenter1;~Chenyang_Yuan1", "gender": ";", "homepage": "https://www.mit.edu/~fperment;", "dblp": "90/9943;", "google_scholar": "BQ_S4vMAAAAJ;", "orcid": ";", "linkedin": ";", "or_profile": "~Frank_Permenter1;~Chenyang_Yuan1", "aff": "Toyota Research Institute;", "aff_domain": "tri.global;", "position": "Principal Researcher;", "bibtex": "@misc{\npermenter2024interpreting,\ntitle={Interpreting and improving diffusion models using the Euclidean distance function},\nauthor={Frank Permenter and Chenyang Yuan},\nyear={2024},\nurl={https://openreview.net/forum?id=7ErllmwXym}\n}", "github": "", "project": "", "reviewers": "LpGF;dfzc;gUw5", "site": "https://openreview.net/forum?id=7ErllmwXym", "pdf_size": 7309770, "rating": "3;6;8", "confidence": "4;3;3", "soundness": "2;3;3", "contribution": "1;3;3", "presentation": "2;4;2", "wc_summary": "99;152;57", "wc_strengths": "20;75;47", "wc_weaknesses": "513;83;1", "wc_questions": "6;47;73", "wc_review": "638;357;178", "wc_reply_reviewers": "0;88;0", "wc_reply_authors": "160;586;73", "reply_reviewers": "0;1;0", "reply_authors": "1;2;1", "rating_avg": [ 5.666666666666667, 2.0548046676563256 ], "confidence_avg": [ 3.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.9428090415820634 ], "presentation_avg": [ 2.6666666666666665, 0.9428090415820634 ], "wc_summary_avg": [ 102.66666666666667, 38.87015421745698 ], "wc_strengths_avg": [ 47.333333333333336, 22.45489305746572 ], "wc_weaknesses_avg": [ 199.0, 224.54101332867157 ], "wc_questions_avg": [ 42.0, 27.58018612458347 ], "wc_review_avg": [ 391.0, 189.32687782421877 ], "wc_reply_reviewers_avg": [ 29.333333333333332, 41.48359782961079 ], "wc_reply_authors_avg": [ 273.0, 224.15619554230483 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 1.3333333333333333, 0.4714045207910317 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.9176629354822472, "gs_citation": 11, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14071772171599282298&as_sdt=40005&sciodt=0,10&hl=en", "gs_version_total": 0, "aff_unique_index": "0", "aff_unique_norm": "Toyota Research Institute", "aff_unique_dep": "", "aff_unique_url": "https://www.tri.global", "aff_unique_abbr": "TRI", "aff_country_unique_index": "0", "aff_country_unique": "United States" }, { "id": "7F4ioiKQFT", "title": "ColCLIP: Enhancing Fine-Grained Image Retrieval with Pre-trained Embeddings", "track": "main", "status": "Reject", "tldr": "", "abstract": "In the realm of image retrieval systems, efficiently searching for images based on any visual element described in the query is critical for user experience. However, current embedding models like CLIP primarily focus on aligning text with the most salient aspects of images, which may not always correspond to the elements users seek. In this paper, we propose ColCLIP, a fine-grained image retrieval system that leverages pre-trained embeddings and enhances them for our use case. 
We fine-tune CLIP on the Visual Genome Dataset and incorporate the MaxSim operator for image-text interaction. Our evaluations show that ColCLIP consistently outperforms standard CLIP in handling fine-grained retrieval tasks. ColCLIP improves image retrieval systems by enabling more relevant searches for users while maintaining efficiency and ease of development. We release our code at https://anonymous.4open.science/r/image-is-context-32B6.", "keywords": "Multimodal Learning;Image;Language;Retrieval", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Conghao Shen;Yixin Liu;Wanyue Zhai", "authorids": "~Conghao_Shen1;~Yixin_Liu6;~Wanyue_Zhai1", "gender": "M;F;F", "homepage": "https://tomshen.io;;", "dblp": ";;", "google_scholar": ";;", "orcid": ";;", "linkedin": "conghao-shen/;yixin-liu-261090201/;wanyue-zhai-74a074182/", "or_profile": "~Conghao_Shen1;~Yixin_Liu6;~Wanyue_Zhai1", "aff": "Stanford University;Stanford University;Stanford University", "aff_domain": "stanford.edu;stanford.edu;stanford.edu", "position": "MS student;MS student;MS student", "bibtex": "@misc{\nshen2024colclip,\ntitle={Col{CLIP}: Enhancing Fine-Grained Image Retrieval with Pre-trained Embeddings},\nauthor={Conghao Shen and Yixin Liu and Wanyue Zhai},\nyear={2024},\nurl={https://openreview.net/forum?id=7F4ioiKQFT}\n}", "github": "", "project": "", "reviewers": "hnuQ;coku;yk6P;Qpf8", "site": "https://openreview.net/forum?id=7F4ioiKQFT", "pdf_size": 3760218, "rating": "3;3;5;5", "confidence": "4;4;5;4", "soundness": "2;2;2;3", "contribution": "2;1;2;2", "presentation": "2;3;1;2", "wc_summary": "53;61;115;69", "wc_strengths": "25;19;106;45", "wc_weaknesses": "206;55;262;194", "wc_questions": "39;18;4;18", "wc_review": "323;153;487;326", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 2.0, 0.7071067811865476 ], "wc_summary_avg": [ 74.5, 24.057223447438815 ], "wc_strengths_avg": [ 48.75, 34.4265522525855 ], "wc_weaknesses_avg": [ 179.25, 76.18849978835388 ], "wc_questions_avg": [ 19.75, 12.497499749949988 ], "wc_review_avg": [ 322.25, 118.11302849389648 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 6, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.5773502691896257, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:ZMvOkV_SPHkJ:scholar.google.com/&scioq=ColCLIP:+Enhancing+Fine-Grained+Image+Retrieval+with+Pre-trained+Embeddings&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;0", "aff_unique_norm": "Stanford University", "aff_unique_dep": "", "aff_unique_url": "https://www.stanford.edu", "aff_unique_abbr": "Stanford", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Stanford", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "7FHrZuKogW", "title": "Contractive Systems Improve Graph Neural Networks Against Adversarial Attacks", "track": "main", "status": "Reject", "tldr": "", "abstract": "Graph Neural Networks (GNNs) have established themselves as a key component in addressing diverse graph-based tasks. 
Despite their notable successes, GNNs remain susceptible to input perturbations in the form of adversarial attacks. This paper introduces an innovative approach to fortify GNNs against adversarial perturbations through the lens of contractive dynamical systems. Our method introduces graph neural layers based on differential equations with contractive properties, which, as we show, improve the robustness of GNNs. A distinctive feature of the proposed approach is the simultaneous learned evolution of both the node features and the adjacency matrix, yielding an intrinsic enhancement of model robustness to perturbations in the input features and the connectivity of the graph. We mathematically derive the underpinnings of our novel architecture and provide theoretical insights to reason about its expected behavior. We demonstrate the efficacy of our method through numerous real-world benchmarks, reaching on par or improved performance compared to existing methods.", "keywords": "Graph Neural Networks;Adversarial Defense;Contractive Systems;Dynamical Systems Inspired Neural Networks", "primary_area": "learning on graphs and other geometries & topologies", "supplementary_material": "", "author": "Moshe Eliasof;Davide Murari;Ferdia Sherry;Carola-Bibiane Sch\u00f6nlieb", "authorids": "~Moshe_Eliasof1;~Davide_Murari1;~Ferdia_Sherry1;~Carola-Bibiane_Sch\u00f6nlieb1", "gender": "M;M;;F", "homepage": ";http://davidemurari.com;https://ferdiasherry.com;http://www.damtp.cam.ac.uk/research/cia/", "dblp": "239/6004;286/5121;;07/8184", "google_scholar": "44LKqBsAAAAJ;P8A76uwAAAAJ;8V2NqB8AAAAJ;nPeOXjwAAAAJ", "orcid": ";0000-0002-1095-6685;;", "linkedin": ";;;", "or_profile": "~Moshe_Eliasof1;~Davide_Murari1;~Ferdia_Sherry1;~Carola-Bibiane_Sch\u00f6nlieb1", "aff": "University of Cambridge;Norwegian University of Science and Technology;University of Cambridge;University of Cambridge", "aff_domain": "cam.ac.uk;ntnu.no;cam.ac.uk;cam.ac.uk", "position": "Postdoc;PhD student;Postdoc;Full Professor", "bibtex": "@misc{\neliasof2024contractive,\ntitle={Contractive Systems Improve Graph Neural Networks Against Adversarial Attacks},\nauthor={Moshe Eliasof and Davide Murari and Ferdia Sherry and Carola-Bibiane Sch{\\\"o}nlieb},\nyear={2024},\nurl={https://openreview.net/forum?id=7FHrZuKogW}\n}", "github": "", "project": "", "reviewers": "mRqu;SPJa;fwuD;QT3W", "site": "https://openreview.net/forum?id=7FHrZuKogW", "pdf_size": 531618, "rating": "5;5;6;6", "confidence": "4;4;1;2", "soundness": "3;3;3;3", "contribution": "2;3;3;3", "presentation": "2;3;3;3", "wc_summary": "32;22;80;51", "wc_strengths": "33;62;107;13", "wc_weaknesses": "78;570;6;36", "wc_questions": "139;1;10;9", "wc_review": "282;655;203;109", "wc_reply_reviewers": "205;20;9;9", "wc_reply_authors": "1925;2577;188;265", "reply_reviewers": "2;1;1;1", "reply_authors": "6;6;2;2", "rating_avg": [ 5.5, 0.5 ], "confidence_avg": [ 2.75, 1.299038105676658 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 46.25, 22.094965489902897 ], "wc_strengths_avg": [ 53.75, 35.336772631353874 ], "wc_weaknesses_avg": [ 172.5, 230.91719295020022 ], "wc_questions_avg": [ 39.75, 57.408078699778834 ], "wc_review_avg": [ 312.25, 207.14653629737572 ], "wc_reply_reviewers_avg": [ 60.75, 83.40376190556395 ], "wc_reply_authors_avg": [ 1238.75, 1038.5225984541694 ], "reply_reviewers_avg": [ 1.25, 0.4330127018922193 ], "reply_authors_avg": [ 4.0, 2.0 ], "replies_avg": [ 28, 0 ], 
"authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.9622504486493763, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14697871274676579373&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 0, "aff_unique_index": "0;1;0;0", "aff_unique_norm": "University of Cambridge;Norwegian University of Science and Technology", "aff_unique_dep": ";", "aff_unique_url": "https://www.cam.ac.uk;https://www.ntnu.no", "aff_unique_abbr": "Cambridge;NTNU", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Cambridge;", "aff_country_unique_index": "0;1;0;0", "aff_country_unique": "United Kingdom;Norway" }, { "title": "SLiMe: Segment Like Me", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19368", "id": "7FeIRqCedv", "author_site": "Aliasghar Khani, Saeid Asgari, Aditya Sanghi, Ali Mahdavi Amiri, Ghassan Hamarneh", "tldr": "", "abstract": "Significant strides have been made using large vision-language models, like Stable Diffusion (SD), for a variety of downstream tasks, including image generation, image editing, and 3D shape generation. Inspired by these advancements, we explore leveraging these vision-language models for segmenting images at any desired granularity using as few as one annotated sample. We propose SLiMe, which frames this problem as an optimization task. Specifically, given a single image and its segmentation mask, we first extract our novel \u201cweighted accumulated self-attention map\u201d along with cross-attention map from the SD prior. Then, using these extracted maps, the text embeddings of SD are optimized to highlight the segmented region in these attention maps, which in turn can be used to derive new segmentation results. Moreover, leveraging additional training data when available, i.e. few-shot, improves the performance of SLiMe. 
We performed comprehensive experiments examining various design factors and showed that SLiMe outperforms other existing one-shot and few-shot segmentation methods.", "keywords": "one-shot segmentation;computer vision;text-to-image models;stable diffusion;cross attention", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/9c59450fa65d10e741d665936f860f90609cced7.zip", "author": "Aliasghar Khani;Saeid Asgari;Aditya Sanghi;Ali Mahdavi Amiri;Ghassan Hamarneh", "authorids": "~Aliasghar_Khani1;~Saeid_Asgari1;~Aditya_Sanghi1;~Ali_Mahdavi_Amiri1;~Ghassan_Hamarneh1", "gender": "M;;M;M;M", "homepage": "http://aliasgharkhani.github.io/;https://asgsaeid.github.io/;https://github.com/sanghiad;https://www.sfu.ca/~amahdavi;http://www.medicalimageanalysis.com", "dblp": ";201/4374.html;;33/10499.html;h/GhassanHamarneh", "google_scholar": "yr7Y5EcAAAAJ;SuePM1sAAAAJ;q0-11e25FxIC;https://scholar.google.ca/citations?user=M9eTADwAAAAJ;https://scholar.google.ca/citations?user=61DdlkAAAAAJ", "orcid": ";;;;0000-0001-5040-7448", "linkedin": "aliasghar-khani-08157b16b/;;;;ghassanhamarneh/", "or_profile": "~Aliasghar_Khani1;~Saeid_Asgari1;~Aditya_Sanghi1;~Ali_Mahdavi_Amiri1;~Ghassan_Hamarneh1", "aff": "Computing Science, Simon Fraser University;Autodesk;Autodesk;Simon Fraser University;Simon Fraser University", "aff_domain": "cs.sfu.ca;autodesk.com;autodesk.com;sfu.ca;sfu.ca", "position": "MS student;Research Scientist;Researcher;Assistant Professor;Full Professor", "bibtex": "@inproceedings{\nkhani2024slime,\ntitle={{SL}iMe: Segment Like Me},\nauthor={Aliasghar Khani and Saeid Asgari and Aditya Sanghi and Ali Mahdavi Amiri and Ghassan Hamarneh},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=7FeIRqCedv}\n}", "github": "", "project": "", "reviewers": "Fjuo;kAQy;16rP;VRf7", "pdf_size": 22137145, "rating": "6;6;8;8", "confidence": "2;3;3;4", "soundness": "3;3;3;3", "contribution": "3;3;3;3", "presentation": "3;3;3;3", "wc_summary": "105;79;129;75", "wc_strengths": "124;64;48;66", "wc_weaknesses": "168;160;140;95", "wc_questions": "47;5;12;15", "wc_review": "444;308;329;251", "wc_reply_reviewers": "0;42;21;13", "wc_reply_authors": "667;315;244;616", "reply_reviewers": "0;1;1;1", "reply_authors": "1;2;1;1", "rating_avg": [ 7.0, 1.0 ], "confidence_avg": [ 3.0, 0.7071067811865476 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 97.0, 21.77154105707724 ], "wc_strengths_avg": [ 75.5, 28.85740806101615 ], "wc_weaknesses_avg": [ 140.75, 28.314086600135983 ], "wc_questions_avg": [ 19.75, 16.145819892467525 ], "wc_review_avg": [ 333.0, 70.15340333868343 ], "wc_reply_reviewers_avg": [ 19.0, 15.247950681976906 ], "wc_reply_authors_avg": [ 460.5, 183.61985186792847 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.7071067811865475, "gs_citation": 33, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=1984554634286821078&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=7FeIRqCedv", "pdf": "https://openreview.net/pdf?id=7FeIRqCedv", "email": "cs.sfu.ca;autodesk.com;autodesk.com;sfu.ca;sfu.ca", "author_num": 5, "aff_unique_index": "0;1;1;0;0", "aff_unique_norm": "Simon Fraser 
University;Autodesk", "aff_unique_dep": "Computing Science;", "aff_unique_url": "https://www.sfu.ca;https://www.autodesk.com", "aff_unique_abbr": "SFU;Autodesk", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;1;0;0", "aff_country_unique": "Canada;United States" }, { "id": "7GCRhebJEr", "title": "Robustness via learned Bregman divergence", "track": "main", "status": "Reject", "tldr": "", "abstract": "We exploit the Bregman divergence to generate functions that are trained to measure the semantic similarity between images under corruptions and use these functions as alternatives to the $L^p$ norms to define robustness threat models. Then we replace the projected gradient descent (PGD) by semantic attacks, which are instantiations of the mirror descent, the optimization framework associated with the Bregman divergence. Adversarial training under these settings yield classification models that are more robust to common image corruptions. Particularly, for the contrast corruption that was found problematic in prior work we achieve an accuracy that exceeds the $L^p$- and the LPIPS-based adversarially trained neural networks by a margin of 29\\% on the CIFAR-10-C corruption dataset.", "keywords": "Bregman divergence;Mirror descent;Corruption robustness;Adversarial training;Self-supervised learning.", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Mohamed-Hicham LEGHETTAS;Markus P\u00fcschel", "authorids": "~Mohamed-Hicham_LEGHETTAS1;~Markus_P\u00fcschel1", "gender": "M;M", "homepage": "https://acl.inf.ethz.ch/people/hichaml/;https://acl.inf.ethz.ch/", "dblp": ";37/6355", "google_scholar": ";az9ZryAAAAAJ", "orcid": ";0000-0001-8834-8551", "linkedin": ";", "or_profile": "~Mohamed-Hicham_LEGHETTAS1;~Markus_P\u00fcschel1", "aff": "Department of Computer Science, ETHZ - ETH Zurich;Department of Computer Science, ETHZ - ETH Zurich", "aff_domain": "inf.ethz.ch;inf.ethz.ch", "position": "PhD student;Full Professor", "bibtex": "@misc{\nleghettas2024robustness,\ntitle={Robustness via learned Bregman divergence},\nauthor={Mohamed-Hicham LEGHETTAS and Markus P{\\\"u}schel},\nyear={2024},\nurl={https://openreview.net/forum?id=7GCRhebJEr}\n}", "github": "", "project": "", "reviewers": "qLEt;brGx;zXKR;GMTd", "site": "https://openreview.net/forum?id=7GCRhebJEr", "pdf_size": 1783808, "rating": "3;3;6;8", "confidence": "4;4;3;4", "soundness": "2;2;2;3", "contribution": "2;2;3;3", "presentation": "3;3;3;4", "wc_summary": "21;94;67;80", "wc_strengths": "11;43;57;119", "wc_weaknesses": "53;271;65;410", "wc_questions": "6;2;82;237", "wc_review": "91;410;271;846", "wc_reply_reviewers": "0;119;36;72", "wc_reply_authors": "6;1349;255;540", "reply_reviewers": "0;1;1;1", "reply_authors": "1;2;1;1", "rating_avg": [ 5.0, 2.1213203435596424 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 65.5, 27.408940147331492 ], "wc_strengths_avg": [ 57.5, 39.22690403281911 ], "wc_weaknesses_avg": [ 199.75, 149.14317785269296 ], "wc_questions_avg": [ 81.75, 95.132473425219 ], "wc_review_avg": [ 404.5, 278.86242127615543 ], "wc_reply_reviewers_avg": [ 56.75, 44.04188347471075 ], "wc_reply_authors_avg": [ 537.5, 505.1823928048166 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 2, 0 ], 
"corr_rating_confidence": -0.2721655269759087, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:orqCiqyFMJ4J:scholar.google.com/&scioq=Robustness+via+learned+Bregman+divergence&hl=en&as_sdt=0,11", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "ETH Zurich", "aff_unique_dep": "Department of Computer Science", "aff_unique_url": "https://www.ethz.ch", "aff_unique_abbr": "ETHZ", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Zurich", "aff_country_unique_index": "0;0", "aff_country_unique": "Switzerland" }, { "id": "7GkdjhupsV", "title": "InfoAug: Mutual Information Informed Augmentation for Representation Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "Representation learning methods utilizing the InfoNCE loss have demonstrated considerable capacity in reducing human annotation effort by training invariant neural feature extractors. Although different variants of the training objective adhere to the information maximization principle between the data and learned features, data selection and augmentation still rely on human hypotheses or engineering, which may be suboptimal. For instance, data augmentation in contrastive learning primarily focuses on color jittering, aiming to emulate real-world illumination changes. In this work, we investigate the potential of selecting training data based on their mutual information computed from real-world distributions, which, in principle, should endow the learned features with better generalization when applied in open environments. Specifically, we consider patches attached to scenes that exhibit high mutual information under natural perturbations, such as color changes and motion, as positive samples for learning with contrastive loss. We evaluate the proposed mutual-information-informed data augmentation method on several benchmarks across multiple state-of-the-art representation learning frameworks, demonstrating its effectiveness and establishing it as a promising direction for future research. 
The data and code will be available for further investigation.", "keywords": "representation learning;mutual information;data augmentation", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Hanyang Chen;Qingyuan Zheng;YANG ZONGRU;Yanchao Yang", "authorids": "~Hanyang_Chen2;~Qingyuan_Zheng1;~YANG_ZONGRU2;~Yanchao_Yang1", "gender": "M;M;M;M", "homepage": "https://jeremycccc.github.io/;;https://github.com/yangzongru-jpg;https://yanchaoyang.github.io/", "dblp": ";;;84/8637-1", "google_scholar": ";;;r2tKnV4AAAAJ", "orcid": ";;;", "linkedin": ";https://www.linkedin.cn/incareer/in/ACoAAD7uNpgBlyknH4xCq6-6dwLecU4xaHDNqBc;;", "or_profile": "~Hanyang_Chen2;~Qingyuan_Zheng1;~YANG_ZONGRU2;~Yanchao_Yang1", "aff": "University of Hong Kong;University of Hong Kong;University of Hong Kong;University of Hong Kong", "aff_domain": "hku.hk;hku.hk;hku.hk;hku.hk", "position": "Undergrad student;PhD student;MS student;Assistant Professor", "bibtex": "@misc{\nchen2024infoaug,\ntitle={InfoAug: Mutual Information Informed Augmentation for Representation Learning},\nauthor={Hanyang Chen and Qingyuan Zheng and YANG ZONGRU and Yanchao Yang},\nyear={2024},\nurl={https://openreview.net/forum?id=7GkdjhupsV}\n}", "github": "", "project": "", "reviewers": "xZ59;m3jm;LYQ4;A3xm", "site": "https://openreview.net/forum?id=7GkdjhupsV", "pdf_size": 1388488, "rating": "3;3;3;6", "confidence": "5;3;4;3", "soundness": "2;2;1;3", "contribution": "2;1;1;3", "presentation": "2;2;2;3", "wc_summary": "39;94;71;128", "wc_strengths": "34;27;42;97", "wc_weaknesses": "134;190;199;258", "wc_questions": "73;2;2;37", "wc_review": "280;313;314;520", "wc_reply_reviewers": "0;61;0;18", "wc_reply_authors": "495;467;559;457", "reply_reviewers": "0;1;0;1", "reply_authors": "1;1;1;1", "rating_avg": [ 3.75, 1.299038105676658 ], "confidence_avg": [ 3.75, 0.82915619758885 ], "soundness_avg": [ 2.0, 0.7071067811865476 ], "contribution_avg": [ 1.75, 0.82915619758885 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 83.0, 32.50384592629001 ], "wc_strengths_avg": [ 50.0, 27.649593125396983 ], "wc_weaknesses_avg": [ 195.25, 43.96234183935155 ], "wc_questions_avg": [ 28.5, 29.3981291921782 ], "wc_review_avg": [ 356.75, 95.24015697173121 ], "wc_reply_reviewers_avg": [ 19.75, 24.923633362734254 ], "wc_reply_authors_avg": [ 494.5, 39.75864685826217 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.5222329678670935, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:5X_KkOYcPoIJ:scholar.google.com/&scioq=InfoAug:+Mutual+Information+Informed+Augmentation+for+Representation+Learning&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "University of Hong Kong", "aff_unique_dep": "", "aff_unique_url": "https://www.hku.hk", "aff_unique_abbr": "HKU", "aff_campus_unique_index": "0;0;0;0", "aff_campus_unique": "Hong Kong SAR", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "China" }, { "id": "7Gza2TkLPJ", "title": "BiTGNN: prediction of drug-target interactions based on bidirectional transformer and graph neural network on heterogeneous graph", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Drug-target interaction (DTI) is a widely explored topic in the field of bioinformatics and plays a pivotal role in drug discovery. 
However, the traditional bio-experimental process of drug-target interaction identification requires a large investment of time and labor. To address this challenge, graph neural network (GNN) approaches in deep learning are becoming a prominent trend in the field of DTI research, which is characterized by multimodal processing of data, feature learning and interpretability in DTI. Nevertheless, some methods are still limited by homogeneous graphs and single features. To address these problems, we mechanistically analyze graph convolutional neural networks (GCN) and graph attentional neural networks (GAT) in order to propose a new model for drug-target interaction prediction based on graph neural networks named BiTGNN (bidirectional transformer and graph neural network). The method first establishes drug-target pairs through the pseudo position-specific scoring matrix (PsePSSM) and drug fingerprint data, and constructs a heterogeneous network by utilizing the relationship between the drug and the target. Then, the computational extraction of drug and target attributes is performed using GCN and GAT for the purpose of model information flow extension and graph information enhancement. We collect interaction data using the proposed Bi-directional transformer (Bi-transformer) architecture, in which we design a bi-directional cross-attention mechanism for calculating the effects of drug-target interactions for realistic biological interaction simulations. Finally, a feed-forward neural network is used to obtain the feature matrices of the drug and the target, and DTI prediction is performed by fusing the two feature matrices. The Enzyme, Ion Channel (IC), G Protein-coupled Receptor (GPCR), and Nuclear Receptor (NR) datasets are used in the experiments, and compared with several existing mainstream models, our model outperforms the others in Area Under the Curve (AUC), Area Under the Precision-Recall Curve (AUPR), Accuracy and Specificity metrics.", "keywords": "DTI prediction;bidirectional transformer;graph attention network;graph convolutional neural network", "primary_area": "applications to physical sciences (physics, chemistry, biology, etc.)", "supplementary_material": "", "author": "Qingqian Zhang;Changxiang He;Xiaofei Qin;Peisheng Yang;Junyang Kong", "authorids": "~Qingqian_Zhang2;~Changxiang_He2;~Xiaofei_Qin1;~Peisheng_Yang1;~Junyang_Kong1", "gender": "F;M;M;;", "homepage": ";;;;", "dblp": ";;;;", "google_scholar": ";;;;", "orcid": ";0000-0002-0258-5423;0009-0002-1134-5517;0009-0003-1645-4058;", "linkedin": ";;;;", "or_profile": "~Qingqian_Zhang2;~Xiaofei_Qin1;~Peisheng_Yang1;~Junyang_Kong1;~changxiang_he1", "aff": "University of Shanghai for Science and Technology;Shanghai University of Science and Technology;University of Shanghai for Science and Technology;Shanghai University of Science and Technology;", "aff_domain": "usst.edu.cn;usst.edu.cn;usst.edu.cn;usst.edu.cn;", "position": "MS student;Associate Professor;MS student;MS student;", "bibtex": "@misc{\nzhang2024bitgnn,\ntitle={Bi{TGNN}: prediction of drug-target interactions based on bidirectional transformer and graph neural network on heterogeneous graph},\nauthor={Qingqian Zhang and Changxiang He and Xiaofei Qin and Peisheng Yang and Junyang Kong},\nyear={2024},\nurl={https://openreview.net/forum?id=7Gza2TkLPJ}\n}", "github": "", "project": "", "reviewers": "rts4;eUmF;UEEt;Z8k5", "site": "https://openreview.net/forum?id=7Gza2TkLPJ", "pdf_size": 472893, "rating": "1;1;3;3", "confidence": "5;4;4;5", "soundness": "1;1;2;3", 
"contribution": "1;1;2;2", "presentation": "1;1;2;1", "wc_summary": "93;75;58;111", "wc_strengths": "5;7;24;109", "wc_weaknesses": "67;192;250;317", "wc_questions": "4;2;35;55", "wc_review": "169;276;367;592", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 2.0, 1.0 ], "confidence_avg": [ 4.5, 0.5 ], "soundness_avg": [ 1.75, 0.82915619758885 ], "contribution_avg": [ 1.5, 0.5 ], "presentation_avg": [ 1.25, 0.4330127018922193 ], "wc_summary_avg": [ 84.25, 19.79109648301478 ], "wc_strengths_avg": [ 36.25, 42.64607250380743 ], "wc_weaknesses_avg": [ 206.5, 91.88715905935932 ], "wc_questions_avg": [ 24.0, 22.169799277395363 ], "wc_review_avg": [ 351.0, 155.79313206942084 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6952811768654855146&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "aff_unique_index": "0;1;0;1", "aff_unique_norm": "University of Shanghai for Science and Technology;Shanghai University of Science and Technology", "aff_unique_dep": ";", "aff_unique_url": "https://www.usst.edu.cn;https://www.sustech.edu.cn", "aff_unique_abbr": "USST;SUSTech", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "China" }, { "id": "7HdtLgsvys", "title": "Tube Loss: A Novel Approach for High Quality Prediction Interval Estimation", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "This paper proposes a continuous loss function termed 'tube loss' for Prediction Interval (PI) estimation. The minimizer of the proposed tube loss is a pair of functions $\\mu_1(x)$ and $\\mu_2(x)$ such that the interval $[\\mu_1(x),\\mu_2(x)]$ contains $t$ fraction of $y_i$ values. The tube loss function also facilitates an upward or downward movement of the PI tube so that the estimated PI may cover the densest regions of response values, thus allowing the sharpening of the width of PI, especially when the distribution of the response is skewed. The tube loss function-based machine learning models also have the privilege of trading off the calibration error and the width of PI by solving a single optimization problem. We have illustrated the use of tube loss functions in kernel machines, neural networks, and sequential deep learning models. 
Our numerical experiments show that the tube loss function is effective in yielding narrow and more accurate PIs compared to the existing methods.", "keywords": "Prediction Interval Estimation;Neural Network;Loss Function;Kernel Machine", "primary_area": "probabilistic methods (Bayesian methods, variational inference, sampling, UQ, etc.)", "supplementary_material": "/attachment/f03da49e3d74031967c62860619ea67ae3dee76c.zip", "author": "Pritam Anand;Tathagata Bandyopadhyay;Harshkumar Mukeshbhai Savaliya;Suresh Chandra", "authorids": "~Pritam_Anand1;~Tathagata_Bandyopadhyay1;~Harshkumar_Mukeshbhai_Savaliya2;~Suresh_Chandra2", "gender": "M;M;;M", "homepage": "https://scholar.google.com/citations?user=ATYzQhoAAAAJ&hl=en;;;", "dblp": ";;;", "google_scholar": ";https://scholar.google.co.in/citations?user=NZjB-lUAAAAJ;;https://scholar.google.co.in/citations?user=X8dtzjAAAAAJ", "orcid": ";;;", "linkedin": ";;harsh-savaliya-8b81b117a/;", "or_profile": "~Pritam_Anand1;~Tathagata_Bandyopadhyay1;~Harshkumar_Mukeshbhai_Savaliya2;~Suresh_Chandra2", "aff": "DA-IICT, Gandhinagar;DA-IICT;;", "aff_domain": "daiict.ac.in;daiict.ac.in;;", "position": "Assistant Professor;Full Professor;;", "bibtex": "@misc{\nanonymous2024tube,\ntitle={Tube Loss: A Novel Approach for High Quality Prediction Interval Estimation},\nauthor={Anonymous},\nyear={2024},\nurl={https://openreview.net/forum?id=7HdtLgsvys}\n}", "github": "", "project": "", "reviewers": "tfsf;PHGF;9f1c;RfXE", "site": "https://openreview.net/forum?id=7HdtLgsvys", "pdf_size": 944500, "rating": "1;3;3;3", "confidence": "5;3;2;3", "soundness": "1;3;2;2", "contribution": "1;3;1;2", "presentation": "1;2;1;2", "wc_summary": "37;62;26;74", "wc_strengths": "18;94;15;51", "wc_weaknesses": "44;68;79;137", "wc_questions": "340;137;15;4", "wc_review": "439;361;135;266", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 2.5, 0.8660254037844386 ], "confidence_avg": [ 3.25, 1.0897247358851685 ], "soundness_avg": [ 2.0, 0.7071067811865476 ], "contribution_avg": [ 1.75, 0.82915619758885 ], "presentation_avg": [ 1.5, 0.5 ], "wc_summary_avg": [ 49.75, 19.13602623325961 ], "wc_strengths_avg": [ 44.5, 31.87867625859016 ], "wc_weaknesses_avg": [ 82.0, 34.18332927027442 ], "wc_questions_avg": [ 124.0, 135.1906061825303 ], "wc_review_avg": [ 300.25, 113.38292419936964 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 6, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.9271726499455306, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:v68TjBMqysEJ:scholar.google.com/&scioq=Tube+Loss:+A+Novel+Approach+for+High+Quality+Prediction+Interval+Estimation&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "Dhirubhai Ambani Institute of Information and Communication Technology", "aff_unique_dep": "", "aff_unique_url": "https://www.daiict.ac.in", "aff_unique_abbr": "DA-IICT", "aff_campus_unique_index": "0", "aff_campus_unique": "Gandhinagar;", "aff_country_unique_index": "0;0", "aff_country_unique": "India" }, { "id": "7Hf4Wtc8uW", "title": "Variational Bayes Classifier", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Classifiers have traditionally been designed as fully-observed models. These classifiers are generally deterministic, so they are able to obtain a single output per input. 
The problem with this is that in this scenario it is not usually possible to capture the model uncertainty. On the other hand, Bayesian models offer the ability to capture this uncertainty, but usually have a higher computational cost. In this paper we propose to build a classifier as a latent variable model. This latent variable corresponds to what is usually called embedding and with our proposal we can model its distribution, which has two fundamental advantages. The first is that by knowing the distribution of the embeddings, the uncertainty of the predictions can be estimated. In addition, certain conditions can be imposed on the distribution of the embeddings to favor aspects such as interclass separation. We also propose an evidence lower bound to optimize the parameters of this classifier which can be maximized using stochastic gradient methods. Finally, we give two alternatives to implement these models using neural networks and demonstrate empirically the theoretical advantages of our proposal using different architectures and datasets.", "keywords": "embeddings organization;calibrated classification;variational classifier", "primary_area": "probabilistic methods (Bayesian methods, variational inference, sampling, UQ, etc.)", "supplementary_material": "/attachment/76a3d790c197c181ceb24e0c74ecd4265d93b142.zip", "author": "Antonio Almud\u00e9var;Alfonso Ortega;Antonio Miguel;Luis Vicente;Eduardo Lleida", "authorids": "~Antonio_Almud\u00e9var1;~Alfonso_Ortega2;~Antonio_Miguel1;~Luis_Vicente1;~Eduardo_Lleida1", "gender": "M;M;;M;", "homepage": "https://vivolab.i3a.es/antonio-almudevar/;http://alfonso.vivolab.es;https://vivolab.i3a.es/antonio-miguel/;;https://vivolab.i3a.es/eduardo-lleida/", "dblp": "333/6950;121/1854-1.html;;;14/4997", "google_scholar": "https://scholar.google.com/citations?hl=es;https://scholar.google.es/citations?hl=es;https://scholar.google.com/citations?hl=es;https://scholar.google.es/citations?user=pOEAiugAAAAJ;https://scholar.google.es/citations?hl=es", "orcid": ";0000-0002-3886-7748;0000-0001-5803-4316;0000-0003-4391-5203;0000-0001-9137-4013", "linkedin": ";;antonio-miguel-78792410/;luisvicenteborruel/;https://linkedin.com/in/eduardolleida", "or_profile": "~Antonio_Almud\u00e9var1;~Alfonso_Ortega2;~Antonio_Miguel1;~Luis_Vicente1;~Eduardo_Lleida1", "aff": "Universidad de Zaragoza;Universidad de Zaragoza;Universidad de Zaragoza;Universidad de Zaragoza;Universidad de Zaragoza", "aff_domain": "unizar.es;unizar.es;unizar.es;unizar.es;unizar.es", "position": "PhD student;Associate Professor;Associate Professor;Associate Professor;Full Professor", "bibtex": "@misc{\nalmud{\\'e}var2024variational,\ntitle={Variational Bayes Classifier},\nauthor={Antonio Almud{\\'e}var and Alfonso Ortega and Antonio Miguel and Luis Vicente and Eduardo Lleida},\nyear={2024},\nurl={https://openreview.net/forum?id=7Hf4Wtc8uW}\n}", "github": "", "project": "", "reviewers": "fLRd;pf4E;QwG7;KP2i", "site": "https://openreview.net/forum?id=7Hf4Wtc8uW", "pdf_size": 617254, "rating": "3;5;5;5", "confidence": "3;4;3;4", "soundness": "3;3;2;3", "contribution": "2;2;2;2", "presentation": "3;3;2;2", "wc_summary": "72;100;74;39", "wc_strengths": "57;85;73;69", "wc_weaknesses": "159;468;101;193", "wc_questions": "147;1;450;4", "wc_review": "435;654;698;305", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.5, 0.8660254037844386 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], 
"contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 71.25, 21.649191670822262 ], "wc_strengths_avg": [ 71.0, 10.0 ], "wc_weaknesses_avg": [ 230.25, 141.15129294483987 ], "wc_questions_avg": [ 150.5, 182.70536390593463 ], "wc_review_avg": [ 523.0, 160.51012429127329 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.5773502691896257, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:HfhhSe8DOPsJ:scholar.google.com/&scioq=Variational+Bayes+Classifier&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;0;0;0;0", "aff_unique_norm": "Universidad de Zaragoza", "aff_unique_dep": "", "aff_unique_url": "https://www.unizar.es", "aff_unique_abbr": "UNIZAR", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "Spain" }, { "id": "7HfliVAtCG", "title": "Detect Every Thing with Few Examples", "track": "main", "status": "Reject", "tldr": "", "abstract": "Open-set object detection aims at detecting arbitrary categories beyond those seen during training. Most recent advancements have adopted the open-vocabulary paradigm, utilizing vision-language backbones to represent categories with language. In this paper, we introduce DE-ViT, an open-set object detector that employs vision-only DINOv2 backbones and learns new categories through example images instead of language. To improve general detection ability, we transform multi-classification tasks into binary classification tasks while bypassing per-class inference, and propose a novel region propagation technique for localization. We evaluate DE-ViT on open-vocabulary, few-shot, and one-shot object detection benchmark with COCO and LVIS. For COCO, DE-ViT outperforms the open-vocabulary SoTA by 6.9 AP50 and achieves 50 AP50 in novel classes. DE-ViT surpasses the few-shot SoTA by 15 mAP on 10-shot and 7.2 mAP on 30-shot and one-shot SoTA by 2.8 AP50. 
For LVIS, DE-ViT outperforms the open-vocabulary SoTA by 2.2 mask AP and reaches 34.3 mask APr.", "keywords": "Few-shot;Object detection;Open-vocabulary", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Xinyu Zhang;Yuting Wang;Abdeslam Boularias", "authorids": "~Xinyu_Zhang7;~Yuting_Wang2;~Abdeslam_Boularias1", "gender": "M;;M", "homepage": "https://mlzxy.github.io/;;http://rl.cs.rutgers.edu/", "dblp": ";09/8269-4;57/2269", "google_scholar": "M7hnG9oAAAAJ;o9V5WAYAAAAJ;https://scholar.google.com.tw/citations?user=8AF3RCsAAAAJ", "orcid": ";;", "linkedin": ";;", "or_profile": "~Xinyu_Zhang7;~Yuting_Wang2;~Abdeslam_Boularias1", "aff": "Rutgers University;Amazon;, Rutgers University", "aff_domain": "rutgers.edu;amazon.com;cs.rutgers.edu", "position": "PhD student;Researcher;Associate Professor", "bibtex": "@misc{\nzhang2024detect,\ntitle={Detect Every Thing with Few Examples},\nauthor={Xinyu Zhang and Yuting Wang and Abdeslam Boularias},\nyear={2024},\nurl={https://openreview.net/forum?id=7HfliVAtCG}\n}", "github": "", "project": "", "reviewers": "Vm41;f8VP;bhpM;Jjnu", "site": "https://openreview.net/forum?id=7HfliVAtCG", "pdf_size": 9368714, "rating": "5;5;6;6", "confidence": "5;4;4;4", "soundness": "2;2;3;3", "contribution": "2;2;3;3", "presentation": "3;3;3;3", "wc_summary": "63;46;105;79", "wc_strengths": "39;14;56;37", "wc_weaknesses": "204;83;18;284", "wc_questions": "11;4;197;4", "wc_review": "317;147;376;404", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "1944;2224;1480;997", "reply_reviewers": "0;0;0;0", "reply_authors": "3;5;3;2", "rating_avg": [ 5.5, 0.5 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 73.25, 21.72987574745884 ], "wc_strengths_avg": [ 36.5, 14.941552797483935 ], "wc_weaknesses_avg": [ 147.25, 103.38610883479463 ], "wc_questions_avg": [ 54.0, 82.61053201620238 ], "wc_review_avg": [ 311.0, 99.7572052535555 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 1661.25, 466.5604864323596 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 3.25, 1.0897247358851685 ], "replies_avg": [ 21, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 23, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=2956108232415386259&as_sdt=400005&sciodt=0,14&hl=en", "gs_version_total": 5, "aff_unique_index": "0;1;0", "aff_unique_norm": "Rutgers University;Amazon", "aff_unique_dep": ";Amazon.com, Inc.", "aff_unique_url": "https://www.rutgers.edu;https://www.amazon.com", "aff_unique_abbr": "Rutgers;Amazon", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "7J0NsFXnFd", "title": "Optimal Action Abstraction for Imperfect Information Extensive-Form Games", "track": "main", "status": "Reject", "tldr": "", "abstract": "Action abstraction is critical for solving imperfect information extensive-form games (IIEFGs) with large action spaces. However, due to the large number of states and high computational complexity in IIEFGs, existing methods often focus on using a fixed abstraction, which can result in sub-optimal performance. To tackle this issue, we propose a novel Markov Decision Process (MDP) formulation for finding the optimal (and possibly state-dependent) action abstraction. 
Specifically, the state of the MDP is defined as the public information of the game, each action is a feature vector representing a particular action abstraction, and the reward is defined as the expected value difference between the selected action abstraction and a default fixed action abstraction. Based on this MDP, we build a game tree with the action abstraction selected by reinforcement learning (RL), and solve for the optimal strategy based on counterfactual regret minimization (CFR). This two-phase framework, named RL-CFR, effectively trades off computational complexity (due to CFR) and performance improvement (due to RL) for IIEFGs, and offers a novel RL-guided action abstraction selection in CFR. To demonstrate the effectiveness of RL-CFR, we apply the method to solve Heads-up No-limit (HUNL) Texas Hold'em, a popular representative benchmark for IIEFGs. Our results show that RL-CFR defeats ReBeL, one of the best fixed action abstraction-based HUNL algorithms, and a strong HUNL agent Slumbot by significant win-rate margins $64\\pm 11$ and $84\\pm 17$ mbb/hand, respectively.", "keywords": "Game Theory;Imperfect Information Games;Extensive-Form Games;Regret Minimization;Reinforcement Learning;Texas Hold'em", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/98566200990017f081b3b26726c2443862776056.pdf", "author": "Boning Li;Zhixuan Fang;Longbo Huang", "authorids": "~Boning_Li3;~Zhixuan_Fang1;~Longbo_Huang2", "gender": "M;M;M", "homepage": "https://lbn187.github.io/;https://people.iiis.tsinghua.edu.cn/~fang/;http://people.iiis.tsinghua.edu.cn/~huang/", "dblp": ";179/2243;79/7077", "google_scholar": ";0N4s3CAAAAAJ;", "orcid": ";;", "linkedin": ";;", "or_profile": "~Boning_Li3;~Zhixuan_Fang1;~Longbo_Huang2", "aff": "Tsinghua University;Tsinghua University;Tsinghua University", "aff_domain": "mail.tsinghua.edu.cn;tsinghua.edu.cn;tsinghua.edu.cn", "position": "PhD student;Assistant Professor;Full Professor", "bibtex": "@misc{\nli2024optimal,\ntitle={Optimal Action Abstraction for Imperfect Information Extensive-Form Games},\nauthor={Boning Li and Zhixuan Fang and Longbo Huang},\nyear={2024},\nurl={https://openreview.net/forum?id=7J0NsFXnFd}\n}", "github": "", "project": "", "reviewers": "YRS4;Y7tW;BWf4;3LiM", "site": "https://openreview.net/forum?id=7J0NsFXnFd", "pdf_size": 644861, "rating": "3;6;6;6", "confidence": "4;4;3;4", "soundness": "2;3;2;2", "contribution": "2;3;2;3", "presentation": "1;3;2;2", "wc_summary": "112;75;64;247", "wc_strengths": "49;88;110;119", "wc_weaknesses": "412;221;240;1434", "wc_questions": "187;68;124;1080", "wc_review": "760;452;538;2880", "wc_reply_reviewers": "238;14;0;426", "wc_reply_authors": "1272;680;912;4144", "reply_reviewers": "1;1;0;1", "reply_authors": "4;2;2;8", "rating_avg": [ 5.25, 1.299038105676658 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.0, 0.7071067811865476 ], "wc_summary_avg": [ 124.5, 72.92633269265636 ], "wc_strengths_avg": [ 91.5, 27.004629232781554 ], "wc_weaknesses_avg": [ 576.75, 500.49444302609396 ], "wc_questions_avg": [ 364.75, 415.08997518610346 ], "wc_review_avg": [ 1157.5, 1000.8150428525743 ], "wc_reply_reviewers_avg": [ 169.5, 175.63812228556762 ], "wc_reply_authors_avg": [ 1752.0, 1397.036864223704 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 4.0, 2.449489742783178 ], "replies_avg": [ 25, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 
-0.3333333333333333, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:GQzfbIjeHbUJ:scholar.google.com/&scioq=Optimal+Action+Abstraction+for+Imperfect+Information+Extensive-Form+Games&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;0", "aff_unique_norm": "Tsinghua University", "aff_unique_dep": "", "aff_unique_url": "https://www.tsinghua.edu.cn", "aff_unique_abbr": "THU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "China" }, { "id": "7JRbs3i9Ei", "title": "Machine Learning for PROTAC Engineering", "track": "main", "status": "Reject", "tldr": "", "abstract": "PROTACs are a promising therapeutic technology that harnesses the cell's built-in degradation processes to degrade specific proteins. Despite their potential, developing new PROTAC molecules is challenging and requires significant expertise, time, and cost. Meanwhile, machine learning has transformed various scientific fields, including drug development. In this work, we present a strategy for curating open-source PROTAC data and propose an open-source toolkit for predicting the degradation effectiveness, i.e., activity, of novel PROTAC molecules. We organized the curated data into 16 different datasets ready to be processed by machine learning models. The datasets incorporate important features such as $pDC_{50}$, $D_{max}$, E3 ligase type, POI amino acid sequence, and experimental cell type. Our toolkit includes a configurable PyTorch dataset class tailored to process PROTAC features, a customizable machine learning model for processing various PROTAC features, and a hyperparameter optimization mechanism powered by Optuna. To evaluate the system, three surrogate models were developed utilizing different PROTAC representations. Using our automatically-curated public datasets, the best models achieved a 71.4% validation accuracy and a 0.73 ROC-AUC validation score. 
This is not only comparable to state-of-the-art models for protein degradation prediction, but also open-source, easily-reproducible, and less computationally complex than existing approaches.", "keywords": "Deep learning;Chemoinformatics;PROTAC;Drug design.", "primary_area": "applications to physical sciences (physics, chemistry, biology, etc.)", "supplementary_material": "", "author": "Stefano Ribes;Eva Nittinger;Christian Tyrchan;Roc\u00edo Mercado", "authorids": "~Stefano_Ribes1;eva.nittinger@astrazeneca.com;christian.tyrchan@astrazeneca.com;~Roc\u00edo_Mercado1", "gender": "M;;;F", "homepage": ";;;https://rociomer.github.io/", "dblp": ";;;", "google_scholar": "https://scholar.google.com/citations?hl=en;;;v2P0-IoAAAAJ", "orcid": ";;;0000-0002-6170-6088", "linkedin": "stefano-ribes-1379b1107/;;;rociomer/", "or_profile": "~Stefano_Ribes1;eva.nittinger@astrazeneca.com;christian.tyrchan@astrazeneca.com;~Roc\u00edo_Mercado1", "aff": ";;;Chalmers University of Technology", "aff_domain": ";;;chalmers.se", "position": ";;;Assistant Professor", "bibtex": "@misc{\nribes2024machine,\ntitle={Machine Learning for {PROTAC} Engineering},\nauthor={Stefano Ribes and Eva Nittinger and Christian Tyrchan and Roc{\\'\\i}o Mercado},\nyear={2024},\nurl={https://openreview.net/forum?id=7JRbs3i9Ei}\n}", "github": "", "project": "", "reviewers": "A2WQ;qQeP;BNfR", "site": "https://openreview.net/forum?id=7JRbs3i9Ei", "pdf_size": 798945, "rating": "3;5;5", "confidence": "4;3;4", "soundness": "1;2;3", "contribution": "1;2;2", "presentation": "2;2;2", "wc_summary": "193;33;99", "wc_strengths": "210;43;213", "wc_weaknesses": "222;19;110", "wc_questions": "48;369;66", "wc_review": "673;464;488", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 4.333333333333333, 0.9428090415820634 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.0, 0.816496580927726 ], "contribution_avg": [ 1.6666666666666667, 0.4714045207910317 ], "presentation_avg": [ 2.0, 0.0 ], "wc_summary_avg": [ 108.33333333333333, 65.65228268858762 ], "wc_strengths_avg": [ 155.33333333333334, 79.44110327084391 ], "wc_weaknesses_avg": [ 117.0, 83.02208541506691 ], "wc_questions_avg": [ 161.0, 147.26167186338745 ], "wc_review_avg": [ 541.6666666666666, 93.3821301011185 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 8, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.49999999999999983, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:MDX2luF9r44J:scholar.google.com/&scioq=Machine+Learning+for+PROTAC+Engineering&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0", "aff_unique_norm": "Chalmers University of Technology", "aff_unique_dep": "", "aff_unique_url": "https://www.chalmers.se", "aff_unique_abbr": "Chalmers", "aff_country_unique_index": "0", "aff_country_unique": "Sweden" }, { "id": "7JU8TwFXGC", "title": "LLM Performance Predictors are good initializers for Architecture Search", "track": "main", "status": "Reject", "tldr": "", "abstract": "Large language models (LLMs) have become an integral component in solving a wide range of NLP tasks. In this work, we explore a novel use case of using LLMs to build performance predictors (PP): models that, given a specific deep neural network architecture, predict its performance on a downstream task. 
We design PP prompts for LLMs consisting of: (i) role: description of the role assigned to the LLM, (ii) instructions: set of instructions to be followed by the LLM to carry out performance prediction, (iii) hyperparameters: a definition of each architecture-specific hyperparameter and (iv) demonstrations: sample architectures along with their efficiency metrics and 'training from scratch' performance. For machine translation (MT) tasks, we discover that GPT-4 with our PP prompts (LLM-PP) can predict the performance of architecture with a mean absolute error matching the SOTA and a marginal degradation in rank correlation coefficient compared to SOTA performance predictors. Further, we show that the predictions from LLM-PP can be distilled to a small regression model (LLM-Distill-PP). LLM-Distill-PP models surprisingly retain the performance of LLM-PP largely and can be a cost-effective alternative for heavy use cases of performance estimation. Specifically, for neural architecture search (NAS), we propose a Hybrid-Search algorithm for NAS (HS-NAS), which uses LLM-Distill-PP for the initial part of search, resorting to the baseline predictor for rest of the search. We show that HS-NAS performs very similar to SOTA NAS across benchmarks, reduces search hours by \u223c50%, and in some cases, improves latency, GFLOPs, and model size.", "keywords": "Large language models;Neural architecture search;Performance Predictor;Machine Translation", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Ganesh Jawahar;Muhammad Abdul-Mageed;Laks V. S. Lakshmanan;Dujian Ding", "authorids": "~Ganesh_Jawahar1;~Muhammad_Abdul-Mageed2;~Laks_V._S._Lakshmanan1;~Dujian_Ding1", "gender": "M;;;", "homepage": "https://ganeshjawahar.github.io/;;https://www.cs.ubc.ca/~laks;", "dblp": "203/9710;;l/LVSLakshmanan;244/8792", "google_scholar": "https://scholar.google.co.in/citations?user=X7SMP1EAAAAJ;;https://scholar.google.ca/citations?user=_RCsaOsAAAAJ;https://scholar.google.ca/citations?user=1-FsZPQAAAAJ", "orcid": ";;0000-0002-9775-4241;", "linkedin": "https://in.linkedin.com/in/ganesh-jawahar-ab928435;;laksvslakshmanan/;dujian-ding-250123133/", "or_profile": "~Ganesh_Jawahar1;~Muhammad_Abdul-Mageed2;~Laks_V._S._Lakshmanan1;~Dujian_Ding1", "aff": "University of British Columbia;;University of British Columbia;Computing Science, University of British Columbia", "aff_domain": "ubc.ca;;ubc.ca;cs.ubc.ca", "position": "PhD student;;Professor;PhD student", "bibtex": "@misc{\njawahar2024llm,\ntitle={{LLM} Performance Predictors are good initializers for Architecture Search},\nauthor={Ganesh Jawahar and Muhammad Abdul-Mageed and Laks V. S. 
Lakshmanan and Dujian Ding},\nyear={2024},\nurl={https://openreview.net/forum?id=7JU8TwFXGC}\n}", "github": "", "project": "", "reviewers": "mogH;oJTh;ABPv;GzhX", "site": "https://openreview.net/forum?id=7JU8TwFXGC", "pdf_size": 536989, "rating": "3;5;6;6", "confidence": "4;4;4;3", "soundness": "1;2;3;3", "contribution": "1;3;3;3", "presentation": "3;2;3;1", "wc_summary": "43;84;58;68", "wc_strengths": "28;83;185;41", "wc_weaknesses": "206;326;102;95", "wc_questions": "4;28;85;50", "wc_review": "281;521;430;254", "wc_reply_reviewers": "165;240;44;0", "wc_reply_authors": "1285;1546;801;549", "reply_reviewers": "1;1;1;0", "reply_authors": "2;2;1;1", "rating_avg": [ 5.0, 1.224744871391589 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.25, 0.82915619758885 ], "contribution_avg": [ 2.5, 0.8660254037844386 ], "presentation_avg": [ 2.25, 0.82915619758885 ], "wc_summary_avg": [ 63.25, 14.922717580923388 ], "wc_strengths_avg": [ 84.25, 61.617266248998746 ], "wc_weaknesses_avg": [ 182.25, 93.91585329431874 ], "wc_questions_avg": [ 41.75, 29.80247472945829 ], "wc_review_avg": [ 371.5, 109.28060212132802 ], "wc_reply_reviewers_avg": [ 112.25, 95.34247479481535 ], "wc_reply_authors_avg": [ 1045.25, 391.83949201171646 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.4714045207910316, "gs_citation": 13, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=712574979734589959&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "aff_unique_index": "0;0;0", "aff_unique_norm": "University of British Columbia", "aff_unique_dep": "", "aff_unique_url": "https://www.ubc.ca", "aff_unique_abbr": "UBC", "aff_campus_unique_index": "1", "aff_campus_unique": ";Vancouver", "aff_country_unique_index": "0;0;0", "aff_country_unique": "Canada" }, { "id": "7Jer2DQt9V", "title": "The Unreasonable Effectiveness of Pretraining in Graph OOD", "track": "main", "status": "Reject", "tldr": "", "abstract": "Graph neural networks have shown significant progress in various tasks, yet their ability to generalize in out-of-distribution (OOD) scenarios remains an open question. In this study, we conduct a comprehensive benchmarking of the efficacy of graph pre-trained models in the context of OOD challenges, named PODGenGraph. We conduct extensive experiments across diverse datasets, spanning general and molecular graph domains and encompassing different graph sizes. Our benchmark is framed around distinct distribution shifts, including both concept and covariate shifts, whilst also varying the degree of shift. Our findings are striking: even basic pre-trained models exhibit performance that is not only comparable to, but often surpasses, that of models specifically designed to handle distribution shift. We further investigate the results, examining the influence of the key factors (e.g., sample size, learning rates, in-distribution performance, etc.) of pre-trained models for OOD generalization. In general, our work shows that pre-training could be a flexible and simple approach to OOD generalization in graph learning. Leveraging pre-trained models together for graph OOD generalization in real-world applications stands as a promising avenue for future research.", "keywords": "Graph pre-training;Graph out of distribution", "primary_area": "datasets and benchmarks", "supplementary_material": "/attachment/f6031b9f3f6b1d563bf73f57f72d57225c61d6b9.pdf", "author": "Qi Liu;Rosa H. M. 
Chan;Rose Yu", "authorids": "~Qi_Liu8;~Rosa_H._M._Chan1;~Rose_Yu1", "gender": ";F;F", "homepage": "https://www.qi-liu.com/;https://www.ee.cityu.edu.hk/~rosachan;http://roseyu.com", "dblp": ";86/7576;164/7314", "google_scholar": ";n71R2h8AAAAJ;", "orcid": ";;", "linkedin": ";;", "or_profile": "~Qi_Liu8;~Rosa_H._M._Chan1;~Rose_Yu1", "aff": "City University of Hong Kong;City University of Hong Kong;University of California, San Diego", "aff_domain": "cityu.edu.hk;cityu.edu.hk;ucsd.edu", "position": "PhD student;Associate Professor;Assistant Professor", "bibtex": "@misc{\nliu2024the,\ntitle={The Unreasonable Effectiveness of Pretraining in Graph {OOD}},\nauthor={Qi Liu and Rosa H. M. Chan and Rose Yu},\nyear={2024},\nurl={https://openreview.net/forum?id=7Jer2DQt9V}\n}", "github": "", "project": "", "reviewers": "RvDk;xDkS;qBm3;tP6E", "site": "https://openreview.net/forum?id=7Jer2DQt9V", "pdf_size": 1404820, "rating": "3;5;5;5", "confidence": "4;4;4;4", "soundness": "2;3;2;3", "contribution": "2;2;2;3", "presentation": "3;2;3;2", "wc_summary": "58;73;80;84", "wc_strengths": "49;27;56;134", "wc_weaknesses": "156;244;295;220", "wc_questions": "12;2;43;70", "wc_review": "275;346;474;508", "wc_reply_reviewers": "73;48;0;0", "wc_reply_authors": "718;504;924;576", "reply_reviewers": "1;1;0;0", "reply_authors": "1;1;2;1", "rating_avg": [ 4.5, 0.8660254037844386 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 73.75, 9.908960591303208 ], "wc_strengths_avg": [ 66.5, 40.413487847499624 ], "wc_weaknesses_avg": [ 228.75, 49.97686964986903 ], "wc_questions_avg": [ 31.75, 26.76167969317322 ], "wc_review_avg": [ 400.75, 94.44409722158395 ], "wc_reply_reviewers_avg": [ 30.25, 31.514877439076294 ], "wc_reply_authors_avg": [ 680.5, 160.28958169513078 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:WzMw4lJiXFIJ:scholar.google.com/&scioq=The+Unreasonable+Effectiveness+of+Pretraining+in+Graph+OOD&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;1", "aff_unique_norm": "City University of Hong Kong;University of California, San Diego", "aff_unique_dep": ";", "aff_unique_url": "https://www.cityu.edu.hk;https://www.ucsd.edu", "aff_unique_abbr": "CityU;UCSD", "aff_campus_unique_index": "0;0;1", "aff_campus_unique": "Hong Kong SAR;San Diego", "aff_country_unique_index": "0;0;1", "aff_country_unique": "China;United States" }, { "title": "STREAM: Spatio-TempoRal Evaluation and Analysis Metric for Video Generative Models", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19367", "id": "7JfKCZQPxJ", "author_site": "Pum Jun Kim, Seojun Kim, Jaejun Yoo", "tldr": "", "abstract": "Image generative models have made significant progress in generating realistic and diverse images, supported by comprehensive guidance from various evaluation metrics. However, current video generative models struggle to generate even\nshort video clips, with limited tools that provide insights for improvements. Current video evaluation metrics are simple adaptations of image metrics by switching the embeddings with video embedding networks, which may underestimate the unique characteristics of video. 
Our analysis reveals that the widely used Frechet Video Distance (FVD) has a stronger emphasis on the spatial aspect than the temporal naturalness of video and is inherently constrained by the input size of the embedding networks used, limiting it to 16 frames. Additionally, it demonstrates considerable instability and diverges from human evaluations. To address the limitations, we propose STREAM, a new video evaluation metric uniquely designed to independently evaluate spatial and temporal aspects. This feature allows comprehensive analysis and evaluation of video generative models from various perspectives, unconstrained by video length. We provide analytical and experimental evidence demonstrating that STREAM provides an effective evaluation tool for both visual and temporal quality of videos, offering insights into area of improvement for video generative models. To the best of our knowledge, STREAM is the first evaluation metric that can separately assess the temporal and spatial aspects of videos. Our code is available at https://github.com/pro2nit/STREAM.", "keywords": "Generative Models;Video Generative Models;Evaluation;Fidelity;Diversity;Assessment", "primary_area": "generative models", "supplementary_material": "", "author": "Pum Jun Kim;Seojun Kim;Jaejun Yoo", "authorids": "~Pum_Jun_Kim1;~Seojun_Kim1;~Jaejun_Yoo1", "gender": "M;M;M", "homepage": ";;", "dblp": "349/4625;;141/8878-1", "google_scholar": "WGJgXskAAAAJ;;https://scholar.google.co.kr/citations?user=7NBlQw4AAAAJ", "orcid": "0000-0001-8220-0951;;0000-0001-5252-9668", "linkedin": ";\uc11c\uc900-\uae40-6b74a7292/;jaejunyoo/", "or_profile": "~Pum_Jun_Kim1;~Seojun_Kim1;~Jaejun_Yoo1", "aff": "Ulsan National Institute of Science and Technology;Ulsan National Institute of Science and Technology;Ulsan National Institute of Science and Technology", "aff_domain": "unist.ac.kr;unist.ac.kr;unist.ac.kr", "position": "PhD student;MS student;Assistant Professor", "bibtex": "@inproceedings{\nkim2024stream,\ntitle={{STREAM}: Spatio-TempoRal Evaluation and Analysis Metric for Video Generative Models},\nauthor={Pum Jun Kim and Seojun Kim and Jaejun Yoo},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=7JfKCZQPxJ}\n}", "github": "", "project": "", "reviewers": "rxEA;srFK;1pjF;QwpP", "pdf_size": 5353516, "rating": "3;6;6;6", "confidence": "5;4;4;4", "soundness": "2;3;3;3", "contribution": "2;2;3;3", "presentation": "3;3;2;2", "wc_summary": "41;94;94;48", "wc_strengths": "32;270;63;61", "wc_weaknesses": "43;351;158;75", "wc_questions": "185;95;2;41", "wc_review": "301;810;317;225", "wc_reply_reviewers": "0;129;41;0", "wc_reply_authors": "1191;659;528;648", "reply_reviewers": "0;1;1;0", "reply_authors": "3;1;1;1", "rating_avg": [ 5.25, 1.299038105676658 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 69.25, 24.873429598670143 ], "wc_strengths_avg": [ 106.5, 95.19059827524985 ], "wc_weaknesses_avg": [ 156.75, 119.74634649959054 ], "wc_questions_avg": [ 80.75, 68.65265836076561 ], "wc_review_avg": [ 413.25, 231.68553580230252 ], "wc_reply_reviewers_avg": [ 42.5, 52.671149598238316 ], "wc_reply_authors_avg": [ 756.5, 256.06688579353636 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.5, 0.8660254037844386 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -1.0, "gs_citation": 5, 
"gs_cited_by_link": "https://scholar.google.com/scholar?cites=17515982151271475644&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=7JfKCZQPxJ", "pdf": "https://openreview.net/pdf?id=7JfKCZQPxJ", "email": "unist.ac.kr;unist.ac.kr;unist.ac.kr", "author_num": 3, "aff_unique_index": "0;0;0", "aff_unique_norm": "Ulsan National Institute of Science and Technology", "aff_unique_dep": "", "aff_unique_url": "https://www.unist.ac.kr", "aff_unique_abbr": "UNIST", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "South Korea" }, { "id": "7JigPd5Pm5", "title": "Informed weight initialization of Graph Neural Networks and its effect on Oversmoothing", "track": "main", "status": "Reject", "tldr": "", "abstract": "In this work, we generalize the ideas of Kaiming initialization to Graph Neural Networks (GNNs) and propose a new initialization scheme that addresses the problem of oversmoothing. GNNs are typically initialized using methods, that have been designed for other types of Neural Networks, such as Xavier or Kaiming initialization. Such methods ignore the underlying topology of the graph. In this work, propose a new initialization method, called G-Init, which takes into account (a) the variance of signals flowing forward, (b) the gradients flowing backward\nin the network, and (c) the effect of graph convolution, which tends to smooth node representations and lead to the problem of oversmoothing. Oversmoothing is an inherent problem of GNNs, which appears when their depth increases, making node representations indistinguishable. We show that in deep GNNs, G-Init reduces oversmoothing and enables deep architectures. We also verify the theoretical results experimentally.", "keywords": "Graph Neural Networks;Weight initialization;Oversmoothing", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Dimitrios Kelesis;Dimitris Fotakis;Georgios Paliouras", "authorids": "~Dimitrios_Kelesis1;~Dimitris_Fotakis1;~Georgios_Paliouras1", "gender": ";M;M", "homepage": ";http://www.softlab.ntua.gr/~fotakis/;https://users.iit.demokritos.gr/~paliourg", "dblp": "309/5763;95/4731;55/2039", "google_scholar": ";zFDLf0UAAAAJ;-pec7wIAAAAJ", "orcid": ";0000-0001-6864-8960;0000-0001-9629-2367", "linkedin": "dimitrios-kelesis-b614451b5/;;georgios-paliouras-a203a79/", "or_profile": "~Dimitrios_Kelesis1;~Dimitris_Fotakis1;~Georgios_Paliouras1", "aff": "National Centre For Scientific Research Demokritos;National Technical University of Athens;NCSR \u201cDemokritos\u201d", "aff_domain": "iit.demokritos.gr;ntua.gr;demokritos.gr", "position": "Researcher;Full Professor;Researcher", "bibtex": "@misc{\nkelesis2024informed,\ntitle={Informed weight initialization of Graph Neural Networks and its effect on Oversmoothing},\nauthor={Dimitrios Kelesis and Dimitris Fotakis and Georgios Paliouras},\nyear={2024},\nurl={https://openreview.net/forum?id=7JigPd5Pm5}\n}", "github": "", "project": "", "reviewers": "8Vyh;fihQ;kvnA;FoM5", "site": "https://openreview.net/forum?id=7JigPd5Pm5", "pdf_size": 240711, "rating": "1;3;3;3", "confidence": "4;4;3;4", "soundness": "1;1;2;3", "contribution": "2;1;2;1", "presentation": "1;2;2;1", "wc_summary": "54;356;86;51", "wc_strengths": "20;27;24;24", "wc_weaknesses": "255;574;4;108", "wc_questions": "44;3;326;1", "wc_review": "373;960;440;184", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": 
"0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 2.5, 0.8660254037844386 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 1.75, 0.82915619758885 ], "contribution_avg": [ 1.5, 0.5 ], "presentation_avg": [ 1.5, 0.5 ], "wc_summary_avg": [ 136.75, 127.32512517174291 ], "wc_strengths_avg": [ 23.75, 2.48746859276655 ], "wc_weaknesses_avg": [ 235.25, 214.94810420192127 ], "wc_questions_avg": [ 93.5, 135.32645713237304 ], "wc_review_avg": [ 489.25, 287.54249685915994 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 6, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.3333333333333333, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:KdTdcnEWWEMJ:scholar.google.com/&scioq=Informed+weight+initialization+of+Graph+Neural+Networks+and+its+effect+on+Oversmoothing&hl=en&as_sdt=0,48", "gs_version_total": 0, "aff_unique_index": "0;1;2", "aff_unique_norm": "National Centre for Scientific Research 'Demokritos';National Technical University of Athens;National Centre for Scientific Research \u201cDemokritos\u201d", "aff_unique_dep": ";;", "aff_unique_url": "https://www.demokritos.gr;https://www.ntua.gr;https://www.demokritos.gr", "aff_unique_abbr": "NCSR Demokritos;NTUA;NCSR Demokritos", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "Greece" }, { "title": "AutoDAN: Generating Stealthy Jailbreak Prompts on Aligned Large Language Models", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19366", "id": "7Jwpw4qKkb", "author_site": "Xiaogeng Liu, Nan Xu, Muhao Chen, Chaowei Xiao", "tldr": "", "abstract": "The aligned Large Language Models (LLMs) are powerful language understanding and decision-making tools that are created through extensive alignment with human feedback. However, these large models remain susceptible to jailbreak attacks, where adversaries manipulate prompts to elicit malicious outputs that should not be given by aligned LLMs. Investigating jailbreak prompts can lead us to delve into the limitations of LLMs and further guide us to secure them. Unfortunately, existing jailbreak techniques suffer from either (1) scalability issues, where attacks heavily rely on manual crafting of prompts, or (2) stealthiness problems, as attacks depend on token-based algorithms to generate prompts that are often semantically meaningless, making them susceptible to detection through basic perplexity testing. In light of these challenges, we intend to answer this question: Can we develop an approach that can automatically generate stealthy jailbreak prompts? In this paper, we introduce AutoDAN, a novel jailbreak attack against aligned LLMs. AutoDAN can automatically generate stealthy jailbreak prompts by the carefully designed hierarchical genetic algorithm. Extensive evaluations demonstrate that AutoDAN not only automates the process while preserving semantic meaningfulness, but also demonstrates superior attack strength in cross-model transferability, and cross-sample universality compared with the baseline. Moreover, we also compare AutoDAN with perplexity-based defense methods and show that AutoDAN can bypass them effectively. 
Code is available at https://github.com/SheltonLiu-N/AutoDAN.", "keywords": "Large Language Models;Jailbreak Attack;Adversarial Attack", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Xiaogeng Liu;Nan Xu;Muhao Chen;Chaowei Xiao", "authorids": "~Xiaogeng_Liu1;~Nan_Xu2;~Muhao_Chen1;~Chaowei_Xiao2", "gender": "M;F;M;M", "homepage": ";https://sites.google.com/site/xunannancy;https://muhaochen.github.io/;https://xiaocw11.github.io/", "dblp": "304/1538;;173/2608;150/3317", "google_scholar": "Gvs5nz8AAAAJ;https://scholar.google.co.uk/citations?hl=en;k79yEZkAAAAJ;Juoqtj8AAAAJ", "orcid": ";;0000-0003-0118-3147;0000-0002-7043-4926", "linkedin": ";https://linkedin.com/in/nan-xu-b52777125;;", "or_profile": "~Xiaogeng_Liu1;~Nan_Xu2;~Muhao_Chen1;~chaowei_xiao1", "aff": "University of Wisconsin - Madison;University of Southern California;University of Southern California;NVIDIA", "aff_domain": "wisc.edu;usc.edu;usc.edu;nvidia.com", "position": "PhD student;PhD student;Adjunct Professor;Researcher", "bibtex": "@inproceedings{\nliu2024autodan,\ntitle={Auto{DAN}: Generating Stealthy Jailbreak Prompts on Aligned Large Language Models},\nauthor={Xiaogeng Liu and Nan Xu and Muhao Chen and Chaowei Xiao},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=7Jwpw4qKkb}\n}", "github": "", "project": "", "reviewers": "6bTy;UziC;QEyR;GPCZ", "pdf_size": 514653, "rating": "6;6;8;8", "confidence": "4;4;4;3", "soundness": "2;3;3;2", "contribution": "2;2;3;3", "presentation": "2;3;3;4", "wc_summary": "45;78;19;71", "wc_strengths": "33;48;42;53", "wc_weaknesses": "130;311;51;101", "wc_questions": "141;6;5;84", "wc_review": "349;443;117;309", "wc_reply_reviewers": "69;0;0;23", "wc_reply_authors": "1048;1606;105;1835", "reply_reviewers": "1;0;0;1", "reply_authors": "6;5;1;9", "rating_avg": [ 7.0, 1.0 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 53.25, 23.284920012746447 ], "wc_strengths_avg": [ 44.0, 7.44983221287567 ], "wc_weaknesses_avg": [ 148.25, 98.12078016404068 ], "wc_questions_avg": [ 59.0, 57.17079674099356 ], "wc_review_avg": [ 304.5, 118.6791894141513 ], "wc_reply_reviewers_avg": [ 23.0, 28.16913204200655 ], "wc_reply_authors_avg": [ 1148.5, 667.0046851409666 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 5.25, 2.8613807855648994 ], "replies_avg": [ 30, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 508, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6354376323759784601&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=7Jwpw4qKkb", "pdf": "https://openreview.net/pdf?id=7Jwpw4qKkb", "email": "wisc.edu;usc.edu;usc.edu;nvidia.com", "author_num": 4, "aff_unique_index": "0;1;1;2", "aff_unique_norm": "University of Wisconsin-Madison;University of Southern California;NVIDIA", "aff_unique_dep": ";;NVIDIA Corporation", "aff_unique_url": "https://www.wisc.edu;https://www.usc.edu;https://www.nvidia.com", "aff_unique_abbr": "UW-Madison;USC;NVIDIA", "aff_campus_unique_index": "0;1;1", "aff_campus_unique": "Madison;Los Angeles;", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "title": "A Foundation Model for Error Correction Codes", "status": "Poster", "track": "main", "site": 
"https://iclr.cc/virtual/2024/poster/19365", "id": "7KDuQPrAF3", "author_site": "Yoni Choukroun, Lior Wolf", "tldr": "", "abstract": "In recent years, Artificial Intelligence has undergone a paradigm shift with the rise of foundation models, which are trained on large amounts of data, typically in a self-supervised way, and can then be adapted to a wide range of downstream tasks. In this work, we propose the first foundation model for Error Correction Codes. This model is trained on multiple codes and can then be applied to an unseen code. To enable this, we extend the Transformer architecture in multiple ways: (1) a code-invariant initial embedding, which is also position- and length-invariant, (2) a learned modulation of the attention maps that is conditioned on the Tanner graph, and (3) a length-invariant code-aware noise prediction module that is based on the parity-check matrix. The proposed architecture is trained on multiple short- and medium-length codes and is able to generalize to unseen codes. Its performance on these codes matches and even outperforms the state of the art, despite having a smaller capacity than the leading code-specific transformers. The suggested framework therefore demonstrates, for the first time, the benefits of learning a universal decoder rather than a neural decoder optimized for a given code.", "keywords": "Error Correction Codes;Foundation Model", "primary_area": "applications to physical sciences (physics, chemistry, biology, etc.)", "supplementary_material": "", "author": "Yoni Choukroun;Lior Wolf", "authorids": "~Yoni_Choukroun1;~Lior_Wolf1", "gender": "M;M", "homepage": "https://yonilc.github.io/;http://www.cs.tau.ac.il/~wolf", "dblp": "186/8305;83/4103", "google_scholar": "https://scholar.google.co.il/citations?user=gjo4ebcAAAAJ;UbFrXTsAAAAJ", "orcid": ";0000-0001-5578-8892", "linkedin": ";", "or_profile": "~Yoni_Choukroun1;~Lior_Wolf1", "aff": "Huawei Technologies Ltd.;Tel Aviv University", "aff_domain": "huawei.com;tau.ac.il", "position": "Principal Researcher;Full Professor", "bibtex": "@inproceedings{\nchoukroun2024a,\ntitle={A Foundation Model for Error Correction Codes},\nauthor={Yoni Choukroun and Lior Wolf},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=7KDuQPrAF3}\n}", "github": "", "project": "", "reviewers": "w8i1;dPJy;jdxb;1rnF", "pdf_size": 1667896, "rating": "3;6;8;8", "confidence": "4;3;4;5", "soundness": "3;3;4;4", "contribution": "2;3;3;4", "presentation": "3;2;3;4", "wc_summary": "121;92;105;64", "wc_strengths": "53;69;179;21", "wc_weaknesses": "346;144;154;13", "wc_questions": "119;36;1;13", "wc_review": "639;341;439;111", "wc_reply_reviewers": "605;231;0;0", "wc_reply_authors": "2180;1054;254;86", "reply_reviewers": "2;2;0;0", "reply_authors": "5;3;1;1", "rating_avg": [ 6.25, 2.0463381929681126 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 3.5, 0.5 ], "contribution_avg": [ 3.0, 0.7071067811865476 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 95.5, 20.886598574205422 ], "wc_strengths_avg": [ 80.5, 59.43694137487224 ], "wc_weaknesses_avg": [ 164.25, 118.7694720877381 ], "wc_questions_avg": [ 42.25, 46.06177916668005 ], "wc_review_avg": [ 382.5, 190.01249958884284 ], "wc_reply_reviewers_avg": [ 209.0, 247.31659871508828 ], "wc_reply_authors_avg": [ 893.5, 827.9279859987823 ], "reply_reviewers_avg": [ 1.0, 1.0 ], "reply_authors_avg": [ 2.5, 1.6583123951777 ], "replies_avg": [ 20, 0 ], "authors#_avg": 
[ 2, 0 ], "corr_rating_confidence": 0.34554737023254406, "gs_citation": 9, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=15745966124655371585&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 2, "openreview": "https://openreview.net/forum?id=7KDuQPrAF3", "pdf": "https://openreview.net/pdf?id=7KDuQPrAF3", "email": "huawei.com;tau.ac.il", "author_num": 2, "aff_unique_index": "0;1", "aff_unique_norm": "Huawei;Tel Aviv University", "aff_unique_dep": "Huawei Technologies;", "aff_unique_url": "https://www.huawei.com;https://www.tau.ac.il", "aff_unique_abbr": "Huawei;TAU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1", "aff_country_unique": "China;Israel" }, { "id": "7LZjuA4AB2", "title": "Ask Your Distribution Shift if Pre-Training is Right for You", "track": "main", "status": "Reject", "tldr": "", "abstract": "Pre-training is a widely used approach to develop models that are robust to distribution shifts. However, in practice, its effectiveness varies: fine-tuning a pre-trained model improves robustness significantly in some cases but *not at all* in others (compared to training from scratch). In this work, we seek to characterize the failure modes that pre-training *can* and *cannot* address. In particular, we focus on two possible failure modes of models under distribution shift: poor extrapolation (e.g., they cannot generalize to a different domain) and biases in the training data (e.g., they rely on spurious features). Our study suggests that, as a rule of thumb, pre-training can help mitigate poor extrapolation but not dataset biases. After providing theoretical motivation and empirical evidence for this finding, we explore two of its implications for developing robust models: (1) pre-training and interventions designed to prevent exploiting biases have complementary robustness benefits, and (2) fine-tuning on a (very) small, non-diverse but *de-biased* dataset can result in significantly more robust models than fine-tuning on a large and diverse but biased dataset.", "keywords": "robustness;distribution shift;transfer learning", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "", "author": "Benjamin Cohen-Wang;Joshua Vendrow;Aleksander Madry", "authorids": "~Benjamin_Cohen-Wang1;~Joshua_Vendrow2;~Aleksander_Madry1", "gender": "M;M;M", "homepage": "https://bencw99.github.io;https://people.csail.mit.edu/madry/;http://www.joshvendrow.com", "dblp": ";67/2454;274/7218", "google_scholar": "QwJR7jEAAAAJ;SupjsEUAAAAJ;zQjuF5wAAAAJ", "orcid": ";;0000-0002-1041-5782", "linkedin": ";;joshua-vendrow/", "or_profile": "~Benjamin_Cohen-Wang1;~Aleksander_Madry1;~Joshua_Vendrow1", "aff": "Massachusetts Institute of Technology;Massachusetts Institute of Technology;Massachusetts Institute of Technology", "aff_domain": "mit.edu;mit.edu;mit.edu", "position": "PhD student;Professor;PhD student", "bibtex": "@misc{\ncohen-wang2024ask,\ntitle={Ask Your Distribution Shift if Pre-Training is Right for You},\nauthor={Benjamin Cohen-Wang and Joshua Vendrow and Aleksander Madry},\nyear={2024},\nurl={https://openreview.net/forum?id=7LZjuA4AB2}\n}", "github": "", "project": "", "reviewers": "Uetj;f9zp;cFpN;kid6", "site": "https://openreview.net/forum?id=7LZjuA4AB2", "pdf_size": 11272932, "rating": "3;3;3;3", "confidence": "4;4;3;4", "soundness": "3;1;2;1", "contribution": "1;2;2;2", "presentation": "2;2;2;2", "wc_summary": "126;80;68;135", "wc_strengths": "18;51;70;125", "wc_weaknesses": "241;566;358;431", 
"wc_questions": "84;32;24;53", "wc_review": "469;729;520;744", "wc_reply_reviewers": "0;139;56;294", "wc_reply_authors": "464;539;355;933", "reply_reviewers": "0;1;1;1", "reply_authors": "1;1;1;2", "rating_avg": [ 3.0, 0.0 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 1.75, 0.82915619758885 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 2.0, 0.0 ], "wc_summary_avg": [ 102.25, 28.74347752099596 ], "wc_strengths_avg": [ 66.0, 38.8136573901507 ], "wc_weaknesses_avg": [ 399.0, 117.85372289410293 ], "wc_questions_avg": [ 48.25, 23.19886850689059 ], "wc_review_avg": [ 615.5, 122.45101061240777 ], "wc_reply_reviewers_avg": [ 122.25, 110.80698308319742 ], "wc_reply_authors_avg": [ 572.75, 218.03712413256602 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 5, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10406340723698108579&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "aff_unique_index": "0;0;0", "aff_unique_norm": "Massachusetts Institute of Technology", "aff_unique_dep": "", "aff_unique_url": "https://web.mit.edu", "aff_unique_abbr": "MIT", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "title": "Online Continual Learning for Interactive Instruction Following Agents", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19364", "id": "7M0EzjugaN", "author_site": "Byeonghwi Kim, Minhyuk Seo, Jonghyun Choi", "tldr": "", "abstract": "In learning an embodied agent executing daily tasks via language directives, the literature largely assumes that the agent learns all training data at the beginning. We argue that such a learning scenario is less realistic, since a robotic agent is supposed to learn the world continuously as it explores and perceives it. To take a step towards a more realistic embodied agent learning scenario, we propose two continual learning setups for embodied agents; learning new behaviors (Behavior Incremental Learning, Behavior-IL) and new environments (Environment Incremental Learning, Environment-IL) For the tasks, previous \u2018data prior\u2019 based continual learning methods maintain logits for the past tasks. However, the stored information is often insufficiently learned information and requires task boundary information, which might not always be available. Here, we propose to update them based on confidence scores without task boundary information (i.e., task-free) in a moving average fashion, named Confidence-Aware Moving Average (CAMA). 
In the proposed challenging Behavior-IL and Environment-IL setups, our simple CAMA outperforms prior arts in our empirical validations by noticeable margins.", "keywords": "Embodied AI;Continual Learning", "primary_area": "applications to robotics, autonomy, planning", "supplementary_material": "", "author": "Byeonghwi Kim;Minhyuk Seo;Jonghyun Choi", "authorids": "~Byeonghwi_Kim1;~Minhyuk_Seo1;~Jonghyun_Choi1", "gender": "M;M;M", "homepage": "https://bhkim94.github.io/;https://dbd05088.github.io/;https://ppolon.github.io/", "dblp": "280/2943;350/4104;21/11103", "google_scholar": "Sr9hbXYAAAAJ;ayDPR-gAAAAJ;uiGWnm4AAAAJ", "orcid": "0000-0003-3775-2778;;0000-0002-7934-8434", "linkedin": "byeonghwi-kim-821909167;minhyuk-seo-59ba11247/;jonghyun-choi-459bb615/", "or_profile": "~Byeonghwi_Kim1;~Minhyuk_Seo1;~Jonghyun_Choi1", "aff": "Seoul National University;Yonsei University;Yonsei University", "aff_domain": "snu.ac.kr;yonsei.ac.kr;yonsei.ac.kr", "position": "PhD student;MS student;Associate Professor", "bibtex": "@inproceedings{\nkim2024online,\ntitle={Online Continual Learning for Interactive Instruction Following Agents},\nauthor={Byeonghwi Kim and Minhyuk Seo and Jonghyun Choi},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=7M0EzjugaN}\n}", "github": "", "project": "", "reviewers": "q27B;z9k5;UTbC;oYjZ", "pdf_size": 7496007, "rating": "6;6;6;6", "confidence": "2;4;4;3", "soundness": "3;3;3;3", "contribution": "2;2;3;3", "presentation": "2;3;3;3", "wc_summary": "56;129;87;110", "wc_strengths": "48;78;65;84", "wc_weaknesses": "75;260;187;100", "wc_questions": "77;152;107;48", "wc_review": "256;619;446;342", "wc_reply_reviewers": "16;118;97;0", "wc_reply_authors": "1225;1866;1929;722", "reply_reviewers": "1;1;1;0", "reply_authors": "2;4;5;3", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 3.25, 0.82915619758885 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 95.5, 27.225906780123964 ], "wc_strengths_avg": [ 68.75, 13.808964479641476 ], "wc_weaknesses_avg": [ 155.5, 73.26834241335067 ], "wc_questions_avg": [ 96.0, 38.47726601514198 ], "wc_review_avg": [ 415.75, 135.26340044520543 ], "wc_reply_reviewers_avg": [ 57.75, 50.61805507919087 ], "wc_reply_authors_avg": [ 1435.5, 495.54641558586616 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 3.5, 1.118033988749895 ], "replies_avg": [ 25, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 11, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5344051114832059180&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=7M0EzjugaN", "pdf": "https://openreview.net/pdf?id=7M0EzjugaN", "email": "snu.ac.kr;yonsei.ac.kr;yonsei.ac.kr", "author_num": 3, "aff_unique_index": "0;1;1", "aff_unique_norm": "Seoul National University;Yonsei University", "aff_unique_dep": ";", "aff_unique_url": "https://www.snu.ac.kr;https://www.yonsei.ac.kr", "aff_unique_abbr": "SNU;Yonsei", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "South Korea" }, { "id": "7Mq096hr9Y", "title": "OpenMixup: A Comprehensive Mixup Benchmark for Visual Classification", "track": "main", "status": "Reject", "tldr": "", "abstract": "Data mixing, or mixup, is a data-dependent augmentation technique that has greatly enhanced the generalizability of 
modern deep neural networks. However, a full grasp of mixup methodology necessitates a top-down hierarchical understanding from systematic impartial evaluations and empirical analysis, both of which are currently lacking within the community. In this paper, we present OpenMixup, the first comprehensive mixup benchmarking study for supervised visual classification. OpenMixup offers a unified mixup-based model design and training framework, encompassing a wide collection of data mixing algorithms, a diverse range of widely-used backbones and modules, and a set of model analysis toolkits. To ensure fair and complete comparisons, large-scale standard evaluations of various mixup baselines are conducted across 12 diversified image datasets with meticulous confounders tweaking powered by our modular and extensible codebase framework. Interesting observations and insights are derived through detailed empirical analysis of how mixup policies, network architectures, and dataset properties affect the mixup visual classification performance. We hope that OpenMixup can bolster the reproducibility of previously gained insights and facilitate a better understanding of mixup properties, thereby giving the community a kick-start for the development and evaluation of new mixup methods. The source code is publicly available.", "keywords": "Data Augmentation;Benchmark;Image Classification;Mixup;Supervised Learning", "primary_area": "datasets and benchmarks", "supplementary_material": "/attachment/56234f3efb471cda180f65d29300100a283c25ac.zip", "author": "Siyuan Li;Zedong Wang;Zicheng Liu;Di Wu;Cheng Tan;Weiyang Jin;Stan Z. Li", "authorids": "~Siyuan_Li6;~Zedong_Wang1;~Zicheng_Liu2;~Di_Wu10;~Cheng_Tan1;~Weiyang_Jin1;~Stan_Z._Li2", "gender": "M;M;M;M;M;M;M", "homepage": "https://lupin1998.github.io/;https://jacky1128.github.io;;;https://chengtan9907.github.io/;;https://en.westlake.edu.cn/academics/School_of_Engineering/About/Our_People/Faculty/201912/t20191206_2497.shtml", "dblp": "63/9705-2;179/8811.html;l/ZichengLiu-6;;70/1533-12.html;344/6132;l/StanZLi", "google_scholar": "https://scholar.google.com/citations?hl=zh-CN;https://scholar.google.com/citations?hl=en;https://scholar.google.com/citations?hl=zh-CN;https://scholar.google.com/citations?hl=en;6kTV6aMAAAAJ;;https://scholar.google.com/citations?hl=zh-CN", "orcid": "0000-0001-6806-2468;0009-0000-0112-0491;;;;0000-0001-5351-1400;", "linkedin": "https://www.linkedin.cn/incareer/in/siyuan-li-lupin1998/;;;;;;stan-z-li-%E6%9D%8E%E5%AD%90%E9%9D%92-55753224/", "or_profile": "~Siyuan_Li6;~Zedong_Wang1;~Zicheng_Liu2;~Di_Wu10;~Cheng_Tan1;~Weiyang_Jin1;~Stan_Z._Li1", "aff": "Alibaba Group;Westlake University;Zhejiang University;Westlake University;Zhejiang University & Westlake University;Beijing Jiaotong University;Westlake University", "aff_domain": "alibaba-inc.com;westlake.edu;zju.edu.cn;westlake.edu.cn;westlake.edu.cn;bjtu.edu.cn;westlake.edu.cn", "position": "Intern;Intern;PhD student;PhD student;PhD student;Undergrad student;Chair Professor", "bibtex": "@misc{\nli2024openmixup,\ntitle={OpenMixup: A Comprehensive Mixup Benchmark for Visual Classification},\nauthor={Siyuan Li and Zedong Wang and Zicheng Liu and Di Wu and Cheng Tan and Weiyang Jin and Stan Z. 
Li},\nyear={2024},\nurl={https://openreview.net/forum?id=7Mq096hr9Y}\n}", "github": "", "project": "", "reviewers": "nCz4;x5Ek;kQcu;rFDa", "site": "https://openreview.net/forum?id=7Mq096hr9Y", "pdf_size": 5269571, "rating": "5;5;5;6", "confidence": "4;5;5;4", "soundness": "3;2;3;3", "contribution": "2;2;2;3", "presentation": "3;3;3;3", "wc_summary": "74;43;31;65", "wc_strengths": "94;15;55;77", "wc_weaknesses": "191;94;53;155", "wc_questions": "74;1;38;101", "wc_review": "433;153;177;398", "wc_reply_reviewers": "0;0;58;0", "wc_reply_authors": "749;717;731;0", "reply_reviewers": "0;0;1;0", "reply_authors": "1;1;2;0", "rating_avg": [ 5.25, 0.4330127018922193 ], "confidence_avg": [ 4.5, 0.5 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 53.25, 17.09349291397168 ], "wc_strengths_avg": [ 60.25, 29.55820529057879 ], "wc_weaknesses_avg": [ 123.25, 53.35904328227784 ], "wc_questions_avg": [ 53.5, 37.659660115301094 ], "wc_review_avg": [ 290.25, 126.14550130702244 ], "wc_reply_reviewers_avg": [ 14.5, 25.11473670974872 ], "wc_reply_authors_avg": [ 549.25, 317.3124446031072 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.0, 0.7071067811865476 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 7, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=15958471513919602797&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 2, "aff_unique_index": "0;1;2;1;2;3;1", "aff_unique_norm": "Alibaba Group;Westlake University;Zhejiang University;Beijing Jiao Tong University", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.alibaba.com;https://www.westlake.edu.cn;https://www.zju.edu.cn;http://www.njtu.edu.cn/en", "aff_unique_abbr": "Alibaba;WU;ZJU;BJTU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0;0", "aff_country_unique": "China" }, { "id": "7NqRDbkizw", "title": "DIA: Diffusion based Inverse Network Attack on Collaborative Inference", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "With the continuous expansion of neural networks in size and depth, and the growing popularity of machine learning as a service, collaborative inference systems present a promising approach for deploying models in resource-constrained computing environments. However, as the deployment of these systems gains traction, evaluating their privacy and security has become a critical issue. Towards this goal, this paper introduces a diffusion-based inverse network attack, named DIA, for collaborative inference systems that uses a novel feature map awareness conditioning mechanism to guide the diffusion model training. Compared to prior approaches, our extensive empirical results demonstrate that the proposed attack achieves an average improvement of 29%, 20%, 30% in terms of SSIM, PSNR, and MSE when applied to convolutional neural networks (CNN), 18%, 17%, 61% to ResNet models, and 55%, 54%, 84% to Vision transformers (ViTs). Moreover, we uncover a notable vulnerability of transformer-based model ViTs and analyze the potential reasons behind this vulnerability. 
Based on our analysis, we raise caution regarding the deployment of transformer-based models in collaborative inference systems, emphasizing the need for careful consideration regarding the security of such models in collaborative settings.", "keywords": "Diffusion model;data privacy;inverse network attack;collaborative Inference", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/15ab6727a8c0b11f331756a8e7474a67055d4bfc.pdf", "author": "Dake Chen;Shiduo Li;Yuke Zhang;Souvik Kundu;Chenghao Li;Peter Anthony Beerel", "authorids": "~Dake_Chen1;~Shiduo_Li1;~Yuke_Zhang1;~Souvik_Kundu2;~Chenghao_Li2;~Peter_Anthony_Beerel1", "gender": ";M;F;M;M;M", "homepage": "https://scholar.google.com/citations?user=MwaZe-8AAAAJ&hl=en&oi=ao;https://github.com/Risto0211;;https://ksouvik52.github.io;https://howardli0816.github.io/;http://sites.usc.edu/eessc.html", "dblp": ";386/9567;;126/2210;;29/6330", "google_scholar": ";PY12lawAAAAJ;CJ5iMiwAAAAJ;https://scholar.google.com/citations?hl=en;https://scholar.google.com/citations?hl=en;JSdH7PsAAAAJ", "orcid": ";;0000-0001-5253-5478;0000-0002-3533-9405;;", "linkedin": ";shiduo-li/;;souvik-kundu-64922b50/;chenghao-li-3b0354252/;peter-beerel-b9902a1/", "or_profile": "~Dake_Chen1;~Shiduo_Li1;~Yuke_Zhang1;~Souvik_Kundu2;~Chenghao_Li2;~Peter_Anthony_Beerel1", "aff": "Meta Facebook;Tsinghua University;University of Southern California;Intel;University of Southern California;University of Southern California", "aff_domain": "meta.com;mail.tsinghua.edu.cn;usc.edu;intel.com;usc.edu;usc.edu", "position": "Researcher;Undergrad student;PhD student;Researcher;MS student;Full Professor", "bibtex": "@misc{\nchen2024dia,\ntitle={{DIA}: Diffusion based Inverse Network Attack on Collaborative Inference},\nauthor={Dake Chen and Shiduo Li and Yuke Zhang and Souvik Kundu and Chenghao Li and Peter Anthony Beerel},\nyear={2024},\nurl={https://openreview.net/forum?id=7NqRDbkizw}\n}", "github": "", "project": "", "reviewers": "wMLT;ZM8C;9V3L", "site": "https://openreview.net/forum?id=7NqRDbkizw", "pdf_size": 876877, "rating": "3;3;5", "confidence": "4;3;4", "soundness": "3;2;3", "contribution": "2;2;2", "presentation": "2;2;2", "wc_summary": "72;102;95", "wc_strengths": "34;98;66", "wc_weaknesses": "122;181;64", "wc_questions": "9;5;98", "wc_review": "237;386;323", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 3.6666666666666665, 0.9428090415820634 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.0, 0.0 ], "wc_summary_avg": [ 89.66666666666667, 12.814921857827391 ], "wc_strengths_avg": [ 66.0, 26.127890589687233 ], "wc_weaknesses_avg": [ 122.33333333333333, 47.76563153100308 ], "wc_questions_avg": [ 37.333333333333336, 42.92888175679503 ], "wc_review_avg": [ 315.3333333333333, 61.070087240444934 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 3, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.5, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=18400872964133980956&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "aff_unique_index": "0;1;2;3;2;2", "aff_unique_norm": "Meta;Tsinghua University;University of Southern California;Intel", "aff_unique_dep": "Meta 
Platforms, Inc.;;;Intel Corporation", "aff_unique_url": "https://meta.com;https://www.tsinghua.edu.cn;https://www.usc.edu;https://www.intel.com", "aff_unique_abbr": "Meta;THU;USC;Intel", "aff_campus_unique_index": "1;1;1", "aff_campus_unique": ";Los Angeles", "aff_country_unique_index": "0;1;0;0;0;0", "aff_country_unique": "United States;China" }, { "title": "Parameter-Efficient Orthogonal Finetuning via Butterfly Factorization", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19363", "id": "7NzgkEdGyr", "author_site": "Weiyang Liu, Zeju Qiu, Yao Feng, Yuliang Xiu, Yuxuan Xue, Longhui Yu, Haiwen Feng, Zhen Liu, Juyeon Heo, Songyou Peng, Yandong Wen, Michael J Black, Adrian Weller, Bernhard Schoelkopf", "tldr": "", "abstract": "Large foundation models are becoming ubiquitous, but training them from scratch is prohibitively expensive. Thus, efficiently adapting these powerful models to downstream tasks is increasingly important. In this paper, we study a principled finetuning paradigm -- Orthogonal Finetuning (OFT) -- for downstream task adaptation. Despite demonstrating good generalizability, OFT still uses a fairly large number of trainable parameters due to the high dimensionality of orthogonal matrices. To address this, we start by examining OFT from an information transmission perspective, and then identify a few key desiderata that enable better parameter-efficiency. Inspired by how the Cooley-Tukey fast Fourier transform algorithm enables efficient information transmission, we propose an efficient orthogonal parameterization using butterfly structures. We apply this parameterization to OFT, creating a novel parameter-efficient finetuning method, called Orthogonal Butterfly (BOFT). By subsuming OFT as a special case, BOFT introduces a generalized orthogonal finetuning framework. Finally, we conduct an extensive empirical study of adapting large vision transformers, large language models, and text-to-image diffusion models to various downstream tasks in computer vision and natural language. The results validate the effectiveness of BOFT as a generic finetuning method.", "keywords": "Parameter-efficient finetuning;orthogonal;Butterfly matrix", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "", "author": "Weiyang Liu;Zeju Qiu;Yao Feng;Yuliang Xiu;Yuxuan Xue;Longhui Yu;Haiwen Feng;Zhen Liu;Juyeon Heo;Songyou Peng;Yandong Wen;Michael J. 
Black;Adrian Weller;Bernhard Sch\u00f6lkopf", "authorids": "~Weiyang_Liu1;~Zeju_Qiu1;~Yao_Feng3;~Yuliang_Xiu2;~Yuxuan_Xue1;~Longhui_Yu1;~Haiwen_Feng1;~Zhen_Liu6;~Juyeon_Heo1;~Songyou_Peng1;~Yandong_Wen1;~Michael_J._Black1;~Adrian_Weller1;~Bernhard_Sch\u00f6lkopf1", "gender": "M;M;F;M;;M;M;M;F;M;M;;M;", "homepage": "http://wyliu.com/;;https://ps.is.tuebingen.mpg.de/person/yfeng;http://xiuyuliang.cn;http://yuxuan-xue.com;https://yulonghui.github.io/;https://ps.is.mpg.de/person/hfeng;;https://sites.google.com/view/juyeonheo/%ED%99%88;https://pengsongyou.github.io/;;;http://mlg.eng.cam.ac.uk/adrian/;", "dblp": "137/1532;276/4222;05/9861;215/3940;254/6994;313/9946;119/9168;77/35-19;;205/2316;153/2125;;73/8324;", "google_scholar": "DMjROf0AAAAJ;7y5RN9wAAAAJ;wNQQhSIAAAAJ;https://scholar.google.com.hk/citations?hl=zh-CN;5SKNmhcAAAAJ;https://scholar.google.com.hk/citations?user=3eHjDDgAAAAJ;g5co-iIAAAAJ;I1IiJCAAAAAJ;;eNypkO0AAAAJ;;;https://scholar.google.co.uk/citations?user=Ek4hM10AAAAJ;", "orcid": ";;0000-0002-9481-9783;0000-0003-0165-5909;;;;;;;;;;", "linkedin": ";zeju-qiu-729b8018a/;;yuliangxiu;;%E9%BE%99%E8%BE%89-%E8%99%9E-71655a154/;;;;;;;;", "or_profile": "~Weiyang_Liu1;~Zeju_Qiu1;~Yao_Feng3;~Yuliang_Xiu2;~Yuxuan_Xue1;~Longhui_Yu1;~Haiwen_Feng1;~Zhen_Liu6;~Juyeon_Heo1;~Songyou_Peng1;~Yandong_Wen1;~Michael_J._Black1;~Adrian_Weller1;~Bernhard_Sch\u00f6lkopf1", "aff": "University of Cambridge;Max-Planck-Institute for Intelligent Systems, Max-Planck Institute;ETHZ - ETH Zurich;Max Planck Institute for Intelligent Systems, Max-Planck Institute;Eberhard-Karls-Universit\u00e4t T\u00fcbingen;;Max Planck Institute for Intelligent Systems, Max-Planck Institute;University of Montreal;University of Cambridge;ETH Zurich;Max Planck Institute for Intelligent Systems, Max-Planck Institute;;University of Cambridge;", "aff_domain": "cam.ac.uk;is.mpg.de;ethz.ch;tuebingen.mpg.de;uni-tuebingen.de;;tuebingen.mpg.de;umontreal.ca;cam.ac.uk;inf.ethz.ch;tuebingen.mpg.de;;cam.ac.uk;", "position": "Researcher;Intern;PhD student;PhD student;PhD student;;PhD student;PhD student;PhD student;Senior Researcher;Postdoc;;Principal Researcher;", "bibtex": "@inproceedings{\nliu2024parameterefficient,\ntitle={Parameter-Efficient Orthogonal Finetuning via Butterfly Factorization},\nauthor={Weiyang Liu and Zeju Qiu and Yao Feng and Yuliang Xiu and Yuxuan Xue and Longhui Yu and Haiwen Feng and Zhen Liu and Juyeon Heo and Songyou Peng and Yandong Wen and Michael J. 
Black and Adrian Weller and Bernhard Sch{\\\"o}lkopf},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=7NzgkEdGyr}\n}", "github": "", "project": "", "reviewers": "CCPY;oVSz;mHgj", "pdf_size": 11453628, "rating": "5;6;8", "confidence": "3;4;3", "soundness": "3;3;3", "contribution": "3;3;2", "presentation": "4;3;4", "wc_summary": "65;34;249", "wc_strengths": "45;35;129", "wc_weaknesses": "121;108;238", "wc_questions": "2;18;191", "wc_review": "233;195;807", "wc_reply_reviewers": "0;77;73", "wc_reply_authors": "1935;2983;3351", "reply_reviewers": "0;2;1", "reply_authors": "3;6;6", "rating_avg": [ 6.333333333333333, 1.247219128924647 ], "confidence_avg": [ 3.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 3.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 116.0, 94.89292211048549 ], "wc_strengths_avg": [ 69.66666666666667, 42.153159892099296 ], "wc_weaknesses_avg": [ 155.66666666666666, 58.459862774005515 ], "wc_questions_avg": [ 70.33333333333333, 85.57387971156203 ], "wc_review_avg": [ 411.6666666666667, 279.973014572635 ], "wc_reply_reviewers_avg": [ 50.0, 35.393031329156685 ], "wc_reply_authors_avg": [ 2756.3333333333335, 599.8873968411813 ], "reply_reviewers_avg": [ 1.0, 0.816496580927726 ], "reply_authors_avg": [ 5.0, 1.4142135623730951 ], "replies_avg": [ 26, 0 ], "authors#_avg": [ 14, 0 ], "corr_rating_confidence": -0.18898223650461363, "gs_citation": 57, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5299967292332698973&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=7NzgkEdGyr", "pdf": "https://openreview.net/pdf?id=7NzgkEdGyr", "email": "cam.ac.uk;is.mpg.de;ethz.ch;tuebingen.mpg.de;uni-tuebingen.de;;tuebingen.mpg.de;umontreal.ca;cam.ac.uk;inf.ethz.ch;tuebingen.mpg.de;;cam.ac.uk;", "author_num": 14, "aff_unique_index": "0;1;2;3;4;3;5;0;2;3;0", "aff_unique_norm": "University of Cambridge;Max-Planck-Institute for Intelligent Systems;ETH Zurich;Max Planck Institute for Intelligent Systems;Eberhard Karls University of T\u00fcbingen;University of Montreal", "aff_unique_dep": ";Intelligent Systems;;Intelligent Systems;;", "aff_unique_url": "https://www.cam.ac.uk;https://www.mpi-is.mpg.de;https://www.ethz.ch;https://www.mpi-is.mpg.de;https://www.uni-tuebingen.de/;https://wwwumontreal.ca", "aff_unique_abbr": "Cambridge;MPI-IS;ETHZ;MPI-IS;Uni T\u00fcbingen;UM", "aff_campus_unique_index": "0;2;0;0", "aff_campus_unique": "Cambridge;;T\u00fcbingen", "aff_country_unique_index": "0;1;2;1;1;1;3;0;2;1;0", "aff_country_unique": "United Kingdom;Germany;Switzerland;Canada" }, { "id": "7OO8tTOgh4", "title": "Non-targeted Adversarial Attacks on Vision-Language Models via Maximizing Information Entropy", "track": "main", "status": "Reject", "tldr": "", "abstract": "Adversarial examples pose significant security concerns in deep neural networks and play a crucial role in assessing the robustness of models. Nevertheless, existing research has primarily focused on classification tasks, while the evaluation of adversarial examples is urgently needed for more complex tasks. In this paper, we investigate the adversarial robustness of large vision-language models (VLMs). 
We propose a non-targeted white-box attack method that maximizes information entropy (MIE) to induce the victim model to generate misleading image descriptions deviating from reality. Our method is thoroughly analyzed experimentally, with validation conducted on the ImageNet dataset. The comprehensive and quantifiable experimental results demonstrate a significant success rate achieved by our method in adversarial attacks. Given the consistent architecture of the language decoder, our proposed method can serve as a benchmark for evaluating the robustness of diverse vision-language models.", "keywords": "Adversarial Attacks;Vision-Language Models;Trustworthy AI", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "Chaohu Liu;Yubo Wang;Haoyu Cao;Bing Liu;Deqiang Jiang;Linli Xu", "authorids": "~Chaohu_Liu1;~Yubo_Wang8;~Haoyu_Cao1;~Bing_Liu6;~Deqiang_Jiang1;~Linli_Xu1", "gender": "M;M;M;;M;", "homepage": "https://github.com/liuchaohu;https://github.com/LingoAmber;;;;", "dblp": "356/2510;;334/3895.html;;259/2591.html;", "google_scholar": ";https://scholar.google.com/citations?hl=en;LV8ejn8AAAAJ;;v4AK2MQAAAAJ;", "orcid": ";;0000-0002-3789-9705;0000-0001-5324-4816;;", "linkedin": ";;;;;", "or_profile": "~Chaohu_Liu1;~Yubo_Wang8;~Haoyu_Cao1;~Bing_Liu6;~Deqiang_Jiang1;~Linli_Xu1", "aff": "University of Science and Technology of China;Tencent Youtu Lab;University of Science and Technology of China;Tencent YouTu Lab;Tencent YouTu Lab;", "aff_domain": "ustc.edu.cn;tencent.com;ustc.edu.cn;tencent.com;tencent.com;", "position": "PhD student;Intern;PhD student;Researcher;Researcher;", "bibtex": "@misc{\nliu2024nontargeted,\ntitle={Non-targeted Adversarial Attacks on Vision-Language Models via Maximizing Information Entropy},\nauthor={Chaohu Liu and Yubo Wang and Haoyu Cao and Bing Liu and Deqiang Jiang and Linli Xu},\nyear={2024},\nurl={https://openreview.net/forum?id=7OO8tTOgh4}\n}", "github": "", "project": "", "reviewers": "fBK2;CGXF;r3mc;qFBU", "site": "https://openreview.net/forum?id=7OO8tTOgh4", "pdf_size": 8884908, "rating": "5;5;5;6", "confidence": "4;4;5;3", "soundness": "2;2;2;3", "contribution": "2;1;2;2", "presentation": "4;3;2;3", "wc_summary": "66;17;256;43", "wc_strengths": "95;11;110;19", "wc_weaknesses": "141;152;156;151", "wc_questions": "45;3;164;27", "wc_review": "347;183;686;240", "wc_reply_reviewers": "0;0;0;55", "wc_reply_authors": "1395;866;963;867", "reply_reviewers": "0;0;0;1", "reply_authors": "3;2;3;2", "rating_avg": [ 5.25, 0.4330127018922193 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 95.5, 94.27221223669252 ], "wc_strengths_avg": [ 58.75, 44.16092730004659 ], "wc_weaknesses_avg": [ 150.0, 5.522680508593631 ], "wc_questions_avg": [ 59.75, 62.005544106958695 ], "wc_review_avg": [ 364.0, 195.0064101510512 ], "wc_reply_reviewers_avg": [ 13.75, 23.81569860407206 ], "wc_reply_authors_avg": [ 1022.75, 218.4998569793582 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 2.5, 0.5 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.816496580927726, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:ddHHjzArvYkJ:scholar.google.com/&scioq=Non-targeted+Adversarial+Attacks+on+Vision-Language+Models+via+Maximizing+Information+Entropy&hl=en&as_sdt=0,33", 
"gs_version_total": 0, "aff_unique_index": "0;1;0;1;1", "aff_unique_norm": "University of Science and Technology of China;Tencent", "aff_unique_dep": ";Youtu Lab", "aff_unique_url": "http://www.ustc.edu.cn;https://www.tencent.com", "aff_unique_abbr": "USTC;Tencent", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "China" }, { "title": "Data-independent Module-aware Pruning for Hierarchical Vision Transformers", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19362", "id": "7Ol6foUi1G", "author_site": "Yang He, Joey Tianyi Zhou", "tldr": "", "abstract": "Hierarchical vision transformers (ViTs) have two advantages over conventional ViTs. First, hierarchical ViTs achieve linear computational complexity with respect to image size by local self-attention. Second, hierarchical ViTs create hierarchical feature maps by merging image patches in deeper layers for dense prediction. However, existing pruning methods ignore the unique properties of hierarchical ViTs and use the magnitude value as the weight importance. This approach leads to two main drawbacks. First, the \"local\" attention weights are compared at a \"global\" level, which may cause some \"locally\" important weights to be pruned due to their relatively small magnitude \"globally\". The second issue with magnitude pruning is that it fails to consider the distinct weight distributions of the network, which are essential for extracting coarse to fine-grained features at various hierarchical levels. \n\nTo solve the aforementioned issues, we have developed a Data-independent Module-Aware Pruning method (DIMAP) to compress hierarchical ViTs. To ensure that \"local\" attention weights at different hierarchical levels are compared fairly in terms of their contribution, we treat them as a **module** and examine their contribution by analyzing their information distortion. Furthermore, we introduce a novel weight metric that is solely based on weights and does not require input images, thereby eliminating the **dependence** on the patch merging process. Our method validates its usefulness and strengths on Swin Transformers of different sizes on ImageNet-1k classification. Notably, the top-5 accuracy drop is only 0.07% when we remove 52.5% FLOPs and 52.7% parameters of Swin-B. When we reduce 33.2% FLOPs and 33.2% parameters of Swin-S, we can even achieve a 0.8% higher relative top-5 accuracy than the original model. 
Code is available at: [https://github.com/he-y/Data-independent-Module-Aware-Pruning](https://github.com/he-y/Data-independent-Module-Aware-Pruning).", "keywords": "Filter Pruning; Model Compression; Vision Transformer", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/d13a5c5260bac7b5449a8f8460f25889e71c9944.pdf", "author": "Yang He;Joey Tianyi Zhou", "authorids": "~Yang_He2;~Joey_Tianyi_Zhou1", "gender": "M;M", "homepage": "https://joeyzhouty.github.io/;https://he-y.github.io/", "dblp": "123/5110;06/1998-2", "google_scholar": "https://scholar.google.com.sg/citations?user=cYNqDokAAAAJ;vvnFsIIAAAAJ", "orcid": "0000-0002-4675-7055;0000-0002-2257-6073", "linkedin": ";", "or_profile": "~Joey_Tianyi_Zhou1;~yang_he1", "aff": "A*STAR Centre for Frontier AI Research;Institute of High Performance Computing, Singapore, A*STAR", "aff_domain": "cfar.a-star.edu.sg;ihpc.a-star.edu.sg", "position": "Principal Researcher;Researcher", "bibtex": "@inproceedings{\nhe2024dataindependent,\ntitle={Data-independent Module-aware Pruning for Hierarchical Vision Transformers},\nauthor={Yang He and Joey Tianyi Zhou},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=7Ol6foUi1G}\n}", "github": "", "project": "", "reviewers": "uDum;qfKu;VGj7", "pdf_size": 3078423, "rating": "6;6;8", "confidence": "5;4;4", "soundness": "3;3;4", "contribution": "4;3;4", "presentation": "3;4;3", "wc_summary": "79;102;73", "wc_strengths": "73;60;140", "wc_weaknesses": "111;24;53", "wc_questions": "2;24;9", "wc_review": "265;210;275", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "795;473;275", "reply_reviewers": "0;0;0", "reply_authors": "2;1;1", "rating_avg": [ 6.666666666666667, 0.9428090415820634 ], "confidence_avg": [ 4.333333333333333, 0.4714045207910317 ], "soundness_avg": [ 3.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 3.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 3.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 84.66666666666667, 12.498888839501783 ], "wc_strengths_avg": [ 91.0, 35.05234181430203 ], "wc_weaknesses_avg": [ 62.666666666666664, 36.16935473881477 ], "wc_questions_avg": [ 11.666666666666666, 9.177266598624136 ], "wc_review_avg": [ 250.0, 28.577380332470412 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 514.3333333333334, 214.29159780282774 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.3333333333333333, 0.4714045207910317 ], "replies_avg": [ 9, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.4999999999999999, "gs_citation": 4, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=3223724432329131&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=7Ol6foUi1G", "pdf": "https://openreview.net/pdf?id=7Ol6foUi1G", "email": "cfar.a-star.edu.sg;ihpc.a-star.edu.sg", "author_num": 2, "aff_unique_index": "0;1", "aff_unique_norm": "A*STAR;Institute of High Performance Computing", "aff_unique_dep": "Centre for Frontier AI Research;", "aff_unique_url": "https://www.a-star.edu.sg;https://www.ihpc.a-star.edu.sg", "aff_unique_abbr": "A*STAR;IHPC", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "Singapore" }, { "id": "7OwML7fwl8", "title": "Fairness without Sensitive attributes via Noise and Uncertain Predictions", "track": "main", "status": "Reject", "tldr": "", "abstract": 
"While model fairness improvement has been explored previously, existing methods invariably rely on adjusting explicit sensitive attribute values in order to improve model fairness in downstream tasks. However, we observe the trend of sensitive demographic information being inaccessible as public concerns around data privacy grow. In this paper, we propose a confidence-based hierarchical structure of variational autoencoder (VAE) architectures called ``Reckoner\" for reliable fairness learning under the assumption of missing sensitive attributes. First, we present the results of exploratory data analyses conducted on the widely-used COMPAS dataset. We observed significant disparities in model fairness across different levels of confidence. Inspired by these findings, we devised a dual-model system in which the model initialised with a high-confidence data subset learns from the model initialised with a low-confidence data subset, enabling it to avoid biased predictions. To maintain predictiveness, we also introduced learnable noise into the dataset, forcing the data to retain only the most essential information for predictions. Our experimental results show that Reckoner consistently outperforms state-of-the-art baselines on both the COMPAS and the New Adult datasets in terms of both accuracy and fairness metrics.", "keywords": "Fairness;Fairness without Sensitive Attributes;Fairness without Demographics", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/1dfd360e7216c3fbf025619bae5b640ec25bb184.zip", "author": "Hongliang Ni;LEI HAN;Tong Chen;Shazia Wasim Sadiq;Gianluca Demartini", "authorids": "~Hongliang_Ni1;~LEI_HAN7;~Tong_Chen8;~Shazia_Wasim_Sadiq1;~Gianluca_Demartini1", "gender": "F;;M;;F", "homepage": ";;https://itee.uq.edu.au/profile/1253/rocky-chen;http://gianlucademartini.net;https://about.uq.edu.au/experts/792", "dblp": ";75/2307-3.html;22/1512-5;05/3422;s/SWSadiq", "google_scholar": ";https://scholar.google.com.au/citations?user=Oibami4AAAAJ;07cqSMsAAAAJ;https://scholar.google.co.uk/citations?user=PCAiILsAAAAJ;https://scholar.google.com/citations?hl=en", "orcid": ";0000-0002-7777-3592;0000-0001-7269-146X;0000-0002-7311-3693;0000-0001-6739-4145", "linkedin": "hongliang-ni-1931181b0/;;;gianlucademartini/;shazia-sadiq-4920651/?originalSubdomain=au", "or_profile": "~Hongliang_Ni1;~LEI_HAN7;~Tong_Chen8;~Gianluca_Demartini1;~Shazia_Sadiq1", "aff": "University of Queensland;;The University of Queensland;University of Queensland;The University of Queensland", "aff_domain": "uq.edu.au;;uq.edu.au;uq.edu.au;uq.edu.au", "position": "PhD student;;Assistant Professor;Associate Professor;Full Professor", "bibtex": "@misc{\nni2024fairness,\ntitle={Fairness without Sensitive attributes via Noise and Uncertain Predictions},\nauthor={Hongliang Ni and LEI HAN and Tong Chen and Shazia Wasim Sadiq and Gianluca Demartini},\nyear={2024},\nurl={https://openreview.net/forum?id=7OwML7fwl8}\n}", "github": "", "project": "", "reviewers": "4bz2;zU7R;KsYL", "site": "https://openreview.net/forum?id=7OwML7fwl8", "pdf_size": 414002, "rating": "3;5;5", "confidence": "3;5;4", "soundness": "2;2;1", "contribution": "2;3;2", "presentation": "1;3;3", "wc_summary": "67;93;110", "wc_strengths": "20;48;20", "wc_weaknesses": "236;63;226", "wc_questions": "2;474;4", "wc_review": "325;678;360", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "602;1385;646", "reply_reviewers": "0;0;0", "reply_authors": "1;2;1", "rating_avg": [ 4.333333333333333, 
0.9428090415820634 ], "confidence_avg": [ 4.0, 0.816496580927726 ], "soundness_avg": [ 1.6666666666666667, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.3333333333333335, 0.9428090415820634 ], "wc_summary_avg": [ 90.0, 17.682382946499793 ], "wc_strengths_avg": [ 29.333333333333332, 13.199326582148888 ], "wc_weaknesses_avg": [ 175.0, 79.30111390558564 ], "wc_questions_avg": [ 160.0, 222.03303057578316 ], "wc_review_avg": [ 454.3333333333333, 158.80036383949363 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 877.6666666666666, 359.18828241219427 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.3333333333333333, 0.4714045207910317 ], "replies_avg": [ 9, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.8660254037844385, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:y1RoM6O9alsJ:scholar.google.com/&scioq=Fairness+without+Sensitive+attributes+via+Noise+and+Uncertain+Predictions&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "University of Queensland", "aff_unique_dep": "", "aff_unique_url": "https://www.uq.edu.au", "aff_unique_abbr": "UQ", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "Australia" }, { "id": "7Phicg0WAg", "title": "FlexCap: Generating Rich, Localized, and Flexible Captions in Images", "track": "main", "status": "Reject", "tldr": "", "abstract": "We introduce FlexCap, a module that generates localized descriptions for any region in a given image. We use the idea of length conditioning to ensure the output captions have the desired length. This allows for controllable generation of the full spectrum of localized captions, ranging from short object names to full sentence descriptions. To train this model, we create a dataset of image-box-caption triplets from web-scale text-image pairs using open-vocabulary object detection models. We show that FlexCap can connect images with LLMs by representing images as a sequence of region descriptions and their spatial extents. Using this interpretable textual representation, we exceed the state-of-the-art zero-shot performance on many visual question answering tasks. We also show that FlexCap can be fine-tuned to achieve strong performance on the dense captioning task on the Visual Genome dataset. 
Finally, we demonstrate qualitatively how FlexCap can be used for image labeling, object attribute recognition, and visual dialog.", "keywords": "visual-language model;object detection;image captioning;visual question answering", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/1f64b8fab7ab2a25b9102d70b7f295273fc93497.zip", "author": "Debidatta Dwibedi;Vidhi Jain;Jonathan Tompson;Andrew Zisserman;Yusuf Aytar", "authorids": "~Debidatta_Dwibedi1;~Vidhi_Jain2;~Jonathan_Tompson1;~Andrew_Zisserman1;~Yusuf_Aytar1", "gender": "M;F;M;;M", "homepage": "https://debidatta.github.io/;http://vidhijain.github.io;http://jonathantompson.com;;", "dblp": "160/3739;199/2574;139/0769;;41/5577", "google_scholar": "EPfOJwQAAAAJ;;U_Jw8DUAAAAJ;;0ncQNL8AAAAJ", "orcid": ";;;;", "linkedin": ";vidhijain96/;;;", "or_profile": "~Debidatta_Dwibedi1;~Vidhi_Jain2;~Jonathan_Tompson1;~Andrew_Zisserman1;~Yusuf_Aytar1", "aff": "Google;Google;Google DeepMind;;Google DeepMind", "aff_domain": "google.com;google.com;google.com;;google.com", "position": "Google;Student Researcher;Researcher;;Research Scientist", "bibtex": "@misc{\ndwibedi2024flexcap,\ntitle={FlexCap: Generating Rich, Localized, and Flexible Captions in Images},\nauthor={Debidatta Dwibedi and Vidhi Jain and Jonathan Tompson and Andrew Zisserman and Yusuf Aytar},\nyear={2024},\nurl={https://openreview.net/forum?id=7Phicg0WAg}\n}", "github": "", "project": "", "reviewers": "sAQH;N2tn;1skp", "site": "https://openreview.net/forum?id=7Phicg0WAg", "pdf_size": 4647987, "rating": "5;5;5", "confidence": "5;3;4", "soundness": "4;3;2", "contribution": "3;2;2", "presentation": "4;3;3", "wc_summary": "85;46;47", "wc_strengths": "70;40;49", "wc_weaknesses": "68;111;151", "wc_questions": "29;95;14", "wc_review": "252;292;261", "wc_reply_reviewers": "0;50;21", "wc_reply_authors": "655;1086;997", "reply_reviewers": "0;1;1", "reply_authors": "1;2;3", "rating_avg": [ 5.0, 0.0 ], "confidence_avg": [ 4.0, 0.816496580927726 ], "soundness_avg": [ 3.0, 0.816496580927726 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 3.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 59.333333333333336, 18.153665072253467 ], "wc_strengths_avg": [ 53.0, 12.569805089976535 ], "wc_weaknesses_avg": [ 110.0, 33.891985286593446 ], "wc_questions_avg": [ 46.0, 35.185224171518364 ], "wc_review_avg": [ 268.3333333333333, 17.13346303452853 ], "wc_reply_reviewers_avg": [ 23.666666666666668, 20.499322482029065 ], "wc_reply_authors_avg": [ 912.6666666666666, 185.78541983218764 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 2.0, 0.816496580927726 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:IQx0IzgsA6sJ:scholar.google.com/&scioq=FlexCap:+Generating+Rich,+Localized,+and+Flexible+Captions+in+Images&hl=en&as_sdt=0,5", "gs_version_total": 2, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "Google", "aff_unique_dep": "Google", "aff_unique_url": "https://www.google.com", "aff_unique_abbr": "Google", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Mountain View;", "aff_country_unique_index": "0;0;1;1", "aff_country_unique": "United States;United Kingdom" }, { "id": "7Pzu7VjSwy", "title": "Diving into Class-Incremental Learning from Better Balancing Old and New knowledge", "track": "main", "status": 
"Withdraw", "tldr": "", "abstract": "Class-Incremental Learning (Class-IL) aims to continuously learn new knowledge without forgetting old knowledge from a given data stream using deep neural networks. Recent Class-IL methods strive to balance old and new knowledge and have achieved excellent results in mitigating the forgetting by mainly employing the rehearsal-based strategy. However, the representation learning on new tasks is often impaired since the trade-off is hard to taken between old and new knowledge. To overcome this challenge, based on the Complementary Learning System (CLS) theory, we propose a novel CLS-based method by focusing on the representation of old and new knowledge in Class-IL, which can acquire more new knowledge from new tasks while consolidating the old knowledge so as to make a better balance between them. Specifically, our proposed method has two novel components: (1) To effectively mitigate the forgetting, we first propose a bidirectional transport (BDT) strategy between old and new models, which can better integrate the old knowledge into the new knowledge and meanwhile enforce the old knowledge to be better consolidated by bidirectionally transferring parameters across old and new models. (2) To ensure that the representation of new knowledge is not impaired by the old knowledge, we further devise a selective momentum (SMT) mechanism to give parameters greater flexibility to learn new knowledge while transferring important old knowledge, which is achieved by selectively (momentum) updating network parameters through parameter importance evaluation. Extensive experiments on four benchmarks show that our proposed method significantly outperforms the state-of-the-arts under the Class-IL setting.", "keywords": "class incremental learning;catastrophic forgetting;complementary learning system;knowledge representation", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "", "author": "Feifei Fu;Yizhao Gao;Shiqi Zhao;Haoran Wu;Zhiwu Lu", "authorids": "~Feifei_Fu1;~Yizhao_Gao1;~Shiqi_Zhao3;~Haoran_Wu6;~Zhiwu_Lu1", "gender": "M;M;M;M;F", "homepage": ";;;https://gsai.ruc.edu.cn/luzhiwu;", "dblp": "132/7629;;;53/5234;https://dblp.org/rec/journals/iet-ipr/Fu0TL21", "google_scholar": "https://scholar.google.com/citations?hl=en;;;OUXS8doAAAAJ;", "orcid": ";0009-0006-2508-7108;;;0009-0000-9957-5231", "linkedin": ";;https://www.linkedin.cn/incareer/in/%E6%B5%A9%E7%84%B6-%E5%90%B4-b807a0164;;https://www.linkedin.cn/injobs/in/%E8%8F%B2%E8%8F%B2-%E4%BB%98-a20230234", "or_profile": "~Yizhao_Gao1;~Shiqi_Zhao3;~Haoran_Wu6;~Zhiwu_Lu1;~FU_Feifei1", "aff": "Renmin University of China;China Unicom Research Institute;China Unicom Research Institute ;Renmin University of China;Renmin University of China", "aff_domain": "ruc.edu.cn;chinaunicom.cn;chinaunicom.cn;ruc.edu.cn;ruc.edu.cn", "position": "PhD student;Researcher;Researcher;Full Professor;PhD student", "bibtex": "@misc{\nfu2024diving,\ntitle={Diving into Class-Incremental Learning from Better Balancing Old and New knowledge},\nauthor={Feifei Fu and Yizhao Gao and Shiqi Zhao and Haoran Wu and Zhiwu Lu},\nyear={2024},\nurl={https://openreview.net/forum?id=7Pzu7VjSwy}\n}", "github": "", "project": "", "reviewers": "nG1u;W1qo;T7Kt;UGyp", "site": "https://openreview.net/forum?id=7Pzu7VjSwy", "pdf_size": 3936805, "rating": "3;3;3;6", "confidence": "5;4;4;4", "soundness": "3;3;2;3", "contribution": "1;1;2;2", "presentation": "2;2;3;2", "wc_summary": "76;50;51;117", "wc_strengths": 
"32;26;63;83", "wc_weaknesses": "321;109;316;208", "wc_questions": "32;26;66;2", "wc_review": "461;211;496;410", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 3.75, 1.299038105676658 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 1.5, 0.5 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 73.5, 27.189152248645048 ], "wc_strengths_avg": [ 51.0, 23.205602771744587 ], "wc_weaknesses_avg": [ 238.5, 87.33985344617885 ], "wc_questions_avg": [ 31.5, 22.863726730347352 ], "wc_review_avg": [ 394.5, 110.26898929436145 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.3333333333333333, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:B_17qcodV_sJ:scholar.google.com/&scioq=Diving+into+Class-Incremental+Learning+from+Better+Balancing+Old+and+New+knowledge&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;1;1;0;0", "aff_unique_norm": "Renmin University of China;China Unicom Research Institute", "aff_unique_dep": ";", "aff_unique_url": "http://www.ruc.edu.cn;https://www.chinaunicom.com.cn/en-US/ResearchInstitute", "aff_unique_abbr": "RUC;", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "China" }, { "title": "Adversarial Adaptive Sampling: Unify PINN and Optimal Transport for the Approximation of PDEs", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19361", "id": "7QI7tVrh2c", "author_site": "Kejun Tang, Jiayu Zhai, Xiaoliang Wan, Chao Yang", "tldr": "", "abstract": "Solving partial differential equations (PDEs) is a central task in scientific computing. Recently, neural network approximation of PDEs has received increasing attention due to its flexible meshless discretization and its potential for high-dimensional problems. One fundamental numerical difficulty is that random samples in the training set introduce statistical errors into the discretization of the loss functional which may become the dominant error in the final approximation, and therefore overshadow the modeling capability of the neural network. In this work, we propose a new minmax formulation to optimize simultaneously the approximate solution, given by a neural network model, and the random samples in the training set, provided by a deep generative model. The key idea is to use a deep generative model to adjust the random samples in the training set such that the residual induced by the neural network model can maintain a smooth profile in the training process. Such an idea is achieved by implicitly embedding the Wasserstein distance between the residual-induced distribution and the uniform distribution into the loss, which is then minimized together with the residual. A nearly uniform residual profile means that its variance is small for any normalized weight function such that the Monte Carlo approximation error of the loss functional is reduced significantly for a certain sample size. 
The adversarial adaptive sampling (AAS) approach proposed in this work is the first attempt to formulate two essential components, minimizing the residual and seeking the optimal training set, into one minmax objective functional for the neural network approximation of PDEs.", "keywords": "adversarial adaptive sampling;optimal transport;neural network approximation of PDEs", "primary_area": "probabilistic methods (Bayesian methods, variational inference, sampling, UQ, etc.)", "supplementary_material": "/attachment/1a0842aff32043ada3484a12665005e0edb4749a.pdf", "author": "Kejun Tang;Jiayu Zhai;Xiaoliang Wan;Chao Yang", "authorids": "~Kejun_Tang1;~Jiayu_Zhai1;~Xiaoliang_Wan1;~Chao_Yang8", "gender": ";M;;M", "homepage": ";https://ims.shanghaitech.edu.cn/2022/0913/c4741a835499/page.htm;http://www.math.lsu.edu/~xlwan;", "dblp": ";206/7523;11/3027;", "google_scholar": ";gcu1p1UAAAAJ;j0uRgOYAAAAJ;JvVLHaEAAAAJ", "orcid": ";0000-0002-7376-6205;;", "linkedin": ";;;", "or_profile": "~Kejun_Tang1;~Jiayu_Zhai1;~Xiaoliang_Wan1;~Chao_Yang8", "aff": ";ShanghaiTech University;Louisiana State University;Peking University", "aff_domain": ";shanghaitech.edu.cn;lsu.edu;pku.edu.cn", "position": ";Assistant Professor;Full Professor;Full Professor", "bibtex": "@inproceedings{\ntang2024adversarial,\ntitle={Adversarial Adaptive Sampling: Unify {PINN} and Optimal Transport for the Approximation of {PDE}s},\nauthor={Kejun Tang and Jiayu Zhai and Xiaoliang Wan and Chao Yang},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=7QI7tVrh2c}\n}", "github": "", "project": "", "reviewers": "YsSo;ZtMG;CyTK;3BKL", "pdf_size": 2677007, "rating": "5;6;8;10", "confidence": "4;3;4;5", "soundness": "2;2;3;4", "contribution": "2;3;4;4", "presentation": "1;2;4;4", "wc_summary": "136;198;159;118", "wc_strengths": "32;80;22;27", "wc_weaknesses": "390;352;38;106", "wc_questions": "39;11;19;75", "wc_review": "597;641;238;326", "wc_reply_reviewers": "271;28;0;136", "wc_reply_authors": "1532;1074;175;337", "reply_reviewers": "1;1;0;1", "reply_authors": "3;3;1;2", "rating_avg": [ 7.25, 1.920286436967152 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.75, 0.82915619758885 ], "contribution_avg": [ 3.25, 0.82915619758885 ], "presentation_avg": [ 2.75, 1.299038105676658 ], "wc_summary_avg": [ 152.75, 29.894606536965828 ], "wc_strengths_avg": [ 40.25, 23.220411279734044 ], "wc_weaknesses_avg": [ 221.5, 152.01562419698837 ], "wc_questions_avg": [ 36.0, 24.71841418861655 ], "wc_review_avg": [ 450.5, 172.05304414627486 ], "wc_reply_reviewers_avg": [ 108.75, 106.55368365288926 ], "wc_reply_authors_avg": [ 779.5, 550.9566679876013 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 2.25, 0.82915619758885 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.7364596943186587, "gs_citation": 15, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5022401845944297732&as_sdt=5,47&sciodt=0,47&hl=en", "gs_version_total": 7, "openreview": "https://openreview.net/forum?id=7QI7tVrh2c", "pdf": "https://openreview.net/pdf?id=7QI7tVrh2c", "email": ";shanghaitech.edu.cn;lsu.edu;pku.edu.cn", "author_num": 4, "aff_unique_index": "0;1;2", "aff_unique_norm": "ShanghaiTech University;Louisiana State University;Peking University", "aff_unique_dep": ";;", "aff_unique_url": "https://www.shanghaitech.edu.cn;https://www.lsu.edu;http://www.pku.edu.cn", "aff_unique_abbr": "ShanghaiTech;LSU;Peking U", 
"aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;0", "aff_country_unique": "China;United States" }, { "id": "7QUwypJ8Vq", "title": "Taming Self-Training for Open-Vocabulary Object Detection", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Recent studies have shown promising performance in open-vocabulary object detection (OVD) by utilizing pseudo labels (PLs) from pretrained vision and language models (VLMs). However, teacher-student self-training, a powerful and widely used paradigm to leverage PLs, is rarely explored for OVD. This work identifies two challenges of using self-training in OVD: noisy PLs from VLMs and frequent distribution changes of PLs. To address these challenges, we propose SAS-Det that tames self-training for OVD in two key aspects. First, we present a split-and-fusion (SAF) head that splits a standard detection into an open-branch and a closed-branch. This design can prevent noisy boxes of PLs from supervision. Moreover, the two branches learn complementary knowledge from different training data, significantly enhancing performance when fused together. Second, in our view, unlike in closed-set tasks, the PL's distributions in OVD are solely determined by the teacher model. Consequently, we introduce a periodic update strategy to decrease the number of updates to the teacher, thereby decreasing the frequency of changes in PL distributions. Extensive experiments demonstrate SAS-Det is both efficient and effective. Our pseudo labeling is three times faster than prior methods. SAS-Det outperforms prior state-of-the-art models of the same scale by a clear margin and achieves 37.4 AP50 and 29.1 APr on novel categories of the COCO and LVIS benchmarks, respectively.", "keywords": "Open-vocabulary object detection;pseudo labels;vision and language pretraining", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Shiyu Zhao;Samuel Schulter;Long Zhao;Zhixing Zhang;Vijay Kumar b g;Yumin Suh;Manmohan Chandraker;Dimitris N. Metaxas", "authorids": "~Shiyu_Zhao1;~Samuel_Schulter1;~Long_Zhao2;~Zhixing_Zhang1;~Vijay_Kumar_b_g1;~Yumin_Suh1;~Manmohan_Chandraker3;~Dimitris_N._Metaxas1", "gender": "M;;M;M;;;;", "homepage": "https://xiaofeng94.github.io/;https://samschulter.github.io;http://garyzhao.github.io/;https://zhang-zx.github.io/;;https://yuminsuh.github.io/;;", "dblp": ";27/9990;31/5383-3;;;119/1522;;", "google_scholar": "https://scholar.google.com.sg/citations?hl=en;VQ6dsFEAAAAJ;YTyBTmgAAAAJ;RhM5qHoAAAAJ;;a9k4nwQAAAAJ;;", "orcid": "0000-0002-4978-725X;;0000-0001-8921-8564;;;;;", "linkedin": "shiyu-zhao-8ba8ab301/;;garyzhao9012/;zhixing-zhang-174959198/;;;;", "or_profile": "~Shiyu_Zhao1;~Samuel_Schulter1;~Long_Zhao2;~Zhixing_Zhang1;~Vijay_Kumar_b_g1;~Yumin_Suh1;~Manmohan_Chandraker3;~Dimitris_N._Metaxas1", "aff": "Meta;NEC-Labs;Google DeepMind;Snap Inc.;;NEC-Labs;;", "aff_domain": "meta.com;nec-labs.com;google.com;snapchat.com;;nec-labs.com;;", "position": "Intern;Researcher;Research scientist;Intern;;Researcher;;", "bibtex": "@misc{\nzhao2024taming,\ntitle={Taming Self-Training for Open-Vocabulary Object Detection},\nauthor={Shiyu Zhao and Samuel Schulter and Long Zhao and Zhixing Zhang and Vijay Kumar b g and Yumin Suh and Manmohan Chandraker and Dimitris N. 
Metaxas},\nyear={2024},\nurl={https://openreview.net/forum?id=7QUwypJ8Vq}\n}", "github": "", "project": "", "reviewers": "wquL;NEiz;vFm8;rX3B", "site": "https://openreview.net/forum?id=7QUwypJ8Vq", "pdf_size": 11147330, "rating": "3;5;5;6", "confidence": "4;5;4;3", "soundness": "1;2;3;2", "contribution": "1;3;3;2", "presentation": "1;3;3;3", "wc_summary": "71;44;74;119", "wc_strengths": "31;41;17;45", "wc_weaknesses": "280;150;166;93", "wc_questions": "4;18;14;2", "wc_review": "386;253;271;259", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.75, 1.0897247358851685 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.0, 0.7071067811865476 ], "contribution_avg": [ 2.25, 0.82915619758885 ], "presentation_avg": [ 2.5, 0.8660254037844386 ], "wc_summary_avg": [ 77.0, 26.91653766738954 ], "wc_strengths_avg": [ 33.5, 10.805091392487155 ], "wc_weaknesses_avg": [ 172.25, 67.86889935751131 ], "wc_questions_avg": [ 9.5, 6.689544080129826 ], "wc_review_avg": [ 292.25, 54.51318647813573 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": -0.3244428422615251, "gs_citation": 11, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=16942470371922372045&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 8, "aff_unique_index": "0;1;2;3;1", "aff_unique_norm": "Meta;NEC Laboratories;Google;Snap Inc.", "aff_unique_dep": "Meta Platforms, Inc.;;Google DeepMind;", "aff_unique_url": "https://meta.com;https://www.nec-labs.com;https://deepmind.com;https://www.snapinc.com", "aff_unique_abbr": "Meta;NEC-Labs;DeepMind;Snap", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;1;0;0", "aff_country_unique": "United States;United Kingdom" }, { "id": "7QlKLvfVge", "title": "Directional Rank Reduction for Backdoor Defense", "track": "main", "status": "Reject", "tldr": "", "abstract": "Recent studies have indicated the effectiveness of neuron pruning for backdoor defense. In this work, we explore the limitations of pruning-based defense through theoretical and empirical investigations. We argue that pruning-based defense necessitates the removal of neurons that affect normal performance when the effect of backdoor is entangled across normal neurons. To address this challenge, we propose an extended neuron pruning framework, named \\emph{Directional Rank Reduction (\\method)}. \\method consists of three procedures: orthogonal transformation, pruning, and inverse transformation. Through the transformation of the feature space prior to pruning, \\method is able to focus the trigger effects on a limited number of neurons for more efficient pruning with less damage, outperforming existing pruning-based defense strategies. We implement \\method using Sarle's Bimodality Coefficient (SBC) which is optimized as the criterion for the transformation matrix based on the separability assumption of benign and poisoned features. Extensive experimental results demonstrate the superiority of our method. 
On average, our approach substantially reduces the ASR by 4.5x and increases the ACC by 1.45\\% compared with the recently strong baselines.", "keywords": "backdoor defense;backdoor attack;neuron pruning", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "Runkai Zheng;Jindong Wang;Xuanchang Xu;Li Liu;Jianze Li;Xing Xie", "authorids": "~Runkai_Zheng1;~Jindong_Wang1;~Xuanchang_Xu2;~Li_Liu8;~Jianze_Li1;~Xing_Xie3", "gender": "M;M;F;M;M;M", "homepage": ";https://github.com/EricXuXuanchang;https://liliu-avril.github.io/;http://www.sribd.cn/teacher/21;http://research.microsoft.com/en-us/people/xingx/;https://jd92.wang/", "dblp": ";;33/4528-36;195/6246;08/6809-1;19/2969-1", "google_scholar": ";;KQ2S01UAAAAJ;;5EQfAFIAAAAJ;hBZ_tKsAAAAJ", "orcid": ";;;0000-0002-0760-7994;0000-0002-8608-8482;0000-0002-4833-0880", "linkedin": "%E6%B6%A6%E9%94%B4-%E9%83%91-551606156/;;;;xingx/;jindong-wang/", "or_profile": "~Runkai_Zheng1;~Xuanchang_Xu2;~Li_Liu8;~Jianze_Li1;~Xing_Xie3;~Jindong_Wang4", "aff": "Carnegie Mellon University;National University of Singapore;The Hong Kong University of Science and Technology (Guangzhou);;Microsoft Research Asia;Microsoft Research", "aff_domain": "andrew.cmu.edu;nus.edu;hkust-gz.edu.cn;;microsoft.com;microsoft.com", "position": "MS student;MS student;Assistant Professor;;Senior Principal Researcher;Researcher", "bibtex": "@misc{\nzheng2024directional,\ntitle={Directional Rank Reduction for Backdoor Defense},\nauthor={Runkai Zheng and Jindong Wang and Xuanchang Xu and Li Liu and Jianze Li and Xing Xie},\nyear={2024},\nurl={https://openreview.net/forum?id=7QlKLvfVge}\n}", "github": "", "project": "", "reviewers": "X3hw;niUP;7hoR;1xjT", "site": "https://openreview.net/forum?id=7QlKLvfVge", "pdf_size": 546454, "rating": "5;5;5;6", "confidence": "3;4;4;4", "soundness": "2;3;2;3", "contribution": "2;3;3;3", "presentation": "3;2;3;3", "wc_summary": "68;68;94;33", "wc_strengths": "44;46;30;30", "wc_weaknesses": "178;136;132;79", "wc_questions": "44;78;26;8", "wc_review": "334;328;282;150", "wc_reply_reviewers": "101;0;0;0", "wc_reply_authors": "1126;900;1661;630", "reply_reviewers": "1;0;0;0", "reply_authors": "2;2;2;1", "rating_avg": [ 5.25, 0.4330127018922193 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 65.75, 21.683807322516035 ], "wc_strengths_avg": [ 37.5, 7.533259586659682 ], "wc_weaknesses_avg": [ 131.25, 35.13812032536743 ], "wc_questions_avg": [ 39.0, 25.865034312755125 ], "wc_review_avg": [ 273.5, 74.0860985610661 ], "wc_reply_reviewers_avg": [ 25.25, 43.73428289111415 ], "wc_reply_authors_avg": [ 1079.25, 379.00354549792803 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.75, 0.4330127018922193 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.3333333333333333, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:ABg7mFflFPsJ:scholar.google.com/&scioq=Directional+Rank+Reduction+for+Backdoor+Defense&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1;2;3;3", "aff_unique_norm": "Carnegie Mellon University;National University of Singapore;Hong Kong University of Science and Technology;Microsoft", "aff_unique_dep": ";;;Research", "aff_unique_url": 
"https://www.cmu.edu;https://www.nus.edu.sg;https://www.ust.hk;https://www.microsoft.com/en-us/research/group/asia", "aff_unique_abbr": "CMU;NUS;HKUST;MSR Asia", "aff_campus_unique_index": "1;2", "aff_campus_unique": ";Guangzhou;Asia", "aff_country_unique_index": "0;1;2;2;0", "aff_country_unique": "United States;Singapore;China" }, { "id": "7QncaLObzi", "title": "Binary Hyperbolic Embeddings", "track": "main", "status": "Reject", "tldr": "", "abstract": "As datasets continue to grow, vector-based search becomes more storage and compute intensive, requiring large-scale systems to support retrieval. Proposed solutions range from quantization techniques that balance speed and accuracy, to hashing methods that learn compact binary representations. This paper promotes the use of hyperbolic space for its compact nature whilst overcoming its slow retrieval via binarization. Specifically, we address hyperbolic space's inherent slowness by proving that its complex similarity calculations can be equated to a binary XOR operation. Our approach allows for 90% less storage and at least 4.7 times faster search while maintaining performance of full-precision Euclidean embeddings.", "keywords": "Hyperbolic;Binary;Hierarchical", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Teng Long;Pascal Mettes;Nanne Van Noord", "authorids": "~Teng_Long2;~Pascal_Mettes1;~Nanne_Van_Noord1", "gender": "M;M;M", "homepage": "http://tenglon.github.io/;https://staff.fnwi.uva.nl/p.s.m.mettes/;https://nanne.github.io/", "dblp": ";147/4008;123/5104.html", "google_scholar": "5Iv3ul0AAAAJ;https://scholar.google.nl/citations?user=sMQxA3AAAAAJ;wFDJzDkAAAAJ", "orcid": "0000-0002-2380-9502;0000-0001-9275-5942;0000-0002-5145-3603", "linkedin": "tenglong-926500116/;;", "or_profile": "~Teng_Long2;~Pascal_Mettes1;~Nanne_Van_Noord1", "aff": "University of Amsterdam, University of Amsterdam;University of Amsterdam;University of Amsterdam", "aff_domain": "ivi.uva.nl;uva.nl;uva.nl", "position": "Postdoc;Assistant Professor;Assistant Professor", "bibtex": "@misc{\nlong2024binary,\ntitle={Binary Hyperbolic Embeddings},\nauthor={Teng Long and Pascal Mettes and Nanne Van Noord},\nyear={2024},\nurl={https://openreview.net/forum?id=7QncaLObzi}\n}", "github": "", "project": "", "reviewers": "5iHW;4fSp;AY1W;d3do", "site": "https://openreview.net/forum?id=7QncaLObzi", "pdf_size": 10093397, "rating": "5;6;6;6", "confidence": "3;5;3;3", "soundness": "3;3;3;3", "contribution": "3;3;3;3", "presentation": "3;3;3;3", "wc_summary": "96;39;67;67", "wc_strengths": "32;41;26;72", "wc_weaknesses": "156;43;144;250", "wc_questions": "34;34;114;147", "wc_review": "318;157;351;536", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "1077;373;370;424", "reply_reviewers": "0;0;0;0", "reply_authors": "2;1;1;1", "rating_avg": [ 5.75, 0.4330127018922193 ], "confidence_avg": [ 3.5, 0.8660254037844386 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 67.25, 20.154093876927337 ], "wc_strengths_avg": [ 42.75, 17.711225254058512 ], "wc_weaknesses_avg": [ 148.25, 73.32930860167713 ], "wc_questions_avg": [ 82.25, 49.6405831956072 ], "wc_review_avg": [ 340.5, 134.63747620926353 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 561.0, 298.68461627609815 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 3, 0 ], 
"corr_rating_confidence": 0.3333333333333333, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=4136104022654752726&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 0, "aff_unique_index": "0;0;0", "aff_unique_norm": "University of Amsterdam", "aff_unique_dep": "", "aff_unique_url": "https://www.uva.nl", "aff_unique_abbr": "UvA", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "Netherlands" }, { "id": "7Rf2j94H1x", "title": "Episode Transformer: Model-based Episodic Reinforcement Learning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Episodic Reinforcement Learning (ERL) with movement primitives (MPs) has recently achieved significant success, especially in sparse and non-Markovian reward scenarios. By reasoning directly at the trajectory level via MPs, ERL results in smoother, energy-efficient policies and improved exploration capabilities for many real-world tasks. However, these black-box optimization approaches have very poor data-efficiency making them impractical for real-world applications. To mitigate this drawback, we propose Episode Transformer, a model-based ERL algorithm. Here, we learn a transformer-based episodic world model. To perform control we train a policy, with trust region constraints, purely in the world model's imagination. We compare our approach to state-of-the-art step-based and episodic RL methods on a variety of challenging robotic tasks under dense, sparse, and non-Markovian reward settings. The results show that the Episode Transformer is able to learn high-quality policies that retain all the benefits of previous deep ERL methods while requiring up to 5x fewer environment samples.", "keywords": "Episodic RL;Model-based RL;Movement Primitives", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Ruben Jacob;Vaisakh Shaj;Philipp Becker;Gerhard Neumann", "authorids": "~Ruben_Jacob1;~Vaisakh_Shaj1;~Philipp_Becker1;~Gerhard_Neumann2", "gender": ";M;M;M", "homepage": ";;;https://alr.anthropomatik.kit.edu/", "dblp": ";190/3994;66/1316;60/4878", "google_scholar": ";;https://scholar.google.de/citations?user=jXx-LuQAAAAJ;https://scholar.google.com.tw/citations?user=GL360kMAAAAJ", "orcid": ";;;", "linkedin": "ruben-jacob-067735249/;;;", "or_profile": "~Ruben_Jacob1;~Vaisakh_Shaj1;~Philipp_Becker1;~Gerhard_Neumann1", "aff": ";Karlsruhe Institute of Technology;FZI Forschungszentrum Informatik ;Karlsruhe Institute of Technology", "aff_domain": ";kit.edu;fzi.de;kit.edu", "position": ";PhD student;Researcher;Full Professor", "bibtex": "@misc{\njacob2024episode,\ntitle={Episode Transformer: Model-based Episodic Reinforcement Learning},\nauthor={Ruben Jacob and Vaisakh Shaj and Philipp Becker and Gerhard Neumann},\nyear={2024},\nurl={https://openreview.net/forum?id=7Rf2j94H1x}\n}", "github": "", "project": "", "reviewers": "Q5Ym;in4T;kg3S;AjWh", "site": "https://openreview.net/forum?id=7Rf2j94H1x", "pdf_size": 2200445, "rating": "3;3;3;5", "confidence": "2;3;3;4", "soundness": "2;2;2;2", "contribution": "2;2;2;2", "presentation": "2;2;2;3", "wc_summary": "64;145;91;87", "wc_strengths": "13;35;54;15", "wc_weaknesses": "65;246;334;116", "wc_questions": "29;42;61;79", "wc_review": "171;468;540;297", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 3.5, 0.8660254037844386 ], "confidence_avg": [ 3.0, 0.7071067811865476 ], "soundness_avg": [ 2.0, 
0.0 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 96.75, 29.701641368786337 ], "wc_strengths_avg": [ 29.25, 16.67895380412093 ], "wc_weaknesses_avg": [ 190.25, 106.03389788176231 ], "wc_questions_avg": [ 52.75, 18.952242611363964 ], "wc_review_avg": [ 369.0, 144.42125882293092 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.816496580927726, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:YNHREC3LGtsJ:scholar.google.com/&scioq=Episode+Transformer:+Model-based+Episodic+Reinforcement+Learning&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;1;0", "aff_unique_norm": "Karlsruhe Institute of Technology;FZI Forschungszentrum Informatik", "aff_unique_dep": ";", "aff_unique_url": "https://www.kit.edu;https://www.fzi.de", "aff_unique_abbr": "KIT;FZI", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "Germany" }, { "id": "7Scc7Nl7lg", "title": "Revealing Vision-Language Integration in the Brain with Multimodal Networks", "track": "main", "status": "Reject", "tldr": "", "abstract": "We use multimodal deep neural networks to identify sites of multimodal integration in the human brain. These are regions where a multimodal language-vision model is better at predicting neural recordings (stereoelectroencephalography, SEEG) than either a unimodal language, unimodal vision model, or a linearly-integrated language-vision model. We use a wide range of state-of-the-art models spanning different architectures including Transformers and CNNs (ALBEF, BLIP, Flava, ConvNeXt, BEIT, SIMCLR, CLIP, SLIP) with different multimodal integration approaches to model the SEEG signal while subjects watched movies. As a key enabling step, we first demonstrate that the approach has the resolution to distinguish trained from randomly-initialized models for both language and vision; the inability to do so would fundamentally hinder further analysis. We show that trained models systematically outperform randomly initialized models in their ability to predict the SEEG signal. We then compare unimodal and multimodal models against one another. A key contribution is standardizing the methodology for doing so while carefully avoiding statistical artifacts. Since models all have different architectures, number of parameters, and training sets which can obscure the results, we then carry out a test between two controlled models: SLIP-Combo and SLIP-SimCLR which keep all of these attributes the same aside from multimodal input. Using this method, we identify neural sites (on average 141 out of 1090 total sites or 12.94\\%) and brain regions where multimodal integration is occurring. 
We find numerous new sites of multimodal integration, many of which lie around the temporoparietal junction, long theorized to be a hub of multimodal integration.", "keywords": "Vision and language in the brain;multimodal processing;encoding models", "primary_area": "applications to neuroscience & cognitive science", "supplementary_material": "/attachment/eb0f25e91d6c84d21fa6637156456d34106a4e27.zip", "author": "Vighnesh Subramaniam;Colin Conwell;Christopher Wang;Gabriel Kreiman;Boris Katz;Ignacio Cases;Andrei Barbu", "authorids": "~Vighnesh_Subramaniam1;~Colin_Conwell1;~Christopher_Wang1;~Gabriel_Kreiman1;~Boris_Katz1;~Ignacio_Cases2;~Andrei_Barbu3", "gender": ";;;M;M;Non-Binary;M", "homepage": "https://vsubramaniam851.github.io;;https://czlwang.github.io/;http://klab.tch.harvard.edu;http://people.csail.mit.edu/boris/boris.html;;https://0xab.com", "dblp": ";;;12/1367;k/BorisKatz;;58/8365", "google_scholar": "https://scholar.google.com/citations?hl=en;https://scholar.google.com/citations?hl=en;;WxZ_6nsAAAAJ;FdNuUb8AAAAJ;9-TdgYMAAAAJ;t1rjgHgAAAAJ", "orcid": ";0000-0002-7754-1580;;0000-0003-3505-8475;;;", "linkedin": "vighnesh-subramaniam-34549717b/;;;kreiman/;;;andrei-barbu-1166131", "or_profile": "~Vighnesh_Subramaniam1;~Colin_Conwell1;~Christopher_Wang1;~Gabriel_Kreiman1;~Boris_Katz1;~Ignacio_Cases2;~Andrei_Barbu3", "aff": "Massachusetts Institute of Technology;Johns Hopkins University;Computer Science and Artificial Intelligence Laboratory, Electrical Engineering & Computer Science;Harvard Medical School;Massachusetts Institute of Technology;Massachusetts Institute of Technology;Massachusetts Institute of Technology", "aff_domain": "mit.edu;jhu.edu;csail.mit.edu;harvard.edu;mit.edu;mit.edu;mit.edu", "position": "MS student;Postdoc;PhD student;Full Professor;Principal Research Scientist;Postdoc;Researcher", "bibtex": "@misc{\nsubramaniam2024revealing,\ntitle={Revealing Vision-Language Integration in the Brain with Multimodal Networks},\nauthor={Vighnesh Subramaniam and Colin Conwell and Christopher Wang and Gabriel Kreiman and Boris Katz and Ignacio Cases and Andrei Barbu},\nyear={2024},\nurl={https://openreview.net/forum?id=7Scc7Nl7lg}\n}", "github": "", "project": "", "reviewers": "KL3N;JsYq;HcSy;gGN5;9iyA", "site": "https://openreview.net/forum?id=7Scc7Nl7lg", "pdf_size": 30079476, "rating": "3;3;6;6;6", "confidence": "4;5;3;5;4", "soundness": "1;2;3;2;3", "contribution": "1;2;2;3;3", "presentation": "1;2;3;3;3", "wc_summary": "73;114;42;289;55", "wc_strengths": "16;66;68;91;93", "wc_weaknesses": "252;436;175;799;125", "wc_questions": "92;3;1;244;45", "wc_review": "433;619;286;1423;318", "wc_reply_reviewers": "0;187;0;0;20", "wc_reply_authors": "782;1372;588;1221;801", "reply_reviewers": "0;1;0;0;1", "reply_authors": "1;3;1;2;2", "rating_avg": [ 4.8, 1.469693845669907 ], "confidence_avg": [ 4.2, 0.7483314773547882 ], "soundness_avg": [ 2.2, 0.7483314773547882 ], "contribution_avg": [ 2.2, 0.7483314773547882 ], "presentation_avg": [ 2.4, 0.8 ], "wc_summary_avg": [ 114.6, 90.51983208115224 ], "wc_strengths_avg": [ 66.8, 27.76616646208115 ], "wc_weaknesses_avg": [ 357.4, 244.7763060428848 ], "wc_questions_avg": [ 77.0, 89.87769467448528 ], "wc_review_avg": [ 615.8, 420.10731962202226 ], "wc_reply_reviewers_avg": [ 41.4, 73.21092814600836 ], "wc_reply_authors_avg": [ 952.8, 294.26341940513095 ], "reply_reviewers_avg": [ 0.4, 0.48989794855663565 ], "reply_authors_avg": [ 1.8, 0.7483314773547883 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": 
-0.32732683535398854, "gs_citation": 7, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12071620120661180690&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 10, "aff_unique_index": "0;1;0;2;0;0;0", "aff_unique_norm": "Massachusetts Institute of Technology;Johns Hopkins University;Harvard University", "aff_unique_dep": ";;Medical School", "aff_unique_url": "https://web.mit.edu;https://www.jhu.edu;https://hms.harvard.edu", "aff_unique_abbr": "MIT;JHU;HMS", "aff_campus_unique_index": "1;2", "aff_campus_unique": ";Cambridge;Boston", "aff_country_unique_index": "0;0;0;0;0;0;0", "aff_country_unique": "United States" }, { "title": "Removing Biases from Molecular Representations via Information Maximization", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19360", "id": "7TOs9gjAg1", "author_site": "Chenyu Wang, Sharut Gupta, Caroline Uhler, Tommi Jaakkola", "tldr": "", "abstract": "High-throughput drug screening -- using cell imaging or gene expression measurements as readouts of drug effect -- is a critical tool in biotechnology to assess and understand the relationship between the chemical structure and biological activity of a drug. Since large-scale screens have to be divided into multiple experiments, a key difficulty is dealing with batch effects, which can introduce systematic errors and non-biological associations in the data. We propose InfoCORE, an Information maximization approach for COnfounder REmoval, to effectively deal with batch effects and obtain refined molecular representations. InfoCORE establishes a variational lower bound on the conditional mutual information of the latent representations given a batch identifier. It adaptively reweights samples to equalize their implied batch distribution. Extensive experiments on drug screening data reveal InfoCORE's superior performance in a multitude of tasks including molecular property prediction and molecule-phenotype retrieval. Additionally, we show results for how InfoCORE offers a versatile framework and resolves general distribution shifts and issues of data fairness by minimizing correlation with spurious features or removing sensitive attributes.", "keywords": "Molecular Representation;Batch Effect;Contrastive Learning;Information Maximization;Drug Discovery", "primary_area": "applications to physical sciences (physics, chemistry, biology, etc.)", "supplementary_material": "", "author": "Chenyu Wang;Sharut Gupta;Caroline Uhler;Tommi S. Jaakkola", "authorids": "~Chenyu_Wang7;~Sharut_Gupta1;~Caroline_Uhler1;~Tommi_S._Jaakkola1", "gender": ";F;F;", "homepage": ";https://www.mit.edu/~sharut/;https://www.carolineuhler.com/;", "dblp": ";;66/10813;", "google_scholar": ";https://scholar.google.com/citations?hl=en;https://scholar.google.com.tw/citations?user=dIJFcaoAAAAJ;", "orcid": ";;;", "linkedin": ";sharut-gupta/;;", "or_profile": "~Chenyu_Wang7;~Sharut_Gupta1;~Caroline_Uhler1;~Tommi_S._Jaakkola1", "aff": ";Google;Electrical Engineering & Computer Science, Massachusetts Institute of Technology;", "aff_domain": ";google.com;eecs.mit.edu;", "position": ";Student Researcher;Associate Professor;", "bibtex": "@inproceedings{\nwang2024removing,\ntitle={Removing Biases from Molecular Representations via Information Maximization},\nauthor={Chenyu Wang and Sharut Gupta and Caroline Uhler and Tommi S. 
Jaakkola},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=7TOs9gjAg1}\n}", "github": "", "project": "", "reviewers": "Tyeq;JEFo;g7wR;FJph", "pdf_size": 5869947, "rating": "6;6;6;8", "confidence": "2;3;3;3", "soundness": "3;2;3;3", "contribution": "3;2;2;3", "presentation": "3;2;3;4", "wc_summary": "107;63;204;96", "wc_strengths": "81;12;97;80", "wc_weaknesses": "85;27;419;159", "wc_questions": "30;278;137;2", "wc_review": "303;380;857;337", "wc_reply_reviewers": "20;42;254;155", "wc_reply_authors": "634;2445;1944;382", "reply_reviewers": "1;1;1;2", "reply_authors": "1;5;4;2", "rating_avg": [ 6.5, 0.8660254037844386 ], "confidence_avg": [ 2.75, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 117.5, 52.5 ], "wc_strengths_avg": [ 67.5, 32.745228660065884 ], "wc_weaknesses_avg": [ 172.5, 149.80904512078035 ], "wc_questions_avg": [ 111.75, 108.40289433405364 ], "wc_review_avg": [ 469.25, 225.5242503590246 ], "wc_reply_reviewers_avg": [ 117.75, 93.86792583199014 ], "wc_reply_authors_avg": [ 1351.25, 866.2468975413418 ], "reply_reviewers_avg": [ 1.25, 0.4330127018922193 ], "reply_authors_avg": [ 3.0, 1.5811388300841898 ], "replies_avg": [ 25, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.3333333333333333, "gs_citation": 4, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=4157904962319405770&as_sdt=80000005&sciodt=0,23&hl=en", "gs_version_total": 8, "openreview": "https://openreview.net/forum?id=7TOs9gjAg1", "pdf": "https://openreview.net/pdf?id=7TOs9gjAg1", "email": ";google.com;eecs.mit.edu;", "author_num": 4, "aff_unique_index": "0;1", "aff_unique_norm": "Google;Massachusetts Institute of Technology", "aff_unique_dep": "Google;Electrical Engineering & Computer Science", "aff_unique_url": "https://www.google.com;https://web.mit.edu", "aff_unique_abbr": "Google;MIT", "aff_campus_unique_index": "0;1", "aff_campus_unique": "Mountain View;Cambridge", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "title": "BooookScore: A systematic exploration of book-length summarization in the era of LLMs", "status": "Oral", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19359", "id": "7Ttk3RzDeu", "author_site": "Yapei Chang, Kyle Lo, Tanya Goyal, Mohit Iyyer", "tldr": "", "abstract": "Summarizing book-length documents ($>$100K tokens) that exceed the context window size of large language models (LLMs) requires first breaking the input document into smaller chunks and then prompting an LLM to merge, update, and compress chunk-level summaries. Despite the complexity and importance of this task, it has yet to be meaningfully studied due to the challenges of evaluation: existing book-length summarization datasets (e.g., BookSum) are in the pretraining data of most public LLMs, and existing evaluation methods struggle to capture errors made by modern LLM summarizers. In this paper, we present the first study of the coherence of LLM-based book-length summarizers implemented via two prompting workflows: (1) hierarchically merging chunk-level summaries, and (2) incrementally updating a running summary. We obtain 1193 fine-grained human annotations on GPT-4 generated summaries of 100 recently-published books and identify eight common types of coherence errors made by LLMs. 
Because human evaluation is expensive and time-consuming, we develop an automatic metric, BooookScore, that measures the proportion of sentences in a summary that do not contain any of the identified error types. BooookScore has high agreement with human annotations and allows us to systematically evaluate the impact of many other critical parameters (e.g., chunk size, base LLM) while saving \\$15K USD and 500 hours in human evaluation costs. We find that closed-source LLMs such as GPT-4 and Claude 2 produce summaries with higher BooookScore than those generated by open-source models. While LLaMA 2 falls behind other models, Mixtral achieves performance on par with GPT-3.5-Turbo. Incremental updating yields lower BooookScore but higher level of detail than hierarchical merging, a trade-off sometimes preferred by annotators. We release code and annotations to spur more principled research on book-length summarization.", "keywords": "summarization;evaluation;long context;prompting;LLM", "primary_area": "datasets and benchmarks", "supplementary_material": "", "author": "Yapei Chang;Kyle Lo;Tanya Goyal;Mohit Iyyer", "authorids": "~Yapei_Chang1;~Kyle_Lo1;~Tanya_Goyal1;~Mohit_Iyyer1", "gender": "F;;F;M", "homepage": "https://lilakk.github.io/;https://kyleclo.github.io/;;http://cs.umass.edu/~miyyer", "dblp": "316/9933;220/2020;176/9145;148/9178", "google_scholar": "qCjnm-UAAAAJ;VJS12uMAAAAJ;w72MSFoAAAAJ;rBVA5tcAAAAJ", "orcid": ";;;", "linkedin": "ella-yapei-chang/;kylelo/;;", "or_profile": "~Yapei_Chang1;~Kyle_Lo1;~Tanya_Goyal1;~Mohit_Iyyer1", "aff": "University of Massachusetts at Amherst;Allen Institute for Artificial Intelligence;Princeton University;University of Massachusetts Amherst", "aff_domain": "umass.edu;allenai.org;princeton.edu;cs.umass.edu", "position": "PhD student;Researcher;Postdoc;Associate Professor", "bibtex": "@inproceedings{\nchang2024booookscore,\ntitle={BooookScore: A systematic exploration of book-length summarization in the era of {LLM}s},\nauthor={Yapei Chang and Kyle Lo and Tanya Goyal and Mohit Iyyer},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=7Ttk3RzDeu}\n}", "github": "", "project": "", "reviewers": "vK8q;hJ5Z;rPVA;SAFf", "pdf_size": 599451, "rating": "8;8;8;10", "confidence": "4;4;4;5", "soundness": "3;3;4;4", "contribution": "3;4;4;4", "presentation": "3;4;4;4", "wc_summary": "39;202;36;61", "wc_strengths": "52;55;50;250", "wc_weaknesses": "145;145;45;43", "wc_questions": "114;67;1;11", "wc_review": "350;469;132;365", "wc_reply_reviewers": "546;66;0;0", "wc_reply_authors": "796;604;288;234", "reply_reviewers": "1;1;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 8.5, 0.8660254037844386 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 3.5, 0.5 ], "contribution_avg": [ 3.75, 0.4330127018922193 ], "presentation_avg": [ 3.75, 0.4330127018922193 ], "wc_summary_avg": [ 84.5, 68.52189431123456 ], "wc_strengths_avg": [ 101.75, 85.61067398403075 ], "wc_weaknesses_avg": [ 94.5, 50.50495025242575 ], "wc_questions_avg": [ 48.25, 45.53775905773142 ], "wc_review_avg": [ 329.0, 122.6234072271685 ], "wc_reply_reviewers_avg": [ 153.0, 228.49288829195538 ], "wc_reply_authors_avg": [ 480.5, 230.54880177524237 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 1.0, "gs_citation": 115, "gs_cited_by_link": 
"https://scholar.google.com/scholar?cites=17968620361685249119&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=7Ttk3RzDeu", "pdf": "https://openreview.net/pdf?id=7Ttk3RzDeu", "email": "umass.edu;allenai.org;princeton.edu;cs.umass.edu", "author_num": 4, "aff_unique_index": "0;1;2;0", "aff_unique_norm": "University of Massachusetts Amherst;Allen Institute for Artificial Intelligence;Princeton University", "aff_unique_dep": ";;", "aff_unique_url": "https://www.umass.edu;https://allenai.org;https://www.princeton.edu", "aff_unique_abbr": "UMass Amherst;AI2;Princeton", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Amherst;", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "id": "7U5QE9T4hI", "title": "Learning to Extrapolate and Adjust: Two-Stage Meta-Learning for Concept Drift in Online Time Series Forecasting", "track": "main", "status": "Reject", "tldr": "", "abstract": "The non-stationary nature of time series data in many real-world applications makes accurate time series forecasting challenging. In this paper, we consider concept drift where the underlying distribution or environment of time series changes. We first classify concepts into two categories, macro-drift corresponding to stable and long-term changes and micro-drift referring to sudden or short-term changes. Next, we propose a unified meta-learning framework called LEAF (Learning to Extrapolate and Adjust for Forecasting). Specifically, an extrapolation module is first meta-learnt to track the dynamics of the prediction model in latent space and extrapolate to the future considering macro-drift. Then an adjustment module incorporates meta-learnable surrogate loss to capture sample-specific micro-drift patterns. Through this two-stage framework, different types of concept drifts can be handled. In particular, LEAF is model-agnostic and can be applied to any deep prediction model. To further advance the research of concept drift on time series, we open source three electric load time series datasets collected from real-world scenarios, which exhibit diverse and typical concept drifts and are ideal benchmark datasets for further research. 
Extensive experiments on multiple datasets demonstrate the effectiveness of LEAF.", "keywords": "time series forecasting;concept drift;meta learning", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/c2d1a81a6325615723201ac7aa0fdf556cc11293.pdf", "author": "Zhaoyang Zhu;Weiqi Chen;YiFan Zhang;Qingsong Wen;Liang Sun", "authorids": "~Zhaoyang_Zhu1;~Weiqi_Chen1;~YiFan_Zhang8;~Qingsong_Wen2;~Liang_Sun2", "gender": ";M;M;M;M", "homepage": "https://github.com/DAMO-DI-ML;https://github.com/DAMO-DI-ML;https://www.linkedin.com/in/liang-sun-a0a87621/;https://sites.google.com/site/qingsongwen8/;https://yfzhang114.github.io/", "dblp": "https://dblp.org/rec/journals/corr/abs-2403-14949;;18/5837-1;27/561;", "google_scholar": ";dMg_soMAAAAJ;D_cOMBgAAAAJ;vjPJvwYAAAAJ;lUnt8X4AAAAJ", "orcid": "0009-0009-0265-9910;0009-0007-9246-9402;0009-0002-5835-7259;0000-0003-4516-2524;0000-0002-6227-0183", "linkedin": ";;;qingsong-wen-22814156/;", "or_profile": "~Zhaoyang_Zhu1;~Weiqi_Chen1;~Liang_Sun2;~Qingsong_Wen1;~yifan_zhang7", "aff": "Alibaba Group;Alibaba Group;Alibaba Group;Squirrel Ai Learning;Institute of automation, Chinese academy of science", "aff_domain": "alibaba-inc.com;alibaba-inc.com;alibaba-inc.com;squirrelai.com;nlpr.ia.ac.cn", "position": "Researcher;Researcher;Staff Software Engineer;Principal Researcher;PhD student", "bibtex": "@misc{\nzhu2024learning,\ntitle={Learning to Extrapolate and Adjust: Two-Stage Meta-Learning for Concept Drift in Online Time Series Forecasting},\nauthor={Zhaoyang Zhu and Weiqi Chen and YiFan Zhang and Qingsong Wen and Liang Sun},\nyear={2024},\nurl={https://openreview.net/forum?id=7U5QE9T4hI}\n}", "github": "", "project": "", "reviewers": "rgPM;RMU1;CCky;9YY8;5qcj;x7gB", "site": "https://openreview.net/forum?id=7U5QE9T4hI", "pdf_size": 2673574, "rating": "3;5;5;5;6;8", "confidence": "4;4;4;4;3;4", "soundness": "2;2;3;3;3;3", "contribution": "2;2;3;3;3;3", "presentation": "2;2;3;3;3;3", "wc_summary": "63;150;96;197;138;68", "wc_strengths": "34;50;50;81;67;61", "wc_weaknesses": "290;183;46;197;214;88", "wc_questions": "35;122;5;72;103;5", "wc_review": "422;505;197;547;522;222", "wc_reply_reviewers": "125;189;20;0;0;63", "wc_reply_authors": "1245;1622;406;656;1135;549", "reply_reviewers": "1;1;1;0;0;1", "reply_authors": "4;3;1;2;2;1", "rating_avg": [ 5.333333333333333, 1.4907119849998596 ], "confidence_avg": [ 3.8333333333333335, 0.3726779962499649 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 118.66666666666667, 47.73421786889941 ], "wc_strengths_avg": [ 57.166666666666664, 14.82584080433739 ], "wc_weaknesses_avg": [ 169.66666666666666, 80.96638534327413 ], "wc_questions_avg": [ 57.0, 45.566800780100124 ], "wc_review_avg": [ 402.5, 141.9257434952048 ], "wc_reply_reviewers_avg": [ 66.16666666666667, 70.05573178231425 ], "wc_reply_authors_avg": [ 935.5, 431.0347047125865 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 2.1666666666666665, 1.0671873729054748 ], "replies_avg": [ 25, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.19999999999999998, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:zuPLExgdwQ8J:scholar.google.com/&scioq=Learning+to+Extrapolate+and+Adjust:+Two-Stage+Meta-Learning+for+Concept+Drift+in+Online+Time+Series+Forecasting&hl=en&as_sdt=0,5", 
"gs_version_total": 0, "aff_unique_index": "0;0;0;1;2", "aff_unique_norm": "Alibaba Group;Squirrel Ai Learning;Chinese Academy of Sciences", "aff_unique_dep": ";;Institute of Automation", "aff_unique_url": "https://www.alibaba.com;https://www.squirrelai.com/;http://www.ia.cas.cn", "aff_unique_abbr": "Alibaba;;CAS", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "China" }, { "id": "7UHlKybsQM", "title": "EFFICIENT QUANTUM STATE RECONSTRUCTION USING UNSUPERVISED LEARNING FOR QUANTUM CIRCUIT CUTTING", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Current quantum computer (QC) fabrication encounters challenges when attempting to scale up the number of qubits. These challenges include errors, physical limitations, interference, and various other factors. As a remedy, quantum circuit cutting holds the promise for studying large quantum systems with the limited qubit capacity of quantum computers today. With quantum circuit cutting, the output of a large quantum circuit could be obtained through classical post-processing of fragmented circuit outputs acquired through different measurement and preparation bases. However, such reconstruction process results in exponential quantum measurement cost with the increase in the number of circuit cuts. In this paper, we demonstrate efficient state reconstruction using a Restricted Boltzmann Machine (RBM) with polynomial resource scaling. We explore the benefits of unsupervised learning for simulating extensive quantum systems, exemplified by the reconstruction of highly entangled multi-qubit Greenberger\u2013Horne\u2013Zeilinger (GHZ) states from fragmented circuits. Our experiments illustrate that fragmented GHZ circuits, at the state-of-the-art scale of up to $18$ qubits, can be reconstructed with near-perfect fidelity using only $100$ sample measurements compared to $4^{18}$ sample measurements needed otherwise.", "keywords": "Unsupervised learning;state tomography;quantum computing", "primary_area": "applications to physical sciences (physics, chemistry, biology, etc.)", "supplementary_material": "", "author": "vinitha balachandran;Benjamin Chen Ming Choong;Nitin Shivaraman;Zhehui Wang;Liwei Yang;Rick Siow Mong Goh;Tao Luo", "authorids": "~vinitha_balachandran1;~Benjamin_Chen_Ming_Choong1;~Nitin_Shivaraman1;~Zhehui_Wang2;~Liwei_Yang2;~Rick_Siow_Mong_Goh1;~Tao_Luo2", "gender": "F;;M;M;;M;", "homepage": ";https://www.linkedin.com/in/benjamin-choong-ba6001179/;https://nitinshivaraman.github.io;;https://sites.google.com/view/rickgoh/home;;http://zhehui-wang.github.io", "dblp": ";322/4020;;;https://dblp.uni-trier.de/pers/g/Goh:Rick_Siow_Mong;43/4720-14;", "google_scholar": "https://scholar.google.com.sg/citations?user=b7LGxKkAAAAJ;;umM6yZsAAAAJ;;https://scholar.google.com.sg/citations?user=fBsBJjoAAAAJ;d4KZI8MAAAAJ;", "orcid": ";;0000-0002-3208-8495;0000-0002-0327-714X;0000-0001-9116-1595;0000-0002-3415-3676;", "linkedin": ";;nitinshivaraman/;;rickgoh/;;", "or_profile": "~vinitha_balachandran1;~Benjamin_Chen_Ming_Choong1;~Nitin_Shivaraman1;~Liwei_Yang2;~Rick_Siow_Mong_Goh1;~Tao_Luo2;~zhehui_wang1", "aff": "Institute of High Performance Computing, Singapore, A*STAR;Institute of High Performance Computing, Singapore, A*STAR;Institute of High Performance Computing, Singapore, A*STAR;Institute of High Performance Computing, Singapore, A*STAR;Institute of High Performance Computing, Singapore, A*STAR;Institute of High Performance Computing, Singapore, A*STAR;Institute of 
High Performance Computing, Singapore, A*STAR", "aff_domain": "ihpc.a-star.edu.sg;ihpc.a-star.edu.sg;ihpc.a-star.edu.sg;ihpc.a-star.edu.sg;ihpc.a-star.edu.sg;ihpc.a-star.edu.sg;ihpc.a-star.edu.sg", "position": "Researcher;Researcher;Researcher;Researcher;Director;Researcher;Researcher", "bibtex": "@misc{\nbalachandran2024efficient,\ntitle={{EFFICIENT} {QUANTUM} {STATE} {RECONSTRUCTION} {USING} {UNSUPERVISED} {LEARNING} {FOR} {QUANTUM} {CIRCUIT} {CUTTING}},\nauthor={vinitha balachandran and Benjamin Chen Ming Choong and Nitin Shivaraman and Zhehui Wang and Liwei Yang and Rick Siow Mong Goh and Tao Luo},\nyear={2024},\nurl={https://openreview.net/forum?id=7UHlKybsQM}\n}", "github": "", "project": "", "reviewers": "kuyP;YKiP;DHPz;GKSV", "site": "https://openreview.net/forum?id=7UHlKybsQM", "pdf_size": 2249405, "rating": "3;3;3;5", "confidence": "4;4;4;3", "soundness": "2;3;3;2", "contribution": "1;1;2;2", "presentation": "2;3;2;3", "wc_summary": "63;53;73;59", "wc_strengths": "21;48;49;98", "wc_weaknesses": "89;150;65;327", "wc_questions": "42;276;228;48", "wc_review": "215;527;415;532", "wc_reply_reviewers": "26;10;0;0", "wc_reply_authors": "508;255;139;190", "reply_reviewers": "1;1;0;0", "reply_authors": "2;1;1;1", "rating_avg": [ 3.5, 0.8660254037844386 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 1.5, 0.5 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 62.0, 7.280109889280518 ], "wc_strengths_avg": [ 54.0, 27.7758888246623 ], "wc_weaknesses_avg": [ 157.75, 102.51188955433413 ], "wc_questions_avg": [ 148.5, 104.90352710943517 ], "wc_review_avg": [ 422.25, 128.47446244293064 ], "wc_reply_reviewers_avg": [ 9.0, 10.63014581273465 ], "wc_reply_authors_avg": [ 273.0, 141.76917859675987 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -1.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:YBATzIG-VC4J:scholar.google.com/&scioq=EFFICIENT+QUANTUM+STATE+RECONSTRUCTION+USING+UNSUPERVISED+LEARNING+FOR+QUANTUM+CIRCUIT+CUTTING&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;0;0;0;0;0", "aff_unique_norm": "Institute of High Performance Computing", "aff_unique_dep": "", "aff_unique_url": "https://www.ihpc.a-star.edu.sg", "aff_unique_abbr": "IHPC", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0;0", "aff_country_unique": "Singapore" }, { "title": "Beam Enumeration: Probabilistic Explainability For Sample Efficient Self-conditioned Molecular Design", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19358", "id": "7UhxsmbdaQ", "author_site": "Jeff Guo, Philippe Schwaller", "tldr": "", "abstract": "Generative molecular design has moved from proof-of-concept to real-world applicability, as marked by the surge in very recent papers reporting experimental validation. Key challenges in explainability and sample efficiency present opportunities to enhance generative design to directly optimize expensive high-fidelity oracles and provide actionable insights to domain experts. Here, we propose Beam Enumeration to exhaustively enumerate the most probable sub-sequences from language-based molecular generative models and show that molecular substructures can be extracted. 
When coupled with reinforcement learning, extracted substructures become meaningful, providing a source of explainability and improving sample efficiency through self-conditioned generation. Beam Enumeration is generally applicable to any language-based molecular generative model and notably further improves the performance of the recently reported Augmented Memory algorithm, which achieved the new state-of-the-art on the Practical Molecular Optimization benchmark for sample efficiency. The combined algorithm generates more high reward molecules and faster, given a fixed oracle budget. Beam Enumeration shows that improvements to explainability and sample efficiency for molecular design can be made synergistic.", "keywords": "Molecular generative models;reinforcement learning;natural language processing;drug discovery;sample-efficiency;explainability", "primary_area": "applications to physical sciences (physics, chemistry, biology, etc.)", "supplementary_material": "", "author": "Jeff Guo;Philippe Schwaller", "authorids": "~Jeff_Guo1;~Philippe_Schwaller1", "gender": "M;M", "homepage": "https://guojeff.github.io/;https://schwallergroup.github.io", "dblp": ";209/9632", "google_scholar": "yzhfk_YAAAAJ;Tz0I4ywAAAAJ", "orcid": "0000-0002-4633-3199;0000-0003-3046-6576", "linkedin": "jeffguo1/;", "or_profile": "~Jeff_Guo1;~Philippe_Schwaller1", "aff": "Microsoft AI4Science;Swiss Federal Institute of Technology Lausanne", "aff_domain": "research.microsoft.com;epfl.ch", "position": "Intern;Assistant Professor", "bibtex": "@inproceedings{\nguo2024beam,\ntitle={Beam Enumeration: Probabilistic Explainability For Sample Efficient Self-conditioned Molecular Design},\nauthor={Jeff Guo and Philippe Schwaller},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=7UhxsmbdaQ}\n}", "github": "", "project": "", "reviewers": "wYf5;d4Xh;La1F;3svX", "pdf_size": 19002272, "rating": "3;8;8;8", "confidence": "4;5;4;4", "soundness": "2;3;4;4", "contribution": "1;3;3;4", "presentation": "2;3;4;3", "wc_summary": "34;78;90;150", "wc_strengths": "19;52;164;123", "wc_weaknesses": "205;202;488;67", "wc_questions": "9;92;12;23", "wc_review": "267;424;754;363", "wc_reply_reviewers": "0;140;137;0", "wc_reply_authors": "2112;3411;2552;831", "reply_reviewers": "0;2;4;0", "reply_authors": "4;8;5;2", "rating_avg": [ 6.75, 2.165063509461097 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 3.25, 0.82915619758885 ], "contribution_avg": [ 2.75, 1.0897247358851685 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 88.0, 41.42463035441596 ], "wc_strengths_avg": [ 89.5, 57.11610981150589 ], "wc_weaknesses_avg": [ 240.5, 153.3794314763228 ], "wc_questions_avg": [ 34.0, 33.88952640566109 ], "wc_review_avg": [ 452.0, 183.1215443359956 ], "wc_reply_reviewers_avg": [ 69.25, 69.25812226735576 ], "wc_reply_authors_avg": [ 2226.5, 931.3325131229984 ], "reply_reviewers_avg": [ 1.5, 1.6583123951777 ], "reply_authors_avg": [ 4.75, 2.165063509461097 ], "replies_avg": [ 32, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.3333333333333333, "gs_citation": 12, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=101114070671548311&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=7UhxsmbdaQ", "pdf": "https://openreview.net/pdf?id=7UhxsmbdaQ", "email": "research.microsoft.com;epfl.ch", "author_num": 2, "aff_unique_index": "0;1", "aff_unique_norm": "Microsoft;Swiss 
Federal Institute of Technology Lausanne", "aff_unique_dep": "AI4Science;", "aff_unique_url": "https://www.microsoft.com;https://www.epfl.ch", "aff_unique_abbr": "Microsoft;EPFL", "aff_campus_unique_index": "1", "aff_campus_unique": ";Lausanne", "aff_country_unique_index": "0;1", "aff_country_unique": "United States;Switzerland" }, { "title": "Provable Compositional Generalization for Object-Centric Learning", "status": "Oral", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19357", "id": "7VPTUWkiDQ", "author_site": "Thadd\u00e4us Wiedemer, Jack Brady, Alexander Panfilov, Attila Juhos, Matthias Bethge, Wieland Brendel", "tldr": "", "abstract": "Learning representations that generalize to novel compositions of known concepts is crucial for bridging the gap between human and machine perception. One prominent effort is learning object-centric representations, which are widely conjectured to enable compositional generalization. Yet, it remains unclear when this conjecture will be true, as a principled theoretical or empirical understanding of compositional generalization is lacking. In this work, we investigate when compositional generalization is guaranteed for object-centric representations through the lens of identifiability theory. We show that autoencoders that satisfy structural assumptions on the decoder and enforce encoder-decoder consistency will learn object-centric representations that provably generalize compositionally. We validate our theoretical result and highlight the practical relevance of our assumptions through experiments on synthetic image data.", "keywords": "compositional generalization;identifiability;object-centric learning;generalization;OOD generalization;unsupervised learning;slot attention;disentanglement;autoencoders;representation learning", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/33fd1c9b517dded8403690a54c5761cbb95fa832.zip", "author": "Thadd\u00e4us Wiedemer;Jack Brady;Alexander Panfilov;Attila Juhos;Matthias Bethge;Wieland Brendel", "authorids": "~Thadd\u00e4us_Wiedemer1;~Jack_Brady1;~Alexander_Panfilov1;~Attila_Juhos1;~Matthias_Bethge1;~Wieland_Brendel1", "gender": "M;;M;;M;M", "homepage": ";https://github.com/JackBrady;https://kotekjedi.github.io/;;https://bethgelab.org;", "dblp": "327/3433;;305/8752;228/6943;77/3005;37/11107", "google_scholar": "aeCiRSYAAAAJ;;https://scholar.google.com/citations?hl=en;35hg1Z8AAAAJ;https://scholar.google.com/citations?hl=en;v-JL-hsAAAAJ", "orcid": "0009-0003-6280-0804;;;;;", "linkedin": "thaddaeuswiedemer/;;kotekjedi/;;;", "or_profile": "~Thadd\u00e4us_Wiedemer1;~Jack_Brady1;~Alexander_Panfilov1;~Attila_Juhos1;~Matthias_Bethge1;~Wieland_Brendel1", "aff": "Max Planck Institute for Intelligent Systems;Max-Planck Institute;University of Tuebingen;Max-Planck Institute for Intelligent Systems;University of Tuebingen;ELLIS Institute T\u00fcbingen", "aff_domain": "is.tuebingen.mpg.de;mpg.de;tuebingen.de;mpg.tuebingen.de;uni-tuebingen.de;tue.ellis.eu", "position": "PhD student;PhD student;MS student;PhD student;Full Professor;Principal Researcher", "bibtex": "@inproceedings{\nwiedemer2024provable,\ntitle={Provable Compositional Generalization for Object-Centric Learning},\nauthor={Thadd{\\\"a}us Wiedemer and Jack Brady and Alexander Panfilov and Attila Juhos and Matthias Bethge and Wieland Brendel},\nbooktitle={The Twelfth International Conference on Learning 
Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=7VPTUWkiDQ}\n}", "github": "", "project": "", "reviewers": "KGuC;JA2G;wPGp", "pdf_size": 1564010, "rating": "6;8;8", "confidence": "3;4;3", "soundness": "2;4;3", "contribution": "2;3;3", "presentation": "3;4;4", "wc_summary": "173;92;202", "wc_strengths": "53;45;122", "wc_weaknesses": "117;38;89", "wc_questions": "3;84;19", "wc_review": "346;259;432", "wc_reply_reviewers": "0;42;19", "wc_reply_authors": "730;631;315", "reply_reviewers": "0;1;1", "reply_authors": "1;1;1", "rating_avg": [ 7.333333333333333, 0.9428090415820634 ], "confidence_avg": [ 3.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 3.0, 0.816496580927726 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 3.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 155.66666666666666, 46.549853800940014 ], "wc_strengths_avg": [ 73.33333333333333, 34.56716489515576 ], "wc_weaknesses_avg": [ 81.33333333333333, 32.70406023042943 ], "wc_questions_avg": [ 35.333333333333336, 35.02697373295171 ], "wc_review_avg": [ 345.6666666666667, 70.62734755193786 ], "wc_reply_reviewers_avg": [ 20.333333333333332, 17.172329163188344 ], "wc_reply_authors_avg": [ 558.6666666666666, 176.97520228049527 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.49999999999999983, "gs_citation": 23, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10657915378413188094&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=7VPTUWkiDQ", "pdf": "https://openreview.net/pdf?id=7VPTUWkiDQ", "email": "is.tuebingen.mpg.de;mpg.de;tuebingen.de;mpg.tuebingen.de;uni-tuebingen.de;tue.ellis.eu", "author_num": 6, "aff_unique_index": "0;1;2;3;2;4", "aff_unique_norm": "Max Planck Institute for Intelligent Systems;Max-Planck-Gesellschaft zur F\u00f6rderung der Wissenschaften e.V.;University of Tuebingen;Max-Planck Institute for Intelligent Systems;ELLIS Institute", "aff_unique_dep": "Intelligent Systems;;;;", "aff_unique_url": "https://www.mpi-is.mpg.de;https://www.mpg.de;https://www.uni-tuebingen.de/;https://www.mpi-is.mpg.de;https://ellis.eu/", "aff_unique_abbr": "MPI-IS;MPG;Uni T\u00fcbingen;MPI-IS;ELLIS", "aff_campus_unique_index": "1", "aff_campus_unique": ";T\u00fcbingen", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "Germany" }, { "id": "7VVGO0kuuY", "title": "Learning Causal Dynamics Models in Object-Oriented Environments", "track": "main", "status": "Reject", "tldr": "", "abstract": "Causal Dynamics Models (CDMs) have demonstrated significant potential in addressing various challenges in reinforcement learning. Recent studies have incorporated causal discovery to capture the causal dependencies among environmental variables in the learning of CDMs. However, the learning of CDMs is still confined to small-scale environments due to computational complexity and sample efficiency constraints. This paper aims to extend CDMs to large-scale object-oriented environments, which consist of a multitude of objects classified into different categories. We introduce the Object-Oriented CDM (OOCDM) that shares causalities and parameters among objects belonging to the same class. Furthermore, we propose a learning method for OOCDM that enables it to adapt to a varying number of objects. 
Experimental results from large-scale tasks indicate that OOCDM outperforms existing CDMs in terms of causal discovery, prediction accuracy, generalization, and computational efficiency.", "keywords": "reinforcement learning;causality;dynamics model", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/f993e5fe10e42ccfb63a0b4a23195036c43cc171.zip", "author": "Zhongwei Yu;Jingqing Ruan;Dengpeng Xing", "authorids": "~Zhongwei_Yu1;~Jingqing_Ruan1;~Dengpeng_Xing1", "gender": "M;F;M", "homepage": ";https://github.com/Amanda-1997/;https://people.ucas.edu.cn/~xingdengpeng?language=en", "dblp": "96/4996;304/3544;85/8134", "google_scholar": ";https://scholar.google.com/citations?hl=zh-CN;", "orcid": "0000-0003-3372-2256;0000-0002-4857-9053;", "linkedin": ";;", "or_profile": "~Zhongwei_Yu1;~Jingqing_Ruan1;~Dengpeng_Xing1", "aff": "Institute of Automation, Chinese Academy of Sciences;Institute of Automation, Chinese Academy of Sciences;Institute of Automation, Chinese Academy of Sciences", "aff_domain": "ia.ac.cn;ia.ac.cn;ia.ac.cn", "position": "MS student;PhD student;Associate Professor", "bibtex": "@misc{\nyu2024learning,\ntitle={Learning Causal Dynamics Models in Object-Oriented Environments},\nauthor={Zhongwei Yu and Jingqing Ruan and Dengpeng Xing},\nyear={2024},\nurl={https://openreview.net/forum?id=7VVGO0kuuY}\n}", "github": "", "project": "", "reviewers": "LMvE;miEU;dZfY;mQjQ;6VtU", "site": "https://openreview.net/forum?id=7VVGO0kuuY", "pdf_size": 1852025, "rating": "5;6;6;6;6", "confidence": "4;4;2;3;3", "soundness": "3;3;3;3;2", "contribution": "3;2;3;3;2", "presentation": "3;1;2;2;3", "wc_summary": "107;95;106;173;73", "wc_strengths": "74;76;122;118;67", "wc_weaknesses": "428;436;433;371;168", "wc_questions": "75;227;165;11;73", "wc_review": "684;834;826;673;381", "wc_reply_reviewers": "267;55;264;38;125", "wc_reply_authors": "2201;1279;1542;594;1268", "reply_reviewers": "3;2;3;1;1", "reply_authors": "5;3;5;2;3", "rating_avg": [ 5.8, 0.39999999999999997 ], "confidence_avg": [ 3.2, 0.7483314773547882 ], "soundness_avg": [ 2.8, 0.39999999999999997 ], "contribution_avg": [ 2.6, 0.4898979485566356 ], "presentation_avg": [ 2.2, 0.7483314773547882 ], "wc_summary_avg": [ 110.8, 33.420951512486894 ], "wc_strengths_avg": [ 91.4, 23.5762592452662 ], "wc_weaknesses_avg": [ 367.2, 102.42538747790998 ], "wc_questions_avg": [ 110.2, 76.30045871421744 ], "wc_review_avg": [ 679.6, 164.01048746955175 ], "wc_reply_reviewers_avg": [ 149.8, 98.87244307692615 ], "wc_reply_authors_avg": [ 1376.8, 517.8368082707138 ], "reply_reviewers_avg": [ 2.0, 0.8944271909999159 ], "reply_authors_avg": [ 3.6, 1.2 ], "replies_avg": [ 37, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.5345224838248488, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=17002781624394995765&as_sdt=80005&sciodt=0,11&hl=en", "gs_version_total": 7, "aff_unique_index": "0;0;0", "aff_unique_norm": "Chinese Academy of Sciences", "aff_unique_dep": "Institute of Automation", "aff_unique_url": "http://www.ia.cas.cn", "aff_unique_abbr": "CAS", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "China" }, { "title": "Human Feedback is not Gold Standard", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19356", "id": "7W3GLNImfS", "author_site": "Tom Hosking, Phil Blunsom, Max Bartolo", "tldr": "", "abstract": "Human feedback has become the de facto standard for evaluating the performance of 
Large Language Models, and is increasingly being used as a training objective. However, it is not clear which properties of a generated output this single `preference' score captures. We hypothesise that preference scores are subjective and open to undesirable biases. We critically analyse the use of human feedback for both training and evaluation, to verify whether it fully captures a range of crucial error criteria. We find that while preference scores have fairly good coverage, they under-represent important aspects like factuality. We further hypothesise that both preference scores and error annotation may be affected by confounders, and leverage instruction-tuned models to generate outputs that vary along two possible confounding dimensions: assertiveness and complexity. We find that the assertiveness of an output skews the perceived rate of factuality errors, indicating that human annotations are not a fully reliable evaluation metric or training objective. Finally, we offer preliminary evidence that using human feedback as a training objective disproportionately increases the assertiveness of model outputs. We encourage future work to carefully consider whether preference scores are well aligned with the desired objective.", "keywords": "human evaluation;large language models;evaluation;natural language generation", "primary_area": "generative models", "supplementary_material": "", "author": "Tom Hosking;Phil Blunsom;Max Bartolo", "authorids": "~Tom_Hosking1;~Phil_Blunsom1;~Max_Bartolo1", "gender": ";;", "homepage": ";;https://maxbartolo.com", "dblp": ";96/4705;227/3290", "google_scholar": ";https://scholar.google.co.uk/citations?user=eJwbbXEAAAAJ;jPSWYn4AAAAJ", "orcid": ";;0009-0007-3301-7895", "linkedin": ";;maxbartolo/", "or_profile": "~Tom_Hosking1;~Phil_Blunsom1;~Max_Bartolo1", "aff": ";Department of Computer Science, University of Oxford;University College London", "aff_domain": ";cs.ox.ac.uk;ucl.ac.uk", "position": ";Associate Professor;PhD student", "bibtex": "@inproceedings{\nhosking2024human,\ntitle={Human Feedback is not Gold Standard},\nauthor={Tom Hosking and Phil Blunsom and Max Bartolo},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=7W3GLNImfS}\n}", "github": "", "project": "", "reviewers": "Rbzk;iLy7;knEY;mWEt", "pdf_size": 402977, "rating": "6;6;6;8", "confidence": "3;4;4;3", "soundness": "3;3;3;4", "contribution": "2;3;3;3", "presentation": "3;3;3;3", "wc_summary": "140;91;433;224", "wc_strengths": "72;53;168;111", "wc_weaknesses": "111;515;198;417", "wc_questions": "37;139;5;73", "wc_review": "360;798;804;825", "wc_reply_reviewers": "91;169;0;218", "wc_reply_authors": "517;1257;526;747", "reply_reviewers": "1;1;0;1", "reply_authors": "2;3;1;1", "rating_avg": [ 6.5, 0.8660254037844386 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 222.0, 130.77652694577876 ], "wc_strengths_avg": [ 101.0, 43.971581731841304 ], "wc_weaknesses_avg": [ 310.25, 162.4951922365705 ], "wc_questions_avg": [ 63.5, 49.78704650810289 ], "wc_review_avg": [ 696.75, 194.68098905645616 ], "wc_reply_reviewers_avg": [ 119.5, 82.53029746705145 ], "wc_reply_authors_avg": [ 761.75, 300.40420686135536 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 1.75, 0.82915619758885 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 
-0.5773502691896257, "gs_citation": 43, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=9519322896122389978&as_sdt=5,47&sciodt=0,47&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=7W3GLNImfS", "pdf": "https://openreview.net/pdf?id=7W3GLNImfS", "email": ";cs.ox.ac.uk;ucl.ac.uk", "author_num": 3, "aff_unique_index": "0;1", "aff_unique_norm": "University of Oxford;University College London", "aff_unique_dep": "Department of Computer Science;", "aff_unique_url": "https://www.ox.ac.uk;https://www.ucl.ac.uk", "aff_unique_abbr": "Oxford;UCL", "aff_campus_unique_index": "0", "aff_campus_unique": "Oxford;", "aff_country_unique_index": "0;0", "aff_country_unique": "United Kingdom" }, { "id": "7W4boWjb3Q", "title": "Partitioned-Learned Count-Min Sketch", "track": "main", "status": "Reject", "tldr": "", "abstract": "We propose Partitioned Learned Count-Min Sketch (PL-CMS), a new approach to learning augmented frequent item identification in data streams. Our method builds on the learned Count-Min Sketch (LCMS) algorithm of Hsu et al. (ICLR 2019), which combines a standard Count-Min Sketch frequency estimation data structure with a learned model, by partitioning items in the input stream into two sets. Items with sufficiently high predicted frequencies have their frequencies tracked exactly, while the remaining items, with low predicted frequencies, are placed into the Count-Min Sketch data structure. \n \nInspired by an approach of Vaidya et al. for learning augmented Bloom filters (ICLR 2021), our PL-CMS algorithm partitions items into different sets, based on multiple predicted frequency thresholds. Each set is handled by a separate Count-Min Sketch data structure. Unlike classic LCMS, this allows the algorithm to take advantage of the full prediction space of the learned model. We demonstrate that, given fixed partitioning thresholds, the parameters of our data structure can be efficiently optimized using a convex program. 
Empirically, we show that, on a variety of benchmarks, PL-CMS obtains a lower false positive rate for frequent item identification as compared to LCMS and standard Count-Min Sketch.", "keywords": "count-min sketch;heavy hitters;frequent items;learning augmented algorithms;streaming algorithms", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Thuy Trang Nguyen;Cameron N Musco", "authorids": "~Thuy_Trang_Nguyen1;~Cameron_N_Musco1", "gender": "F;M", "homepage": ";https://people.cs.umass.edu/~cmusco/", "dblp": ";149/2327", "google_scholar": "dmFU5vcAAAAJ;EeYGZCwAAAAJ", "orcid": ";", "linkedin": "thuytrang--nguyen/;", "or_profile": "~Thuy_Trang_Nguyen1;~Cameron_N_Musco1", "aff": "University of Massachusetts at Amherst;University of Massachusetts, Amherst", "aff_domain": "umass.edu;umass.edu", "position": "PhD student;Assistant Professor", "bibtex": "@misc{\nnguyen2024partitionedlearned,\ntitle={Partitioned-Learned Count-Min Sketch},\nauthor={Thuy Trang Nguyen and Cameron N Musco},\nyear={2024},\nurl={https://openreview.net/forum?id=7W4boWjb3Q}\n}", "github": "", "project": "", "reviewers": "C7mx;jB1e;4TXw;PmnJ", "site": "https://openreview.net/forum?id=7W4boWjb3Q", "pdf_size": 1331632, "rating": "5;5;6;6", "confidence": "4;4;3;4", "soundness": "2;3;3;3", "contribution": "2;2;2;2", "presentation": "3;3;3;4", "wc_summary": "113;161;55;116", "wc_strengths": "70;55;61;48", "wc_weaknesses": "118;121;124;102", "wc_questions": "227;111;2;77", "wc_review": "528;448;242;343", "wc_reply_reviewers": "0;125;59;0", "wc_reply_authors": "829;746;911;646", "reply_reviewers": "0;1;2;0", "reply_authors": "1;1;3;1", "rating_avg": [ 5.5, 0.5 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 111.25, 37.632266740126084 ], "wc_strengths_avg": [ 58.5, 8.077747210701755 ], "wc_weaknesses_avg": [ 116.25, 8.496322733983215 ], "wc_questions_avg": [ 104.25, 81.102943842995 ], "wc_review_avg": [ 390.25, 107.84334703633785 ], "wc_reply_reviewers_avg": [ 46.0, 51.58003489723519 ], "wc_reply_authors_avg": [ 783.0, 98.28275535413117 ], "reply_reviewers_avg": [ 0.75, 0.82915619758885 ], "reply_authors_avg": [ 1.5, 0.8660254037844386 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:Jb3gORY006sJ:scholar.google.com/&scioq=Partitioned-Learned+Count-Min+Sketch&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "University of Massachusetts Amherst", "aff_unique_dep": "", "aff_unique_url": "https://www.umass.edu", "aff_unique_abbr": "UMass Amherst", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Amherst", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "id": "7W4rbphLht", "title": "A Semi-smooth, Self-shifting, and Singular Newton Method for Sparse Optimal Transport", "track": "main", "status": "Reject", "tldr": "", "abstract": "Newton's method is an important second-order optimization algorithm that has been extensively studied. However, many challenging optimization problems break the classical assumptions of Newton's method. For example, the objective function may not be twice differentiable, and the optimal solution may be non-unique. 
In this article, we propose a general Newton-type algorithm named S5N, to solve problems that have possibly non-differentiable gradients and non-isolated solutions, a setting highly motivated by the sparse optimal transport problem. Compared with existing Newton-type approaches, the proposed S5N algorithm has broad applicability, does not require hyperparameter tuning, and possesses rigorous global and local convergence guarantees. Extensive numerical experiments show that on sparse optimal transport problems, S5N gains superior performance on convergence speed and computational efficiency.", "keywords": "Newton's method;semi-smooth function;non-isolated solution;global convergence;quadratic convergence;optimal transport", "primary_area": "optimization", "supplementary_material": "", "author": "Zihao Tang;Yixuan Qiu", "authorids": "~Zihao_Tang3;~Yixuan_Qiu1", "gender": "M;", "homepage": "https://github.com/TangZihao1997;https://statr.me", "dblp": "176/5858-1.html;209/7159", "google_scholar": "https://scholar.google.com/citations?hl=zh-CN;", "orcid": "0009-0008-4716-8616;", "linkedin": ";", "or_profile": "~Zihao_Tang3;~Yixuan_Qiu1", "aff": "Shanghai University of Finance and Economics;Shanghai University of Finance and Economics", "aff_domain": "sufe.edu;sufe.edu.cn", "position": "PhD student;Associate Professor", "bibtex": "@misc{\ntang2024a,\ntitle={A Semi-smooth, Self-shifting, and Singular Newton Method for Sparse Optimal Transport},\nauthor={Zihao Tang and Yixuan Qiu},\nyear={2024},\nurl={https://openreview.net/forum?id=7W4rbphLht}\n}", "github": "", "project": "", "reviewers": "h4ty;tikC;35vU;7Z3B;cPiV", "site": "https://openreview.net/forum?id=7W4rbphLht", "pdf_size": 3257542, "rating": "3;3;6;6;6", "confidence": "3;4;2;2;3", "soundness": "1;2;3;3;2", "contribution": "2;2;3;3;3", "presentation": "2;2;3;3;2", "wc_summary": "51;63;79;32;75", "wc_strengths": "9;30;125;42;45", "wc_weaknesses": "271;404;66;73;124", "wc_questions": "2;125;3;43;1", "wc_review": "333;622;273;190;245", "wc_reply_reviewers": "89;799;14;0;24", "wc_reply_authors": "690;1806;408;360;355", "reply_reviewers": "1;2;1;0;2", "reply_authors": "2;5;2;1;3", "rating_avg": [ 4.8, 1.469693845669907 ], "confidence_avg": [ 2.8, 0.7483314773547882 ], "soundness_avg": [ 2.2, 0.7483314773547882 ], "contribution_avg": [ 2.6, 0.4898979485566356 ], "presentation_avg": [ 2.4, 0.4898979485566356 ], "wc_summary_avg": [ 60.0, 17.08800749063506 ], "wc_strengths_avg": [ 50.2, 39.48366750949055 ], "wc_weaknesses_avg": [ 187.6, 130.9573976528245 ], "wc_questions_avg": [ 34.8, 47.817988247102164 ], "wc_review_avg": [ 332.6, 151.86388642465332 ], "wc_reply_reviewers_avg": [ 185.2, 308.4149153332244 ], "wc_reply_authors_avg": [ 723.8, 555.0482501548852 ], "reply_reviewers_avg": [ 1.2, 0.7483314773547883 ], "reply_authors_avg": [ 2.6, 1.3564659966250538 ], "replies_avg": [ 29, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.7637626158259733, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:lwxVI53t-2AJ:scholar.google.com/&scioq=A+Semi-smooth,+Self-shifting,+and+Singular+Newton+Method+for+Sparse+Optimal+Transport&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "Shanghai University of Finance and Economics", "aff_unique_dep": "", "aff_unique_url": "http://www.sufe.edu.cn", "aff_unique_abbr": "SUFE", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "China" }, { "id": "7W9zRGhLq7", "title": "A New 
Theoretical Perspective on Data Heterogeneity in Federated Averaging", "track": "main", "status": "Reject", "tldr": "", "abstract": "In federated learning, data heterogeneity is the main reason that existing theoretical analyses are pessimistic about the convergence error caused by local updates. However, empirical studies have shown that more local updates can improve the convergence rate and reduce the communication cost when data are heterogeneous. This paper aims to bridge this gap between the theoretical understanding and the practical performance by providing a theoretical analysis for federated averaging (FedAvg) with non-convex objective functions from a new perspective on data heterogeneity. Identifying the limitations in the commonly used assumption of bounded gradient divergence, we propose a new assumption, termed the heterogeneity-driven Lipschitz assumption, which characterizes the fundamental effect of data heterogeneity on local updates. In the convergence analysis, we use the heterogeneity-driven Lipschitz constant and the global Lipschitz constant to substitute the widely used local Lipschitz constant and we show that our assumptions are weaker than those used in the literature. Based on the new assumption, we derive novel convergence bounds for both full participation and partial participation, which are tighter compared to the state-of-the-art analysis of FedAvg. This result can also imply that more local updates can improve the convergence rate even when data are highly heterogeneous. Further, we discuss the insights behind the proposed heterogeneity-driven Lipschitz assumption, by which we identify a region where FedAvg (also known as local SGD) can outperform mini-batch SGD even when the gradient divergence is arbitrarily large.", "keywords": "Federated Learning;Data Heterogeneity;Theoretical Analysis", "primary_area": "optimization", "supplementary_material": "/attachment/db647562ac0cb088ebafd8f91e572dc2f56b6ae2.zip", "author": "Jiayi Wang;Shiqiang Wang;Rong-Rong Chen;Mingyue Ji", "authorids": "~Jiayi_Wang4;~Shiqiang_Wang1;~Rong-Rong_Chen1;~Mingyue_Ji1", "gender": "F;M;;M", "homepage": ";https://shiqiang.wang;;https://mingyueji.ece.ufl.edu/", "dblp": ";87/5094-1;;", "google_scholar": "https://scholar.google.com/citations?view_op=list_works;kA_vmOcAAAAJ;G2pEqUQAAAAJ;rWLfxVgAAAAJ", "orcid": ";;;", "linkedin": ";;;", "or_profile": "~Jiayi_Wang4;~Shiqiang_Wang1;~Rong-Rong_Chen1;~Mingyue_Ji1", "aff": "Oak Ridge National Laboratory;IBM, International Business Machines;University of Utah;University of Florida", "aff_domain": "ornl.gov;us.ibm.com;utah.edu;ufl.edu", "position": "Postdoc;Research Staff Member;Associate Professor;Associate Professor", "bibtex": "@misc{\nwang2024a,\ntitle={A New Theoretical Perspective on Data Heterogeneity in Federated Averaging},\nauthor={Jiayi Wang and Shiqiang Wang and Rong-Rong Chen and Mingyue Ji},\nyear={2024},\nurl={https://openreview.net/forum?id=7W9zRGhLq7}\n}", "github": "", "project": "", "reviewers": "NMhc;wiji;RuXa;ziE8", "site": "https://openreview.net/forum?id=7W9zRGhLq7", "pdf_size": 1682092, "rating": "3;5;5;6", "confidence": "3;4;3;3", "soundness": "2;2;3;3", "contribution": "2;2;2;2", "presentation": "3;3;3;2", "wc_summary": "58;172;122;65", "wc_strengths": "65;154;108;69", "wc_weaknesses": "268;291;297;189", "wc_questions": "4;2;26;105", "wc_review": "395;619;553;428", "wc_reply_reviewers": "152;0;115;47", "wc_reply_authors": "2346;725;1064;1171", "reply_reviewers": "1;0;1;1", "reply_authors": "5;1;2;3", "rating_avg": [ 
4.75, 1.0897247358851685 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 104.25, 46.32696299132936 ], "wc_strengths_avg": [ 99.0, 35.92352989337211 ], "wc_weaknesses_avg": [ 261.25, 43.09509832916036 ], "wc_questions_avg": [ 34.25, 41.91882035553959 ], "wc_review_avg": [ 498.75, 91.06693966528138 ], "wc_reply_reviewers_avg": [ 78.5, 58.92580080066795 ], "wc_reply_authors_avg": [ 1326.5, 611.2014806919237 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 2.75, 1.479019945774904 ], "replies_avg": [ 21, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.13245323570650439, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:JKimkEaRFksJ:scholar.google.com/&scioq=A+New+Theoretical+Perspective+on+Data+Heterogeneity+in+Federated+Averaging&hl=en&as_sdt=0,5", "gs_version_total": 2, "aff_unique_index": "0;1;2;3", "aff_unique_norm": "Oak Ridge National Laboratory;International Business Machines;University of Utah;University of Florida", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.ornl.gov;https://www.ibm.com;https://www.utah.edu;https://www.ufl.edu", "aff_unique_abbr": "ORNL;IBM;Utah;UF", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "title": "You Only Query Once: An Efficient Label-Only Membership Inference Attack", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19355", "id": "7WsivwyHrS", "author_site": "Yutong Wu, Han Qiu, Shangwei Guo, Jiwei Li, Tianwei Zhang", "tldr": "", "abstract": "As one of the privacy threats to machine learning models, the membership inference attack (MIA) tries to infer whether a given sample is in the original training set of a victim model by analyzing its outputs. Recent studies only use the predicted hard labels to achieve impressive membership inference accuracy. However, such a label-only MIA approach requires very high query budgets to evaluate the distance of the target sample from the victim model's decision boundary. \n We propose YOQO, a novel label-only attack to overcome the above limitation. YOQO aims at identifying a special area (called improvement area) around the target sample and crafting a query sample, whose hard label from the victim model can reliably reflect the target sample's membership. YOQO can successfully reduce the query budget from more than 1,000 times to only ONCE. 
Experiments demonstrate that YOQO is not only as effective as SOTA attack methods, but also performs comparably or even more robustly against many sophisticated defenses.", "keywords": "Machine learning;Membership Inference Attack;Computer Vision", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/9c3699b4de96d41735ae13a134b7dcc950cec14c.zip", "author": "YUTONG WU;Han Qiu;Shangwei Guo;Jiwei Li;Tianwei Zhang", "authorids": "~YUTONG_WU3;~Han_Qiu3;~Shangwei_Guo1;~Jiwei_Li1;~Tianwei_Zhang1", "gender": "M;M;M;M;M", "homepage": ";https://qiuhan.info;http://www.cs.cqu.edu.cn/info/1332/5290.htm;https://nlp.stanford.edu/~bdlijiwei/;https://personal.ntu.edu.sg/tianwei.zhang/index.html", "dblp": ";15/4507-1;176/6479;73/5746-1;77/7902-4", "google_scholar": "https://scholar.google.com/citations?view_op=list_works;https://scholar.google.fr/citations?user=6JWNv6gAAAAJ;wQrVkBYAAAAJ;PwU16JEAAAAJ;9vpiYDIAAAAJ", "orcid": ";;;;", "linkedin": ";;;;", "or_profile": "~YUTONG_WU3;~Han_Qiu3;~Shangwei_Guo1;~Jiwei_Li1;~Tianwei_Zhang1", "aff": "National Technological University;Tsinghua University;Chongqing University;Zhejiang University;Nanyang Technological University", "aff_domain": "ntu.edu;tsinghua.edu.cn;cqu.edu.cn;zju.edu.cn;ntu.edu.sg", "position": "PhD student;Assistant Professor;Associate Professor;Assistant Professor;Assistant Professor", "bibtex": "@inproceedings{\nwu2024you,\ntitle={You Only Query Once: An Efficient Label-Only Membership Inference Attack},\nauthor={YUTONG WU and Han Qiu and Shangwei Guo and Jiwei Li and Tianwei Zhang},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=7WsivwyHrS}\n}", "github": "", "project": "", "reviewers": "1W2d;bo89;1cwK", "pdf_size": 426882, "rating": "6;6;8", "confidence": "3;4;4", "soundness": "3;2;3", "contribution": "2;3;3", "presentation": "3;3;3", "wc_summary": "72;119;100", "wc_strengths": "66;36;50", "wc_weaknesses": "91;29;77", "wc_questions": "63;262;347", "wc_review": "292;446;574", "wc_reply_reviewers": "43;258;19", "wc_reply_authors": "705;1874;773", "reply_reviewers": "1;1;1", "reply_authors": "2;4;2", "rating_avg": [ 6.666666666666667, 0.9428090415820634 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 97.0, 19.30457631409368 ], "wc_strengths_avg": [ 50.666666666666664, 12.256517540566822 ], "wc_weaknesses_avg": [ 65.66666666666667, 26.5497436689865 ], "wc_questions_avg": [ 224.0, 119.01540516532583 ], "wc_review_avg": [ 437.3333333333333, 115.289008823719 ], "wc_reply_reviewers_avg": [ 106.66666666666667, 107.45645112737014 ], "wc_reply_authors_avg": [ 1117.3333333333333, 535.7638368618108 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 2.6666666666666665, 0.9428090415820634 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.49999999999999983, "gs_citation": 7, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=16365776509541219820&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=7WsivwyHrS", "pdf": "https://openreview.net/pdf?id=7WsivwyHrS", "email": "ntu.edu;tsinghua.edu.cn;cqu.edu.cn;zju.edu.cn;ntu.edu.sg", "author_num": 5, "aff_unique_index": "0;1;2;3;4", "aff_unique_norm": "National Technological 
University;Tsinghua University;Chongqing University;Zhejiang University;Nanyang Technological University", "aff_unique_dep": ";;;;", "aff_unique_url": "https://www.ntu.edu;https://www.tsinghua.edu.cn;https://www.cqu.edu.cn;https://www.zju.edu.cn;https://www.ntu.edu.sg", "aff_unique_abbr": "NTU;THU;CQU;ZJU;NTU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;1;1;2", "aff_country_unique": "United States;China;Singapore" }, { "id": "7XXineVQeU", "title": "Faster Maximum Inner Product Search in High Dimensions", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Maximum Inner Product Search (MIPS) is a ubiquitous task in machine learning applications such as recommendation systems. \nGiven a query vector and $n$ atom vectors in $d$-dimensional space, the goal of MIPS is to find the atom that has the highest inner product with the query vector. \nExisting MIPS algorithms scale at least as $O(\\sqrt{d})$, which becomes computationally prohibitive in high-dimensional settings. In this work, we present BanditMIPS, a novel randomized MIPS algorithm whose complexity is independent of $d$. \nBanditMIPS estimates the inner product for each atom by subsampling coordinates and adaptively evaluates more coordinates for more promising atoms. The specific adaptive sampling strategy is motivated by multi-armed bandits. We provide theoretical guarantees that BanditMIPS returns the correct answer with high probability, while improving the complexity in $d$ from $O(\\sqrt{d})$ to $O(1)$. We also perform experiments on four synthetic and real-world datasets and demonstrate that BanditMIPS outperforms prior state-of-the-art algorithms. \nFor example, in the Movie Lens dataset ($n$=4,000, $d$=6,000), BanditMIPS is 20$\\times$ faster than the next best algorithm while returning the same answer. BanditMIPS requires no preprocessing of the data and includes a hyperparameter that practitioners may use to trade off accuracy and runtime.\nWe also propose a variant of our algorithm, named BanditMIPS-$\\alpha$, which achieves further speedups by employing non-uniform sampling across coordinates. 
\nFinally, we demonstrate how known preprocessing techniques can be used to further accelerate BanditMIPS, and discuss applications to Matching Pursuit and Fourier analysis.", "keywords": "multi-armed bandits;maximum inner product search;MIPS;best-arm identification", "primary_area": "probabilistic methods (Bayesian methods, variational inference, sampling, UQ, etc.)", "supplementary_material": "/attachment/a99288def3c9d0cd2f8686fe3d79b6b9e29a71f2.pdf", "author": "Mo Tiwari;Ryan Kang;Donghyun Lee;Jaeyong Lee;Sebastian Thrun;Christopher J Piech;Ilan Shomorony;Martin Jinye Zhang", "authorids": "~Mo_Tiwari1;~Ryan_Kang1;~Donghyun_Lee2;~Jaeyong_Lee1;~Sebastian_Thrun1;~Christopher_J_Piech1;~Ilan_Shomorony1;~Martin_Jinye_Zhang1", "gender": ";M;M;M;M;M;M;M", "homepage": "http://www.motiwari.com/;;;https://kr.linkedin.com/in/jeyong-lee-6a7838190;http://robot.cc;;http://www.ilanshomorony.com;https://mzhanglab.github.io/", "dblp": "267/5421;https://dblp.org/rec/conf/nips/TiwariKLPSTZ22.html;298/4489;336/2490;t/SebastianThrun;35/10987.html;31/9223;184/9278", "google_scholar": "https://scholar.google.com/citations?hl=en;;https://scholar.google.com/citations?hl=en;;;;fMAg4zEAAAAJ;zjr6n-QAAAAJ", "orcid": ";;;;;;;0000-0003-0006-2466", "linkedin": "motiwari;ryan-kang-554819221/;donghyun-lee-aa789422a;;sebastian-thrun-59a0b273/;;;", "or_profile": "~Mo_Tiwari1;~Ryan_Kang1;~Donghyun_Lee2;~Jaeyong_Lee1;~Sebastian_Thrun1;~Christopher_J_Piech1;~Ilan_Shomorony1;~Martin_J._Zhang1", "aff": "OpenAI;Stanford University;University College London, University of London;University of Oxford;;;University of Illinois, Urbana Champaign;Carnegie Mellon University", "aff_domain": "openai.com;stanford.edu;ucl.ac.uk;oxford.ac.uk;;;illinois.edu;andrew.cmu.edu", "position": "Member of Technical Staff;MS student;MS student;Undergrad student;;;Assistant Professor;Assistant Professor", "bibtex": "@misc{\ntiwari2024faster,\ntitle={Faster Maximum Inner Product Search in High Dimensions},\nauthor={Mo Tiwari and Ryan Kang and Donghyun Lee and Jaeyong Lee and Sebastian Thrun and Christopher J Piech and Ilan Shomorony and Martin Jinye Zhang},\nyear={2024},\nurl={https://openreview.net/forum?id=7XXineVQeU}\n}", "github": "", "project": "", "reviewers": "CJG9;hfLb;tsE3;FGUA", "site": "https://openreview.net/forum?id=7XXineVQeU", "pdf_size": 2650778, "rating": "1;1;3;3", "confidence": "4;5;3;3", "soundness": "1;3;2;2", "contribution": "1;1;3;2", "presentation": "1;3;2;2", "wc_summary": "77;225;44;73", "wc_strengths": "3;1;32;29", "wc_weaknesses": "3;147;46;160", "wc_questions": "3;6;47;6", "wc_review": "86;379;169;268", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 2.0, 1.0 ], "confidence_avg": [ 3.75, 0.82915619758885 ], "soundness_avg": [ 2.0, 0.7071067811865476 ], "contribution_avg": [ 1.75, 0.82915619758885 ], "presentation_avg": [ 2.0, 0.7071067811865476 ], "wc_summary_avg": [ 104.75, 70.5846123457514 ], "wc_strengths_avg": [ 16.25, 14.306903927824496 ], "wc_weaknesses_avg": [ 89.0, 66.42665127793211 ], "wc_questions_avg": [ 15.5, 18.227726133558185 ], "wc_review_avg": [ 225.5, 109.56847174255923 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": -0.9045340337332909, "gs_citation": 5, "gs_cited_by_link": 
"https://scholar.google.com/scholar?cites=12912019336735211116&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 9, "aff_unique_index": "0;1;2;3;4;5", "aff_unique_norm": "OpenAI;Stanford University;University College London;University of Oxford;University of Illinois Urbana-Champaign;Carnegie Mellon University", "aff_unique_dep": ";;;;;", "aff_unique_url": "https://openai.com;https://www.stanford.edu;https://www.ucl.ac.uk;https://www.ox.ac.uk;https://illinois.edu;https://www.cmu.edu", "aff_unique_abbr": "OpenAI;Stanford;UCL;Oxford;UIUC;CMU", "aff_campus_unique_index": "1;2", "aff_campus_unique": ";Stanford;Urbana-Champaign", "aff_country_unique_index": "0;0;1;1;0;0", "aff_country_unique": "United States;United Kingdom" }, { "id": "7YEXo5qUmN", "title": "Organ-DETR: 3D Organ Detection Transfomer with Multiscale Attention and Dense Query Matching", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Query-based Transformers have been yielding impressive results in object detection. The potential of DETR-like methods for 3D data, especially in volumetric medical imaging, remains largely unexplored. This study presents Organ-DETR that contains two novel modules, MultiScale Attention (MSA) and Dense Query Matching (DQM), for boosting the performance of DEtection TRansformers (DETRs) for 3D organ detection. MSA introduces a novel top-down representation learning approach for efficient encoding of 3D visual data. \nMSA has a multiscale attention architecture that leverages dual self-attention and cross-attention mechanisms to provide the most relevant features for DETRs. It aims to employ long- and short-range spatial interactions in the attention mechanism, leveraging the self-attention module. Organ-DETR also introduces DQM, an approach for one-to-many matching that tackles the difficulties in detecting organs.\nDQM increases positive queries for enhancing both recall scores and training efficiency without the need for additional learnable parameters. \nExtensive results on five 3D Computed Tomography (CT) datasets indicate that the proposed Organ-DETR outperforms comparable techniques by achieving a remarkable improvement of +10.6 mAP COCO and +10.2 mAR COCO. 
\nCode and pre-trained models are available at \\url{https://---}.", "keywords": "Organ Detection;Representation Learning;DEtection TRansformer (DETR);Attention;Transformer;One-to-Many Matching;One-to-One Matching;Segmentation", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/f62c032dcfe3094c85c0aac53ae9816f7df501a3.zip", "author": "MORTEZA GHAHREMANI;Benjamin Raphael Ernhofer;Jiajun Wang;Christian Wachinger", "authorids": "~MORTEZA_GHAHREMANI3;~Benjamin_Raphael_Ernhofer1;~Jiajun_Wang2;~Christian_Wachinger1", "gender": "M;;M;M", "homepage": "https://mogvision.github.io/;;;https://ai-med.de/people/christian-wachinger/", "dblp": "152/6299;;;79/5985", "google_scholar": "yhXUlXsAAAAJ;;;https://scholar.google.de/citations?user=UOIBNdUAAAAJ", "orcid": "0000-0001-6423-6475;0009-0007-4189-9576;;0000-0002-3652-1874", "linkedin": "morteza-ghahremani-3a040421a/;;jiajun-wang-a82725251/;", "or_profile": "~MORTEZA_GHAHREMANI3;~Benjamin_Raphael_Ernhofer1;~Jiajun_Wang2;~Christian_Wachinger1", "aff": "Technische Universit\u00e4t M\u00fcnchen;;Technische Universit\u00e4t M\u00fcnchen;Technische Universit\u00e4t M\u00fcnchen", "aff_domain": "tum.de;;tum.de;tum.de", "position": "AI Scientist;;MS student;Professor", "bibtex": "@misc{\nanonymous2024organdetr,\ntitle={Organ-{DETR}: 3D Organ Detection Transformer with Multiscale Attention and Dense Query Matching},\nauthor={Anonymous},\nyear={2024},\nurl={https://openreview.net/forum?id=7YEXo5qUmN}\n}", "github": "", "project": "", "reviewers": "nhJL;2UmR;xGvm", "site": "https://openreview.net/forum?id=7YEXo5qUmN", "pdf_size": 1212160, "rating": "3;3;8", "confidence": "5;5;5", "soundness": "2;2;4", "contribution": "2;1;3", "presentation": "2;3;4", "wc_summary": "89;42;71", "wc_strengths": "43;39;18", "wc_weaknesses": "95;220;88", "wc_questions": "3;50;4", "wc_review": "230;351;181", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "517;632;150", "reply_reviewers": "0;0;0", "reply_authors": "1;1;1", "rating_avg": [ 4.666666666666667, 2.357022603955158 ], "confidence_avg": [ 5.0, 0.0 ], "soundness_avg": [ 2.6666666666666665, 0.9428090415820634 ], "contribution_avg": [ 2.0, 0.816496580927726 ], "presentation_avg": [ 3.0, 0.816496580927726 ], "wc_summary_avg": [ 67.33333333333333, 19.362047641943477 ], "wc_strengths_avg": [ 33.333333333333336, 10.96458946893235 ], "wc_weaknesses_avg": [ 134.33333333333334, 60.642852468824024 ], "wc_questions_avg": [ 19.0, 21.924111536540465 ], "wc_review_avg": [ 254.0, 71.44695001654492 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 433.0, 205.54480452365286 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 9, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:dEyQpfH8J8wJ:scholar.google.com/&scioq=Organ-DETR:+3D+Organ+Detection+Transfomer+with+Multiscale+Attention+and+Dense+Query+Matching&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;0;0", "aff_unique_norm": "Technische Universit\u00e4t M\u00fcnchen", "aff_unique_dep": "", "aff_unique_url": "https://www.tum.de", "aff_unique_abbr": "TUM", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "Germany" }, { "id": "7Yg5eylBHe", "title": "ZGS-Based Event-Driven Algorithms for Bayesian Optimization in Fully Distributed Multi-Agent Systems", "track": "main", 
"status": "Reject", "tldr": "", "abstract": "Bayesian optimization (BO) is a well-established framework for globally optimizing expensive-to-evaluate black-box functions with impressive efficiency. Although numerous BO algorithms have been developed for the centralized machine learning setting and some recent works have extended BO to the tree-structured federated learning, no previous studies have investigated BO within a fully distributed multi-agent system (MAS) in the field of distributed learning (DL). Addressing this gap, we introduce and investigate a novel paradigm, Distributed Bayesian Optimization (DBO), in which agents cooperatively optimize the same costly-to-evaluate black-box objectives. An innovative generalized algorithm, Zero-Gradient-Sum-Based Event-Driven Distributed Lower Confidence Bound (ZGS-ED-DLCB), is proposed to overcome the significant challenges of DBO and DL: We (a) adopt a surrogate model based on random Fourier features as an approximate alternative to a typical Gaussian process to enable the exchange of local knowledge between neighboring agents, and (b) employ the event-driven mechanism to enhance communication efficiency in MASs. Moreover, we propose a novel generalized fully distributed convergence theorem, which represents a substantial theoretical and practical breakthrough wrt the ZGS-based DL. The performance of our proposed algorithm has been rigorously evaluated through theoretical analysis and extensive experiments, demonstrating substantial advantages over the state-of-the-art baselines.", "keywords": "distributed machine learning;Bayesian optimization;multi-agent systems;zero-gradient-sum optimization;event-driven mechanism", "primary_area": "optimization", "supplementary_material": "/attachment/2c4857962fdfc2176867928f2585de383fdd66a9.zip", "author": "Pengfei Ren;Cheng-zhong Xu", "authorids": "~Pengfei_Ren5;~Cheng-zhong_Xu1", "gender": ";", "homepage": ";", "dblp": ";", "google_scholar": ";", "orcid": ";", "linkedin": ";", "or_profile": ";", "aff": ";", "aff_domain": ";", "position": ";", "bibtex": "@misc{\nren2024zgsbased,\ntitle={{ZGS}-Based Event-Driven Algorithms for Bayesian Optimization in Fully Distributed Multi-Agent Systems},\nauthor={Pengfei Ren and Cheng-zhong Xu},\nyear={2024},\nurl={https://openreview.net/forum?id=7Yg5eylBHe}\n}", "github": "", "project": "", "reviewers": "BqAx;ugDi;N4Gg;EeJ5", "site": "https://openreview.net/forum?id=7Yg5eylBHe", "pdf_size": 488705, "rating": "1;3;3;6", "confidence": "3;4;4;2", "soundness": "1;2;2;3", "contribution": "2;2;2;3", "presentation": "1;1;1;2", "wc_summary": "102;91;40;67", "wc_strengths": "54;18;20;35", "wc_weaknesses": "724;192;374;36", "wc_questions": "10;2;9;2", "wc_review": "890;303;443;140", "wc_reply_reviewers": "155;0;0;0", "wc_reply_authors": "996;353;763;129", "reply_reviewers": "1;0;0;0", "reply_authors": "2;1;1;1", "rating_avg": [ 3.25, 1.7853571071357126 ], "confidence_avg": [ 3.25, 0.82915619758885 ], "soundness_avg": [ 2.0, 0.7071067811865476 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 1.25, 0.4330127018922193 ], "wc_summary_avg": [ 75.0, 23.843238035132728 ], "wc_strengths_avg": [ 31.75, 14.428704030508076 ], "wc_weaknesses_avg": [ 331.5, 256.2435365038502 ], "wc_questions_avg": [ 5.75, 3.766629793329841 ], "wc_review_avg": [ 444.0, 278.9327876030353 ], "wc_reply_reviewers_avg": [ 38.75, 67.11696879329399 ], "wc_reply_authors_avg": [ 560.25, 339.0850741333213 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.25, 
0.4330127018922193 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.5488604301969737, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:t7ISjxiSuAYJ:scholar.google.com/&scioq=ZGS-Based+Event-Driven+Algorithms+for+Bayesian+Optimization+in+Fully+Distributed+Multi-Agent+Systems&hl=en&as_sdt=0,47", "gs_version_total": 0 }, { "id": "7Zbg38nA0J", "title": "Explaining grokking through circuit efficiency", "track": "main", "status": "Reject", "tldr": "", "abstract": "We present a theory of grokking in neural networks which explains grokking in terms of the relative efficiency of competing emergent sub-networks (circuits). Grokking is an important generalisation phenomenon where continuing to train a network which already achieves nearly perfect training loss can still dramatically improve the test loss. Our theory explains why generalising circuits gradually out-compete memorising circuits. This is because memorising circuits are inefficient for compressing large datasets---the per-example cost is high---while generalising circuits have a larger fixed cost but better per-example efficiency. Strikingly, our theory is precise enough to produce novel predictions of previously unobserved phenomena: ungrokking and semi-grokking.", "keywords": "grokking;interpretability;generalisation;regularisation;weight decay", "primary_area": "visualization or interpretation of learned representations", "supplementary_material": "", "author": "Vikrant Varma;Rohin Shah;Zachary Kenton;Janos Kramar;Ramana Kumar", "authorids": "~Vikrant_Varma1;~Rohin_Shah1;~Zachary_Kenton2;~Janos_Kramar1;~Ramana_Kumar1", "gender": ";M;M;M;", "homepage": ";http://rohinshah.com/;https://zackenton.github.io/;;", "dblp": "281/7099;145/1009;209/9980;49/9013;", "google_scholar": "EPYHbToAAAAJ;odFQXSYAAAAJ;https://scholar.google.co.uk/citations?hl=en;;OyX1-qYAAAAJ", "orcid": ";;;;", "linkedin": ";rohin-shah-76405832/;zac-kenton-824429124/;;", "or_profile": "~Vikrant_Varma1;~Rohin_Shah1;~Zachary_Kenton2;~Janos_Kramar1;~Ramana_Kumar1", "aff": "Google DeepMind;Google DeepMind;Google DeepMind;Google DeepMind;Google DeepMind", "aff_domain": "deepmind.com;deepmind.com;google.com;deepmind.com;deepmind.com", "position": "Researcher;Researcher;Researcher;Researcher;Researcher", "bibtex": "@misc{\nvarma2024explaining,\ntitle={Explaining grokking through circuit efficiency},\nauthor={Vikrant Varma and Rohin Shah and Zachary Kenton and Janos Kramar and Ramana Kumar},\nyear={2024},\nurl={https://openreview.net/forum?id=7Zbg38nA0J}\n}", "github": "", "project": "", "reviewers": "JVYB;Rk5Z;m2MB;A2EW", "site": "https://openreview.net/forum?id=7Zbg38nA0J", "pdf_size": 1682327, "rating": "3;5;6;6", "confidence": "5;4;4;4", "soundness": "3;3;3;3", "contribution": "2;2;3;3", "presentation": "4;3;4;3", "wc_summary": "67;54;72;127", "wc_strengths": "45;34;107;59", "wc_weaknesses": "249;24;125;261", "wc_questions": "93;219;300;98", "wc_review": "454;331;604;545", "wc_reply_reviewers": "616;173;178;0", "wc_reply_authors": "2183;911;1432;786", "reply_reviewers": "1;1;1;0", "reply_authors": "3;2;3;1", "rating_avg": [ 5.0, 1.224744871391589 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.5, 0.5 ], "wc_summary_avg": [ 80.0, 27.919527216627433 ], "wc_strengths_avg": [ 61.25, 27.860141779969464 ], "wc_weaknesses_avg": [ 164.75, 97.15033453364944 ], "wc_questions_avg": [ 177.5, 86.8749100718959 ], "wc_review_avg": [ 
483.5, 102.99150450401237 ], "wc_reply_reviewers_avg": [ 241.75, 227.64926422020343 ], "wc_reply_authors_avg": [ 1328.0, 549.8849879747582 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 2.25, 0.82915619758885 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.9428090415820632, "gs_citation": 48, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=3942436453220632592&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "aff_unique_index": "0;0;0;0;0", "aff_unique_norm": "Google", "aff_unique_dep": "Google DeepMind", "aff_unique_url": "https://deepmind.com", "aff_unique_abbr": "DeepMind", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "United Kingdom" }, { "id": "7ZiFtNzzQA", "title": "A Neural Tangent Kernel Approach for Constrained Policy Gradient Reinforcement Learning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "This paper presents a constrained policy gradient method where we introduce constraints for safe learning, augmenting the traditional REINFORCE algorithm by taking the following steps. First, we analyze how the agent's policy changes if a new data batch is applied, leading to a nonlinear differential equation system in continuous time (gradient flow). This description of learning dynamics is connected to the neural tangent kernel (NTK) which enables us to evaluate the policy change at arbitrary states. \nNext, we introduce constraints for action probabilities based on the assumption that there are some environment states where we know how the agent should behave, ensuring safety during learning. Then, we augment the training batch with these states and compute fictitious rewards for them, making the policy obey the constraints with the help of the NTK-based formulation. More specifically, exogenous discounted sum of future rewards (returns) are computed at these constrained state-action pairs such that the policy network satisfies the constraints. Computing the constraining returns is based on solving a system of linear equations (equality constraints) or a constrained quadratic program (inequality constraints). To tackle high-dimensional environments, a dynamic constraint selection methodology is proposed. 
\nSimulation results demonstrate that adding constraints (external information) to the learning can improve learning in terms of speed and transparency reasonably if they are selected appropriately.", "keywords": "Reinforcement learning;Policy gradient methods;Constrained learning;Neural Tangent Kernel", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Balazs Varga;Attila Lischka;Balazs Kulcsar;Morteza Haghir Chehreghani", "authorids": "~Balazs_Varga1;~Attila_Lischka1;~Balazs_Kulcsar1;~Morteza_Haghir_Chehreghani2", "gender": "M;;;", "homepage": ";https://www.chalmers.se/personer/lischka/;;", "dblp": ";;;", "google_scholar": "OO4UlEIAAAAJ;;https://scholar.google.com/citations?hl=en;", "orcid": "0000-0002-2945-7974;;;", "linkedin": ";;;", "or_profile": "~Balazs_Varga1;~Attila_Lischka1;~Balazs_Kulcsar1;~Morteza_Haghir_Chehreghani2", "aff": "Budapest University of Technology and Economics;Chalmers University of Technology;Chalmers University of Technology;", "aff_domain": "bme.hu;chalmers.se;chalmers.se;", "position": "Researcher;PhD student;Prof;", "bibtex": "@misc{\nvarga2024a,\ntitle={A Neural Tangent Kernel Approach for Constrained Policy Gradient Reinforcement Learning},\nauthor={Balazs Varga and Attila Lischka and Balazs Kulcsar and Morteza Haghir Chehreghani},\nyear={2024},\nurl={https://openreview.net/forum?id=7ZiFtNzzQA}\n}", "github": "", "project": "", "reviewers": "RmLh;4Ecu;xmYU;P7MJ", "site": "https://openreview.net/forum?id=7ZiFtNzzQA", "pdf_size": 14551656, "rating": "3;5;5;6", "confidence": "3;4;3;3", "soundness": "1;2;3;3", "contribution": "1;3;3;3", "presentation": "2;3;2;3", "wc_summary": "70;90;24;134", "wc_strengths": "50;94;30;52", "wc_weaknesses": "180;151;155;68", "wc_questions": "318;95;136;5", "wc_review": "618;430;345;259", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.75, 1.0897247358851685 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 2.25, 0.82915619758885 ], "contribution_avg": [ 2.5, 0.8660254037844386 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 79.5, 39.53163290328392 ], "wc_strengths_avg": [ 56.5, 23.296995514443488 ], "wc_weaknesses_avg": [ 138.5, 42.19300889957956 ], "wc_questions_avg": [ 138.5, 113.95284112298386 ], "wc_review_avg": [ 413.0, 132.90410076442336 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.13245323570650439, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:HCbKudIvjDYJ:scholar.google.com/&scioq=A+Neural+Tangent+Kernel+Approach+for+Constrained+Policy+Gradient+Reinforcement+Learning&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1;1", "aff_unique_norm": "Budapest University of Technology and Economics;Chalmers University of Technology", "aff_unique_dep": ";", "aff_unique_url": "https://www.bme.hu;https://www.chalmers.se", "aff_unique_abbr": "BME;Chalmers", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;1", "aff_country_unique": "Hungary;Sweden" }, { "title": "Flag Aggregator: Scalable Distributed Training under Failures and Augmented Losses using Convex Optimization", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19354", "id": "7avlrpzWqo", "author_site": "Hamidreza Almasi, Harsh 
Mishra, Balajee Vamanan, Sathya N. Ravi", "tldr": "", "abstract": "Modern ML applications increasingly rely on complex deep learning models and large datasets. There has been an exponential growth in the amount of computation needed to train the largest models. Therefore, to scale computation and data, these models are inevitably trained in a distributed manner in clusters of nodes, and their updates are aggregated before being applied to the model. However, a distributed setup is prone to Byzantine failures of individual nodes, components, and software. With data augmentation added to these settings, there is a critical need for robust and efficient aggregation systems. We define the quality of workers as reconstruction ratios $\\in (0,1]$, and formulate aggregation as a Maximum Likelihood Estimation procedure using Beta densities. We show that the Regularized form of log-likelihood wrt subspace can be approximately solved using iterative least squares solver, and provide convergence guarantees using recent Convex Optimization landscape results. Our empirical findings demonstrate that our approach significantly enhances the robustness of state-of-the-art Byzantine resilient aggregators. We evaluate our method in a distributed setup with a parameter server, and show simultaneous improvements in communication efficiency and accuracy across various tasks.", "keywords": "Robust;Aggregation;Distributed;Training;Failure;Augmented;Byzantine;Resilience", "primary_area": "optimization", "supplementary_material": "/attachment/aae05857d3367152772f83487cd072c367bd1e99.zip", "author": "Hamidreza Almasi;Harsh Mishra;Balajee Vamanan;Sathya N. Ravi", "authorids": "~Hamidreza_Almasi1;~Harsh_Mishra1;~Balajee_Vamanan1;~Sathya_N._Ravi1", "gender": "M;M;M;M", "homepage": "https://hamidralmasi.github.io/;;https://www.cs.uic.edu/~balajee/;http://sathyaravi.com", "dblp": "241/0508;;;159/2123", "google_scholar": "OkUGKRAAAAAJ;;https://scholar.google.com.tw/citations?user=GKvAsQMAAAAJ;FW-0thoAAAAJ", "orcid": "0000-0002-4479-6464;;;0000-0003-3881-6323", "linkedin": "hamidralmasi/;harsh-mishra-515624144;;sathya-narayanan-ravi-74a5a128/", "or_profile": "~Hamidreza_Almasi1;~Harsh_Mishra1;~Balajee_Vamanan1;~Sathya_N._Ravi1", "aff": ";Rothamsted Research ;University of Illinois at Chicago;University of Illinois, Chicago", "aff_domain": ";rothamsted.ac.uk;uic.edu;uic.edu", "position": ";Researcher;Assistant Professor;Assistant Professor", "bibtex": "@inproceedings{\nalmasi2024flag,\ntitle={Flag Aggregator: Scalable Distributed Training under Failures and Augmented Losses using Convex Optimization},\nauthor={Hamidreza Almasi and Harsh Mishra and Balajee Vamanan and Sathya N. 
Ravi},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=7avlrpzWqo}\n}", "github": "", "project": "", "reviewers": "Es7u;PqPx;YEpb", "pdf_size": 1909941, "rating": "6;6;6", "confidence": "5;2;3", "soundness": "4;2;3", "contribution": "3;2;3", "presentation": "2;3;3", "wc_summary": "76;73;49", "wc_strengths": "99;34;28", "wc_weaknesses": "147;104;76", "wc_questions": "172;1;12", "wc_review": "494;212;165", "wc_reply_reviewers": "105;0;0", "wc_reply_authors": "1487;435;340", "reply_reviewers": "1;0;0", "reply_authors": "2;1;1", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 3.3333333333333335, 1.247219128924647 ], "soundness_avg": [ 3.0, 0.816496580927726 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 66.0, 12.083045973594572 ], "wc_strengths_avg": [ 53.666666666666664, 32.14895885647863 ], "wc_weaknesses_avg": [ 109.0, 29.20045661743437 ], "wc_questions_avg": [ 61.666666666666664, 78.14658590680011 ], "wc_review_avg": [ 290.3333333333333, 145.28668976276603 ], "wc_reply_reviewers_avg": [ 35.0, 49.49747468305833 ], "wc_reply_authors_avg": [ 754.0, 519.7582771507027 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 1.3333333333333333, 0.4714045207910317 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=17474371774670655893&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 8, "openreview": "https://openreview.net/forum?id=7avlrpzWqo", "pdf": "https://openreview.net/pdf?id=7avlrpzWqo", "email": ";rothamsted.ac.uk;uic.edu;uic.edu", "author_num": 4, "aff_unique_index": "0;1;1", "aff_unique_norm": "Rothamsted Research;University of Illinois at Chicago", "aff_unique_dep": ";", "aff_unique_url": "https://www.rothamsted.ac.uk;https://www.uic.edu", "aff_unique_abbr": "Rothamsted;UIC", "aff_campus_unique_index": "1;1", "aff_campus_unique": ";Chicago", "aff_country_unique_index": "0;1;1", "aff_country_unique": "United Kingdom;United States" }, { "id": "7b2itdrxMa", "title": "From Child's Play to AI: Insights into Automated Causal Curriculum Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "We study how reinforcement learning algorithms and children develop their causal curriculum to achieve a challenging goal that is not solvable at first. Adopting the Procgen environments that comprise various tasks as challenging goals, we found that 5- to 7-year-old children actively used their current level progress to determine their next step in the curriculum and made improvements to solving the goal during this process. To evaluate RL agents, we exposed them to the same demanding Procgen environments as children and employed several curriculum learning methodologies. Our results demonstrate that RL agents that emulate children by incorporating level progress as an intrinsic reward signal exhibit greater stability and are more likely to converge during training, compared to RL agents solely reliant on extrinsic reward signals for game-solving. Curriculum learning may also offer a significant reduction in the number of frames needed to solve a target environment. 
Taken together, our human-inspired findings suggest a potential path forward for addressing catastrophic forgetting or domain shift during curriculum learning in RL agents.", "keywords": "reinforcement learning;curriculum learning;cognitive science;cognitive development", "primary_area": "applications to neuroscience & cognitive science", "supplementary_material": "/attachment/c6239845071ec68cc8483ce302f108b8eb3ff372.pdf", "author": "Annya Dahmani;Eunice Yiu;Tabitha Edith Lee;Nan Rosemary Ke;Oliver Kroemer;Alison Gopnik", "authorids": "~Annya_Dahmani1;~Eunice_Yiu1;~Tabitha_Edith_Lee1;~Nan_Rosemary_Ke1;~Oliver_Kroemer1;~Alison_Gopnik1", "gender": "F;F;F;M;F;F", "homepage": ";https://ey242.github.io/;https://nke001.github.io/;https://www.ri.cmu.edu/ri-faculty/oliver-kroemer/;http://alisongopnik.com/;https://tabula-rosa.github.io/", "dblp": ";;120/5291;04/7743;49/2088;", "google_scholar": "75hAWYsAAAAJ;oqQDfCEAAAAJ;https://scholar.google.ca/citations?user=dxwPYhQAAAAJ;_tbXjP4AAAAJ;https://scholar.google.co.uk/citations?user=2tt6ZJ0AAAAJ;ZD6QUvYAAAAJ", "orcid": ";0000-0002-3505-5525;;;;", "linkedin": ";euniceyiu/;;;;tabithaedith", "or_profile": "~Annya_Dahmani1;~Eunice_Yiu1;~Nan_Rosemary_Ke1;~Oliver_Kroemer1;~Alison_Gopnik1;~Timothy_E_Lee1", "aff": "University of California, Berkeley;University of California, Berkeley;Google DeepMind;Carnegie Mellon University;;Carnegie Mellon University", "aff_domain": "berkeley.edu;berkeley.edu;deepmind.com;cmu.edu;;cmu.edu", "position": "PhD student;PhD student;Researcher;Assistant Professor;;PhD Student", "bibtex": "@misc{\ndahmani2024from,\ntitle={From Child's Play to {AI}: Insights into Automated Causal Curriculum Learning},\nauthor={Annya Dahmani and Eunice Yiu and Tabitha Edith Lee and Nan Rosemary Ke and Oliver Kroemer and Alison Gopnik},\nyear={2024},\nurl={https://openreview.net/forum?id=7b2itdrxMa}\n}", "github": "", "project": "", "reviewers": "FUEG;MFeg;tuxP;Rafo;5JBB", "site": "https://openreview.net/forum?id=7b2itdrxMa", "pdf_size": 8383889, "rating": "3;3;3;5;6", "confidence": "4;4;3;3;4", "soundness": "2;3;3;2;3", "contribution": "1;1;2;2;4", "presentation": "3;3;1;4;4", "wc_summary": "15;104;56;74;297", "wc_strengths": "32;28;32;15;130", "wc_weaknesses": "1249;113;135;6;133", "wc_questions": "2;65;130;162;65", "wc_review": "1298;310;353;257;625", "wc_reply_reviewers": "1014;310;171;0;0", "wc_reply_authors": "1862;681;455;849;312", "reply_reviewers": "3;2;1;0;0", "reply_authors": "4;2;2;2;1", "rating_avg": [ 4.0, 1.2649110640673518 ], "confidence_avg": [ 3.6, 0.4898979485566356 ], "soundness_avg": [ 2.6, 0.4898979485566356 ], "contribution_avg": [ 2.0, 1.0954451150103321 ], "presentation_avg": [ 3.0, 1.0954451150103321 ], "wc_summary_avg": [ 109.2, 98.22301156042815 ], "wc_strengths_avg": [ 47.4, 41.76888794306116 ], "wc_weaknesses_avg": [ 327.2, 463.34022057231334 ], "wc_questions_avg": [ 84.8, 55.933531982166116 ], "wc_review_avg": [ 568.6, 386.1754005630084 ], "wc_reply_reviewers_avg": [ 299.0, 375.9074354146244 ], "wc_reply_authors_avg": [ 831.8, 547.0866110589803 ], "reply_reviewers_avg": [ 1.2, 1.1661903789690602 ], "reply_authors_avg": [ 2.2, 0.9797958971132712 ], "replies_avg": [ 26, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=17615996309583098648&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 2, "aff_unique_index": "0;0;1;2;2", "aff_unique_norm": "University of California, Berkeley;Google;Carnegie Mellon University", 
"aff_unique_dep": ";Google DeepMind;", "aff_unique_url": "https://www.berkeley.edu;https://deepmind.com;https://www.cmu.edu", "aff_unique_abbr": "UC Berkeley;DeepMind;CMU", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Berkeley;", "aff_country_unique_index": "0;0;1;0;0", "aff_country_unique": "United States;United Kingdom" }, { "id": "7bIpWYhCdu", "title": "FILI: Syntax Repair By Learning From Own Mistakes", "track": "main", "status": "Reject", "tldr": "", "abstract": "Automatically fixing syntax errors in programs is a key challenge in Software Engineering community. Although, there are millions of programs on the web, both syntactically correct and incorrect, finding a large number of paired examples of programs is difficult. This makes training a program fixer using supervised learning difficult. Recently, BIFI, an unsupervised approach for learning a syntax fixer was proposed, in which an additional model (Breaker model) is used to augment data in each learning iteration to match real-world error distribution. In this paper, we propose a novel approach, FILI (Fix-It-Learn-It) for learning a syntax fixer without having to train any additional models for data augmentation. In each iteration, FILI carefully selects examples from the fixer's own predictions, both correct and incorrect, and uses those to fine-tune the fixer. We also show that gradually increasing the complexity of the examples during training leads to a more accurate fixer. Our evaluation on the Github-Python dataset shows that FILI outperforms BIFI by 1% while being significantly easier to train. Moreover, FILI avoids training the breaker model training a 13 million parameter breaker model in each iteration, which can take about 2 days on a modest DNN accelerator.", "keywords": "Automatic Program Repair;Software Engineering;Neural Syntax Fix", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/01b0c55cb4f8e8c344a1f03d0f02ed1f69f5cfdd.pdf", "author": "Sahil Bhatia;Navneet Potti;Rishabh Singh", "authorids": "~Sahil_Bhatia3;~Navneet_Potti1;~Rishabh_Singh1", "gender": ";;M", "homepage": ";;https://rishabhmit.bitbucket.io/", "dblp": ";;25/7056", "google_scholar": ";;https://scholar.google.com/citations?hl=en", "orcid": ";;", "linkedin": ";;", "or_profile": "~Sahil_Bhatia3;~Navneet_Potti1;~Rishabh_Singh1", "aff": ";;Meta", "aff_domain": ";;meta.com", "position": ";;Researcher", "bibtex": "@misc{\nbhatia2024fili,\ntitle={{FILI}: Syntax Repair By Learning From Own Mistakes},\nauthor={Sahil Bhatia and Navneet Potti and Rishabh Singh},\nyear={2024},\nurl={https://openreview.net/forum?id=7bIpWYhCdu}\n}", "github": "", "project": "", "reviewers": "9dQP;yQj5;5pCb;ydVV", "site": "https://openreview.net/forum?id=7bIpWYhCdu", "pdf_size": 281433, "rating": "3;5;5;6", "confidence": "5;3;4;4", "soundness": "3;3;3;3", "contribution": "2;2;3;2", "presentation": "3;3;3;4", "wc_summary": "113;49;171;138", "wc_strengths": "30;39;70;76", "wc_weaknesses": "58;137;83;163", "wc_questions": "117;16;104;50", "wc_review": "318;241;428;427", "wc_reply_reviewers": "0;28;0;0", "wc_reply_authors": "215;281;279;331", "reply_reviewers": "0;1;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 4.75, 1.0897247358851685 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 117.75, 44.70668294561787 ], 
"wc_strengths_avg": [ 53.75, 19.62619423117992 ], "wc_weaknesses_avg": [ 110.25, 41.74550874046213 ], "wc_questions_avg": [ 71.75, 40.831207427652686 ], "wc_review_avg": [ 353.5, 78.84954026498824 ], "wc_reply_reviewers_avg": [ 7.0, 12.12435565298214 ], "wc_reply_authors_avg": [ 276.5, 41.16734142496938 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.6488856845230502, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:BoC80p5zSlMJ:scholar.google.com/&scioq=FILI:+Syntax+Repair+By+Learning+From+Own+Mistakes&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0", "aff_unique_norm": "Meta", "aff_unique_dep": "Meta Platforms, Inc.", "aff_unique_url": "https://meta.com", "aff_unique_abbr": "Meta", "aff_country_unique_index": "0", "aff_country_unique": "United States" }, { "id": "7c3ZOKGQ6s", "title": "YOLOV6: A SINGLE-STAGE OBJECT DETECTION FRAMEWORK FOR INDUSTRIAL APPLICATIONS", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "We inaugurate YOLOv6, shipped with hardware-friendly architectural designs and a composite of novel training schemes tailored for industrial scenarios, which marks a new state-of-the-art real-time object detector as of early 2023. For a glimpse of performance, our YOLOv6-N hits 37.5% AP on the COCO dataset at a throughput of 1187 FPS tested with an NVIDIA Tesla T4 GPU. YOLOv6-S strikes 45.0% AP at 484 FPS, outperforming other mainstream detectors at the same scale (YOLOv5-S, YOLOv8-S, YOLOX-S, and PPYOLOE-S). Meantime, YOLOv6-M and L achieve better accuracy performance (50.0%/52.8% respectively) than other detectors at a similar inference speed. Additionally, with an extended backbone and neck design, our YOLOv6-L6 achieves state-of-the-art accuracy in real-time object detection. 
We carefully conducted extensive experiments to validate the effectiveness of each proposed component.", "keywords": "object detection;single-stage", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Chuyi Li;Bo Zhang;Lulu Li;Liang Li;Yifei Geng;Meng Cheng;Xu Xiaoming;Xiangxiang Chu;Xiaoming Wei", "authorids": "~Chuyi_Li1;~Bo_Zhang7;~Lulu_Li1;~Liang_Li10;~Yifei_Geng2;~Meng_Cheng2;~Xu_Xiaoming1;~Xiangxiang_Chu1;~Xiaoming_Wei1", "gender": "F;M;;M;M;;M;M;M", "homepage": "https://www.linkedin.cn/incareer/in/ACoAAD3J2pgBMaevrBlIBbqscuJvvv037e8MRyA;;https://github.com/meituan/YOLOv6;https://myaccount.google.com/?hl=zh-CN;https://github.com/meituan/YOLOv6;;;https://cxxgtxy.github.io/;https://www.linkedin.com/in/%E6%99%93%E6%98%8E-%E9%AD%8F-a0571b1a1/", "dblp": ";36/2259-46;;;;;;207/8002;", "google_scholar": ";uUNQnu0AAAAJ;;z_fYeJoAAAAJ;;;fFjtYN8AAAAJ;jn21pUsAAAAJ;", "orcid": ";0000-0003-0564-617X;;;;0000-0003-1734-5550;;0000-0003-2548-0605;0000-0002-7471-8344", "linkedin": "https://www.linkedin.cn/incareer/in/ACoAAD3J2pgBMaevrBlIBbqscuJvvv037e8MRyA;bo-zhang-20a86588/;;;;;;;", "or_profile": "~Chuyi_Li1;~Bo_Zhang7;~Lulu_Li1;~Liang_Li10;~Yifei_Geng2;~Meng_Cheng2;~Xu_Xiaoming1;~Xiangxiang_Chu1;~Wei_Xiaoming1", "aff": ";Meituan Inc.;;Meituan;;;;MeiTuan;Meituan", "aff_domain": ";meituan.com;;meituan.com;;;;meituan.com;meituan.com", "position": ";Senior Software Engineer;;Researcher;;;;Senior Engineer;Researcher", "bibtex": "@misc{\nli2024yolov,\ntitle={{YOLOV}6: A {SINGLE}-{STAGE} {OBJECT} {DETECTION} {FRAMEWORK} {FOR} {INDUSTRIAL} {APPLICATIONS}},\nauthor={Chuyi Li and Bo Zhang and Lulu Li and Liang Li and Yifei Geng and Meng Cheng and Xu Xiaoming and Xiangxiang Chu and Xiaoming Wei},\nyear={2024},\nurl={https://openreview.net/forum?id=7c3ZOKGQ6s}\n}", "github": "", "project": "", "reviewers": "W4rd;jptY;3aeD", "site": "https://openreview.net/forum?id=7c3ZOKGQ6s", "pdf_size": 761950, "rating": "3;3;3", "confidence": "5;4;5", "soundness": "2;1;3", "contribution": "2;2;2", "presentation": "2;2;3", "wc_summary": "47;55;103", "wc_strengths": "35;24;85", "wc_weaknesses": "155;460;215", "wc_questions": "1;2;64", "wc_review": "238;541;467", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 3.0, 0.0 ], "confidence_avg": [ 4.666666666666667, 0.4714045207910317 ], "soundness_avg": [ 2.0, 0.816496580927726 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 68.33333333333333, 24.729649321321876 ], "wc_strengths_avg": [ 48.0, 26.54555832275273 ], "wc_weaknesses_avg": [ 276.6666666666667, 131.93011618108866 ], "wc_questions_avg": [ 22.333333333333332, 29.465610840812758 ], "wc_review_avg": [ 415.3333333333333, 128.98148015208315 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 3, 0 ], "authors#_avg": [ 9, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 3106, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=13702720529764835843&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "aff_unique_index": "0;1;1;1", "aff_unique_norm": "Meituan Inc.;Meituan", "aff_unique_dep": ";", "aff_unique_url": "https://www.meituan.com;https://www.meituan.com", "aff_unique_abbr": "Meituan;Meituan", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", 
"aff_country_unique": "China" }, { "id": "7d2sWFIIPF", "title": "Backdoor Attack for Federated Learning with Fake Clients", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Federated Learning (FL) is a popular distributed machine learning paradigm that enables joint model training without sharing clients\u2019 data. Recent studies show that federated learning can be vulnerable to potential backdoor attacks from malicious clients: such attacks aim to mislead the global model into a targeted misprediction when a specific trigger pattern is presented. Although various types of federated backdoor attacks are proposed, most of them rely on the malicious client's local data to inject the backdoor trigger into the model. In this paper, we consider a new and more challenging scenario that the attacker can only control the fake clients, who do not possess any real data at all. Such a threat model sets a higher standard for the attacker that the attack must be conducted without relying on any real client data (only knowing the target class label). Meanwhile, the resulting malicious update should not be easily detected by the potential defenses. Specifically, we first simulate the normal client updates via modeling the historical global model trajectory. Then we simultaneously optimize the backdoor trigger and manipulate the model parameters in a data-free manner to achieve our attacking goal. Extensive experiments on multiple benchmark datasets show the effectiveness of the proposed attack in the fake client setting under state-of-the-art defenses.", "keywords": "Backdoor Atttack;Federated Learning", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "Pei Fang;Bochuan Cao;Jinyuan Jia;Jinghui Chen", "authorids": "~Pei_Fang1;~Bochuan_Cao1;~Jinyuan_Jia2;~Jinghui_Chen1", "gender": "M;;;M", "homepage": "https://greilfang.github.io/;https://aaaaaasuka.github.io/;https://jinyuan-jia.github.io/;https://jinghuichen.github.io/", "dblp": ";334/3881;24/5124-1.html;67/5633", "google_scholar": ";eOZCg2IAAAAJ;iyg4ytkAAAAJ;mKia7Y4AAAAJ", "orcid": ";;0000-0002-9785-7769;", "linkedin": ";;;", "or_profile": "~Pei_Fang1;~Bochuan_Cao1;~Jinyuan_Jia2;~Jinghui_Chen1", "aff": "Tongji University;Pennsylvania State University;Pennsylvania State University;Pennsylvania State University", "aff_domain": "tongji.edu.cn;psu.edu;psu.edu;psu.edu", "position": "MS student;PhD student;Assistant Professor;Assistant Professor", "bibtex": "@misc{\nfang2024backdoor,\ntitle={Backdoor Attack for Federated Learning with Fake Clients},\nauthor={Pei Fang and Bochuan Cao and Jinyuan Jia and Jinghui Chen},\nyear={2024},\nurl={https://openreview.net/forum?id=7d2sWFIIPF}\n}", "github": "", "project": "", "reviewers": "9itP;JM2E;DwZd;Sevc", "site": "https://openreview.net/forum?id=7d2sWFIIPF", "pdf_size": 450129, "rating": "3;3;5;5", "confidence": "3;4;4;4", "soundness": "2;2;3;2", "contribution": "2;2;3;3", "presentation": "2;2;3;3", "wc_summary": "47;108;117;51", "wc_strengths": "35;44;58;28", "wc_weaknesses": "262;88;73;76", "wc_questions": "122;80;156;160", "wc_review": "466;320;404;315", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 80.75, 31.940374136819376 ], "wc_strengths_avg": 
[ 41.25, 11.211043662389331 ], "wc_weaknesses_avg": [ 124.75, 79.43983572490568 ], "wc_questions_avg": [ 129.5, 32.16753021293366 ], "wc_review_avg": [ 376.25, 62.73107284273082 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.5773502691896257, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=7138459469686333820&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 0, "aff_unique_index": "0;1;1;1", "aff_unique_norm": "Tongji University;Pennsylvania State University", "aff_unique_dep": ";", "aff_unique_url": "https://www.tongji.edu.cn;https://www.psu.edu", "aff_unique_abbr": "Tongji;PSU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;1;1", "aff_country_unique": "China;United States" }, { "id": "7duh4Ml5rc", "title": "Based on What We Can Control Artificial Neural Networks", "track": "main", "status": "Reject", "tldr": "", "abstract": "How can the stability and efficiency of Artificial Neural Networks (ANNs) be ensured through a systematic analysis method? This paper seeks to address that query. While numerous factors can influence the learning process of ANNs, utilizing knowledge from control systems allows us to analyze its system function and simulate system responses. Although the complexity of most ANNs is extremely high, we still can analyze each factor (e.g., optimiser, hyperparameters) by simulating their system response. This new method also can potentially benefit the development of new optimiser and learning system, especially when discerning which components adversely affect ANNs. Controlling ANNs can benefit from the design of optimiser and learning system, as (1) all optimisers act as controllers, (2) all learning systems operate as control systems with inputs and outputs, and (3) the optimiser should match the learning system. 
We will share the source code of this work after the paper has been accepted for publication.", "keywords": "optimizer;controller;learning system;control system;fuzzy logic;filter", "primary_area": "optimization", "supplementary_material": "/attachment/4827c5e1144c8aadb33c88a7d92c1a0b65ba8a27.zip", "author": "Cheng Kang;Xujing Yao", "authorids": "~Cheng_Kang1;~Xujing_Yao1", "gender": "M;F", "homepage": "https://chengkang520.github.io/about/;", "dblp": ";", "google_scholar": "https://scholar.google.com/citations?hl=tr;", "orcid": "0000-0001-9546-4585;0000-0001-8735-5573", "linkedin": ";", "or_profile": "~Cheng_Kang1;~Xujing_Yao1", "aff": "Czech Technical Univeresity in Prague, Czech Technical University of Prague;University of Leicester", "aff_domain": "fel.cvut.cz;le.ac.uk", "position": "PhD student;PhD student", "bibtex": "@misc{\nkang2024based,\ntitle={Based on What We Can Control Artificial Neural Networks},\nauthor={Cheng Kang and Xujing Yao},\nyear={2024},\nurl={https://openreview.net/forum?id=7duh4Ml5rc}\n}", "github": "", "project": "", "reviewers": "jZKP;WG3Y;egTB", "site": "https://openreview.net/forum?id=7duh4Ml5rc", "pdf_size": 1102247, "rating": "1;1;3", "confidence": "4;2;3", "soundness": "2;1;1", "contribution": "1;2;2", "presentation": "2;1;1", "wc_summary": "30;60;64", "wc_strengths": "31;61;45", "wc_weaknesses": "125;103;130", "wc_questions": "24;38;208", "wc_review": "210;262;447", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 1.6666666666666667, 0.9428090415820634 ], "confidence_avg": [ 3.0, 0.816496580927726 ], "soundness_avg": [ 1.3333333333333333, 0.4714045207910317 ], "contribution_avg": [ 1.6666666666666667, 0.4714045207910317 ], "presentation_avg": [ 1.3333333333333333, 0.4714045207910317 ], "wc_summary_avg": [ 51.333333333333336, 15.173075568988056 ], "wc_strengths_avg": [ 45.666666666666664, 12.256517540566822 ], "wc_weaknesses_avg": [ 119.33333333333333, 11.728408057172787 ], "wc_questions_avg": [ 90.0, 83.63412381717565 ], "wc_review_avg": [ 306.3333333333333, 101.7065495542063 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:G0yUQEppL-4J:scholar.google.com/&scioq=Based+on+What+We+Can+Control+Artificial+Neural+Networks&hl=en&as_sdt=0,5", "gs_version_total": 3, "aff_unique_index": "0;1", "aff_unique_norm": "Czech Technical University in Prague;University of Leicester", "aff_unique_dep": ";", "aff_unique_url": "https://www.ctu.cz;https://www.leicester.ac.uk", "aff_unique_abbr": "CTU;Leicester", "aff_campus_unique_index": "0", "aff_campus_unique": "Prague;", "aff_country_unique_index": "0;1", "aff_country_unique": "Czech Republic;United Kingdom" }, { "id": "7eYmijcuqO", "title": "On the Dynamics of Learning Time-Aware Behavior with RNNs", "track": "main", "status": "Reject", "tldr": "", "abstract": "Recurrent Neural Networks (RNNs) have shown great success in modeling time-dependent patterns, but there is limited research on how they develop representations of temporal features during training. To address this gap, we use timed automata (TA) to introduce a family of supervised learning tasks modeling behavior dependent on hidden temporal variables whose complexity is directly controllable. 
Building upon past studies from the perspective of dynamical systems theory, we train RNNs to emulate a new class of TA called temporal flipflops, and we find they undergo *phase transitions during training* characterized by sudden and rapid discovery of the hidden time-dependent features. In the case of periodic \"time-of-day\" aware flipflop, we show that the RNNs learn stable periodic cycles that encode time modulo the period of the transition rules. We then use fixed point stability analysis to monitor changes in the RNN dynamics during training, and we observe that the phase transition coincides with a *bifurcation* from which stable periodic behavior emerges. We also show that these cycles initially lose stability if the RNN is later trained on the same TA task but with a different period, and we explain this result through analysis of a simple differential equation for learning oscillations via gradient flow. Through this work, we demonstrate how dynamical systems theory can provide insights into not only learned representations, but also the dynamics and pathologies of the learning process itself.", "keywords": "recurrent neural networks;latent temporal features;developmental interpretability;phase transitions;dynamical systems theory", "primary_area": "visualization or interpretation of learned representations", "supplementary_material": "", "author": "Peter DelMastro;Rushiv Arora;Edward Rietman;Hava T Siegelmann", "authorids": "~Peter_DelMastro1;~Rushiv_Arora1;~Edward_Rietman1;~Hava_T_Siegelmann1", "gender": "M;M;;F", "homepage": ";https://rushivarora.github.io;;https://www.cics.umass.edu/faculty/directory/siegelmann_hava", "dblp": ";;32/3819.html;s/HavaTSiegelmann.html", "google_scholar": ";LxFWdpgAAAAJ;https://scholar.google.com/scholar?hl=en;https://scholar.google.co.il/citations?user=A2fiOI0AAAAJ", "orcid": ";;;0000-0003-4938-8723", "linkedin": "pdelmastro;rushiv-arora/;erietman/?midToken=AQGMbfgM-nipWg&midSig=2tulkv3VchiGM1&trk=eml-email_next_best_action_digest_01-header-68-profile&trkEmail=eml-email_next_best_action_digest_01-header-68-profile-null-1i4vs%7Elhnyy0hm%7Ezo-null-neptune%2Fprofile%7Evanity%2Eview;hava-siegelmann-4b272a/", "or_profile": "~Peter_DelMastro1;~Rushiv_Arora1;~Edward_Rietman1;~Hava_T_Siegelmann1", "aff": "Virginia Polytechnic Institute and State University;Dell AI Research;University of Massachusetts at Amherst;University of Massachusetts at Amherst", "aff_domain": "vt.edu;dell.com;umass.edu;umass.edu", "position": "PhD student;Research Scientist;Principal Researcher;Full Professor", "bibtex": "@misc{\ndelmastro2024on,\ntitle={On the Dynamics of Learning Time-Aware Behavior with {RNN}s},\nauthor={Peter DelMastro and Rushiv Arora and Edward Rietman and Hava T Siegelmann},\nyear={2024},\nurl={https://openreview.net/forum?id=7eYmijcuqO}\n}", "github": "", "project": "", "reviewers": "oza4;HfNN;kx7S;cxSU", "site": "https://openreview.net/forum?id=7eYmijcuqO", "pdf_size": 2725167, "rating": "3;3;3;3", "confidence": "3;2;3;4", "soundness": "3;3;3;3", "contribution": "2;3;2;2", "presentation": "3;3;1;2", "wc_summary": "70;51;65;96", "wc_strengths": "83;28;94;36", "wc_weaknesses": "148;161;169;271", "wc_questions": "87;16;217;12", "wc_review": "388;256;545;415", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 3.0, 0.0 ], "confidence_avg": [ 3.0, 0.7071067811865476 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 
2.25, 0.82915619758885 ], "wc_summary_avg": [ 70.5, 16.28649747490233 ], "wc_strengths_avg": [ 60.25, 28.656369274560934 ], "wc_weaknesses_avg": [ 187.25, 48.93043531382078 ], "wc_questions_avg": [ 83.0, 82.91863481751253 ], "wc_review_avg": [ 401.0, 102.62309681548301 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 6, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:CWhABIkI-XQJ:scholar.google.com/&scioq=On+the+Dynamics+of+Learning+Time-Aware+Behavior+with+RNNs&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1;2;2", "aff_unique_norm": "Virginia Tech;Dell;University of Massachusetts Amherst", "aff_unique_dep": ";Dell AI Research;", "aff_unique_url": "https://www.vt.edu;https://www.dell.com;https://www.umass.edu", "aff_unique_abbr": "VT;Dell;UMass Amherst", "aff_campus_unique_index": "1;1", "aff_campus_unique": ";Amherst", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "id": "7em7Jl0qMm", "title": "Fourier Ordinary Differential Equations", "track": "main", "status": "Reject", "tldr": "", "abstract": "Continuous models such as Neural Ordinary Differential Equations (NODEs) are powerful approaches for modeling time series data, known for their ability to capture underlying dynamics and generalization. Current continuous models focus on learning mappings within finite-dimensional Euclidean spaces, raising two critical questions for enhancing their effectiveness. First, Is Euclidean space the optimal representation for capturing the underlying patterns and features in time series data? Second, how can we maintain granularity while benefiting from the generalization capabilities of continuous models? To address the first question, we propose a novel approach for learning dynamics in the Fourier domain. In contrast to Euclidean space, each point in Fourier space summarizes the original signal at a specific frequency, enabling more comprehensive data representations. Additionally, time differentiation in the Fourier domain simplifies the modeling of dynamics as it becomes a multiplication operation. To answer the second question, we introduce element-wise filtering, a method designed to compensate for the bias of continuous models when fitting discrete data points. These techniques culminate in the introduction of a new approach\u2014Fourier Ordinary Differential Equations (FODEs). Our experiments provide compelling evidence of FODEs' superiority in terms of accuracy, efficiency, and generalization capabilities when compared to existing methods across various time series datasets. 
By offering a novel method for modeling time series data capable of capturing both short-term and long-term patterns, FODEs have the potential to significantly enhance the modeling and prediction of complex dynamic systems.", "keywords": "Neural Ordinary Differential Equations;Time Series;Fourier;FFT", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Muhao Guo;Yang Weng", "authorids": "~Muhao_Guo1;~Yang_Weng1", "gender": "M;", "homepage": ";", "dblp": "345/6430;", "google_scholar": "wIOmifAAAAAJ;", "orcid": "0000-0002-9890-8214;", "linkedin": "muhaoguo/;", "or_profile": "~Muhao_Guo1;~Yang_Weng1", "aff": "Arizona State University;", "aff_domain": "asu.edu;", "position": "PhD student;", "bibtex": "@misc{\nguo2024fourier,\ntitle={Fourier Ordinary Differential Equations},\nauthor={Muhao Guo and Yang Weng},\nyear={2024},\nurl={https://openreview.net/forum?id=7em7Jl0qMm}\n}", "github": "", "project": "", "reviewers": "GqMG;MSqR;hxik;cX5F", "site": "https://openreview.net/forum?id=7em7Jl0qMm", "pdf_size": 4609813, "rating": "3;5;5;6", "confidence": "4;4;4;4", "soundness": "2;3;2;3", "contribution": "2;2;2;3", "presentation": "2;3;2;3", "wc_summary": "71;79;194;51", "wc_strengths": "48;61;91;26", "wc_weaknesses": "265;172;259;102", "wc_questions": "158;319;2;1", "wc_review": "542;631;546;180", "wc_reply_reviewers": "10;111;21;11", "wc_reply_authors": "512;611;485;161", "reply_reviewers": "1;1;1;1", "reply_authors": "1;1;1;1", "rating_avg": [ 4.75, 1.0897247358851685 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 98.75, 55.930202037897196 ], "wc_strengths_avg": [ 56.5, 23.521266972678152 ], "wc_weaknesses_avg": [ 199.5, 67.2551113299205 ], "wc_questions_avg": [ 120.0, 131.4629225295102 ], "wc_review_avg": [ 474.75, 173.84673566104138 ], "wc_reply_reviewers_avg": [ 38.25, 42.22188413607332 ], "wc_reply_authors_avg": [ 442.25, 169.01978434491033 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.0, "gs_citation": -1, "gs_cited_by_link": "", "gs_version_total": -1, "aff_unique_index": "0", "aff_unique_norm": "Arizona State University", "aff_unique_dep": "", "aff_unique_url": "https://www.asu.edu", "aff_unique_abbr": "ASU", "aff_country_unique_index": "0", "aff_country_unique": "United States" }, { "title": "Can Sensitive Information Be Deleted From LLMs? Objectives for Defending Against Extraction Attacks", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19353", "id": "7erlRDoaV8", "author_site": "Vaidehi Ramesh Patil, Peter Hase, Mohit Bansal", "tldr": "", "abstract": "Pretrained language models sometimes possess knowledge that we do not wish them to, including memorized personal information and knowledge that could be used to harm people. They can also output toxic or harmful text. To mitigate these safety and informational issues, we propose an attack-and-defense framework for studying the task of deleting sensitive information directly from model weights. 
We study direct edits to model weights because (1) this approach should guarantee that particular deleted information is never extracted by future prompt attacks, and (2) it should protect against whitebox attacks, which is necessary for making claims about safety/privacy in a setting where publicly available model weights could be used to elicit sensitive information. Our threat model assumes that an attack succeeds if the answer to a sensitive question is located among a set of B generated candidates, based on scenarios where the information would be insecure if the answer is among B candidates. Experimentally, we show that even state-of-the-art model editing methods such as ROME struggle to truly delete factual information from models like GPT-J, as our whitebox and blackbox attacks can recover \u201cdeleted\u201d information from an edited model 38% of the time. These attacks leverage two key observations: (1) that traces of deleted information can be found in intermediate model hidden states, and (2) that applying an editing method for one question may not delete information across rephrased versions of the question. Finally, we provide new defense methods that protect against some extraction attacks, but we do not find a single universally effective defense method. Our results suggest that truly deleting sensitive information is a tractable but difficult problem, since even relatively low attack success rates have potentially severe implications for the deployment of language models in a world where individuals enjoy ownership of their personal data, a right to privacy, and safety from harmful model outputs.", "keywords": "Sensitive Information Deletion;Privacy Attacks;Model editing;Language Models", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/fb642952d68748c4c3da0a925fd0602ac68ae134.zip", "author": "Vaidehi Patil;Peter Hase;Mohit Bansal", "authorids": "~Vaidehi_Patil1;~Peter_Hase1;~Mohit_Bansal2", "gender": "F;;M", "homepage": "https://vaidehi99.github.io/;;https://www.cs.unc.edu/~mbansal/", "dblp": "294/5205;;32/5243.html", "google_scholar": "wCt6wSAAAAAJ;;DN8QtscAAAAJ", "orcid": ";;", "linkedin": ";;", "or_profile": "~Vaidehi_Patil1;~Peter_Hase1;~Mohit_Bansal2", "aff": "Department of Computer Science, University of North Carolina at Chapel Hill;;University of North Carolina at Chapel Hill", "aff_domain": "cs.unc.edu;;unc.edu", "position": "PhD student;;Full Professor", "bibtex": "@inproceedings{\npatil2024can,\ntitle={Can Sensitive Information Be Deleted From {LLM}s? 
Objectives for Defending Against Extraction Attacks},\nauthor={Vaidehi Patil and Peter Hase and Mohit Bansal},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=7erlRDoaV8}\n}", "github": "", "project": "", "reviewers": "X7HP;KWLr;GnJt;174w", "pdf_size": 644259, "rating": "6;8;8;8", "confidence": "3;4;3;3", "soundness": "3;4;4;2", "contribution": "2;3;3;3", "presentation": "3;3;4;3", "wc_summary": "164;127;67;118", "wc_strengths": "112;32;27;57", "wc_weaknesses": "202;110;30;150", "wc_questions": "84;91;84;151", "wc_review": "562;360;208;476", "wc_reply_reviewers": "0;21;0;0", "wc_reply_authors": "694;507;427;759", "reply_reviewers": "0;1;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 7.5, 0.8660254037844386 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 3.25, 0.82915619758885 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 119.0, 34.61935874622752 ], "wc_strengths_avg": [ 57.0, 33.726843908080106 ], "wc_weaknesses_avg": [ 123.0, 62.82515419798029 ], "wc_questions_avg": [ 102.5, 28.146935890075138 ], "wc_review_avg": [ 401.5, 132.73563952458284 ], "wc_reply_reviewers_avg": [ 5.25, 9.093266739736606 ], "wc_reply_authors_avg": [ 596.75, 134.77087036893394 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.3333333333333333, "gs_citation": 96, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=17466616399348737261&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=7erlRDoaV8", "pdf": "https://openreview.net/pdf?id=7erlRDoaV8", "email": "cs.unc.edu;;unc.edu", "author_num": 3, "aff_unique_index": "0;1", "aff_unique_norm": "University of North Carolina at Chapel Hill;University of North Carolina", "aff_unique_dep": "Department of Computer Science;", "aff_unique_url": "https://www.unc.edu;https://www.unc.edu", "aff_unique_abbr": "UNC Chapel Hill;UNC", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Chapel Hill", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "id": "7essnmWOK5", "title": "Graph Neural Networks for Multivariate Time-Series Forecasting via Learning Hierarchical Spatiotemporal Dependencies", "track": "main", "status": "Reject", "tldr": "", "abstract": "Multivariate time-series forecasting is one of the essential tasks to draw insights from sequential data. Spatiotemporal Graph Neural Networks (STGNNs) have attracted much attention in this field due to their capability to capture the underlying spatiotemporal dependencies. However, current STGNN solutions still fall short of providing trustworthy predictions due to insufficient modeling of the dependencies and dynamics at different levels. In this paper, we propose a graph neural network model for multivariate time-series forecasting via learning hierarchical spatiotemporal dependencies (HSDGNN). Specifically, we organize variables as nodes in a graph while each node serves as a subgraph consisting of the attributes of variables. Then we design two-level convolutions on the hierarchical graph to model the spatial dependencies with different granularities. The changes in graph topologies are also encoded for strengthening dependency modeling across time and spatial dimensions. 
We test the proposed model on real-world datasets from different domains. The experimental results demonstrate the superiority of HSDGNN over state-of-the-art baselines in terms of prediction accuracy.", "keywords": "Multivariate time-series forecasting;Spatiotemporal graph neural networks;Deep learning", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Zhou Zhou;Ronisha Basker;Dit-Yan Yeung", "authorids": "~Zhou_Zhou6;~Ronisha_Basker1;~Dit-Yan_Yeung2", "gender": "Not Specified;F;M", "homepage": ";;https://cse.hkust.edu.hk/faculty/dyyeung/", "dblp": ";;41/5668", "google_scholar": ";;nEsOOx8AAAAJ", "orcid": "0000-0002-6490-8945;;0000-0003-3716-8125", "linkedin": ";ronisha-basker;", "or_profile": "~Zhou_Zhou6;~Ronisha_Basker1;~Dit-Yan_Yeung2", "aff": "Hong Kong University of Science and Technology;;Hong Kong University of Science and Technology", "aff_domain": "ust.hk;;ust.hk", "position": "Postdoc;;Chair Professor", "bibtex": "@misc{\nzhou2024graph,\ntitle={Graph Neural Networks for Multivariate Time-Series Forecasting via Learning Hierarchical Spatiotemporal Dependencies},\nauthor={Zhou Zhou and Ronisha Basker and Dit-Yan Yeung},\nyear={2024},\nurl={https://openreview.net/forum?id=7essnmWOK5}\n}", "github": "", "project": "", "reviewers": "MDiL;MTEy;kfob;7UwB", "site": "https://openreview.net/forum?id=7essnmWOK5", "pdf_size": 13118596, "rating": "3;3;3;5", "confidence": "4;4;4;4", "soundness": "2;3;2;3", "contribution": "1;2;1;2", "presentation": "2;3;1;3", "wc_summary": "64;99;58;100", "wc_strengths": "22;47;26;233", "wc_weaknesses": "356;170;61;103", "wc_questions": "14;4;126;152", "wc_review": "456;320;271;588", "wc_reply_reviewers": "32;16;28;23", "wc_reply_authors": "800;653;658;687", "reply_reviewers": "1;1;1;1", "reply_authors": "1;1;1;1", "rating_avg": [ 3.5, 0.8660254037844386 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 1.5, 0.5 ], "presentation_avg": [ 2.25, 0.82915619758885 ], "wc_summary_avg": [ 80.25, 19.369757355217438 ], "wc_strengths_avg": [ 82.0, 87.6954958934608 ], "wc_weaknesses_avg": [ 172.5, 112.85056490775754 ], "wc_questions_avg": [ 74.0, 65.7419196555744 ], "wc_review_avg": [ 408.75, 123.70807370580144 ], "wc_reply_reviewers_avg": [ 24.75, 5.973901572674261 ], "wc_reply_authors_avg": [ 699.5, 59.457968347396466 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:oHwDBhFEwyMJ:scholar.google.com/&scioq=Graph+Neural+Networks+for+Multivariate+Time-Series+Forecasting+via+Learning+Hierarchical+Spatiotemporal+Dependencies&hl=en&as_sdt=0,44", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "Hong Kong University of Science and Technology", "aff_unique_dep": "", "aff_unique_url": "https://www.ust.hk", "aff_unique_abbr": "HKUST", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Hong Kong SAR", "aff_country_unique_index": "0;0", "aff_country_unique": "China" }, { "title": "SpikePoint: An Efficient Point-based Spiking Neural Network for Event Cameras Action Recognition", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19352", "id": "7etoNfU9uF", "author_site": "Hongwei Ren, Yue ZHOU, Xiaopeng LIN, Yulong Huang, Haotian FU, Jie Song, Bojun Cheng", "tldr": "", "abstract": "Event cameras are 
bio-inspired sensors that respond to local changes in light intensity and feature low latency, high energy efficiency, and high dynamic range. Meanwhile, Spiking Neural Networks (SNNs) have gained significant attention due to their remarkable efficiency and fault tolerance. By synergistically harnessing the energy efficiency inherent in event cameras and the spike-based processing capabilities of SNNs, their integration could enable ultra-low-power application scenarios, such as action recognition tasks. However, existing approaches often entail converting asynchronous events into conventional frames, leading to additional data mapping efforts and a loss of sparsity, contradicting the design concept of SNNs and event cameras. To address this challenge, we propose SpikePoint, a novel end-to-end point-based SNN architecture. SpikePoint excels at processing sparse event cloud data, effectively extracting both global and local features through a singular-stage structure. Leveraging the surrogate training method, SpikePoint achieves high accuracy with few parameters and maintains low power consumption, specifically employing the identity mapping feature extractor on diverse datasets. SpikePoint achieves state-of-the-art (SOTA) performance on four event-based action recognition datasets using only 16 timesteps, surpassing other SNN methods. Moreover, it also achieves SOTA performance across all methods on three datasets, utilizing approximately 0.3 % of the parameters and 0.5 % of power consumption employed by artificial neural networks (ANNs). These results emphasize the significance of Point Cloud and pave the way for many ultra-low-power event-based data processing applications.", "keywords": "Spiking Neural Network;Point Cloud;Event Camera;Action Recognition", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Hongwei Ren;Yue Zhou;Xiaopeng LIN;Yulong Huang;Haotian FU;Jie Song;Bojun Cheng", "authorids": "~Hongwei_Ren2;~Yue_Zhou8;~Xiaopeng_LIN1;~Yulong_Huang2;~Haotian_FU4;~Jie_Song1;~Bojun_Cheng1", "gender": "M;F;;;M;M;M", "homepage": "http://rhwdmx.github.io;;https://github.com/xplin13;;;https://ait.ethz.ch/people/song/;https://personal.hkust-gz.edu.cn/bojuncheng/index.html", "dblp": ";;;;;09/4756-6;285/0564", "google_scholar": "https://scholar.google.com.hk/citations?user=eD60q1YAAAAJ;;;;;https://scholar.google.com/citations?hl=en;https://scholar.google.ch/citations?user=Zisp-_IAAAAJ", "orcid": ";0000-0001-9323-4524;;;0000-0001-5445-4487;0009-0003-7484-1937;", "linkedin": ";;;;;;", "or_profile": "~Hongwei_Ren2;~Yue_Zhou8;~Xiaopeng_LIN1;~Yulong_Huang2;~Haotian_FU4;~Jie_Song1;~Bojun_Cheng1", "aff": "Hong Kong University of Science and Technology;Hong Kong University of Science and Technology;Hong Kong University of Science and Technology;;Hong Kong University of Science and Technology;ETHZ - ETH Zurich;The Hong Kong University of Science and Technology (Guangzhou)", "aff_domain": "connect.hkust-gz.edu.cn;hkust.edu;hkust.edu;;hkust.edu;ethz.ch;hkust-gz.edu.cn", "position": "PhD student;PhD student;PhD student;;PhD student;Postdoc;Assistant Professor", "bibtex": "@inproceedings{\nren2024spikepoint,\ntitle={SpikePoint: An Efficient Point-based Spiking Neural Network for Event Cameras Action Recognition},\nauthor={Hongwei Ren and Yue Zhou and Xiaopeng LIN and Yulong Huang and Haotian FU and Jie Song and Bojun Cheng},\nbooktitle={The Twelfth International Conference on Learning 
Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=7etoNfU9uF}\n}", "github": "", "project": "", "reviewers": "NnWo;tiMk;qCNh;XXP9", "pdf_size": 11954613, "rating": "3;6;6;8", "confidence": "5;4;4;3", "soundness": "2;3;3;4", "contribution": "2;3;3;4", "presentation": "3;2;3;4", "wc_summary": "106;45;47;145", "wc_strengths": "47;69;19;87", "wc_weaknesses": "59;133;122;36", "wc_questions": "33;284;4;1", "wc_review": "245;531;192;269", "wc_reply_reviewers": "49;0;15;0", "wc_reply_authors": "809;872;731;106", "reply_reviewers": "1;0;1;0", "reply_authors": "2;2;1;1", "rating_avg": [ 5.75, 1.7853571071357126 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 3.0, 0.7071067811865476 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 85.75, 42.07953778263255 ], "wc_strengths_avg": [ 55.5, 25.391927851189244 ], "wc_weaknesses_avg": [ 87.5, 41.00304866714181 ], "wc_questions_avg": [ 80.5, 118.1535018524631 ], "wc_review_avg": [ 309.25, 131.02361428383816 ], "wc_reply_reviewers_avg": [ 16.0, 20.0124960961895 ], "wc_reply_authors_avg": [ 629.5, 306.34172095880115 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.9901475429766743, "gs_citation": 25, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=2749373382167214942&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=7etoNfU9uF", "pdf": "https://openreview.net/pdf?id=7etoNfU9uF", "email": "connect.hkust-gz.edu.cn;hkust.edu;hkust.edu;;hkust.edu;ethz.ch;hkust-gz.edu.cn", "author_num": 7, "aff_unique_index": "0;0;0;0;1;0", "aff_unique_norm": "Hong Kong University of Science and Technology;ETH Zurich", "aff_unique_dep": ";", "aff_unique_url": "https://www.ust.hk;https://www.ethz.ch", "aff_unique_abbr": "HKUST;ETHZ", "aff_campus_unique_index": "0;0;0;0;2", "aff_campus_unique": "Hong Kong SAR;;Guangzhou", "aff_country_unique_index": "0;0;0;0;1;0", "aff_country_unique": "China;Switzerland" }, { "id": "7ezBaMwOqY", "title": "Trading-off Multiple Properties for Molecular Optimization", "track": "main", "status": "Reject", "tldr": "", "abstract": "Molecular optimization, a critical research area in drug discovery, aims to enhance the properties or performance of molecules through systematic modifications of their chemical structures. Recently, existing Multi-Objective Molecular Optimization (MOMO) methods are extended from Single-Objective Molecular Optimization (SOMO) approaches by employing techniques such as Linear Scalarization, Evolutionary Algorithms, and Multi-Objective Bayesian Optimization. In Multi-Objective Optimization, the ideal goal is to find Pareto optimal solutions over different preferences, which indicate the importance of different objectives. However, these straightforward extensions often struggle with trading off multiple properties due to the conflicting or correlated nature of certain properties. More specifically, current MOMO methods derived from SOMO are still challenged in finding preference-conditioned Pareto solutions and exhibit low efficiency in Pareto search. 
To address the aforementioned problems, we propose the \\textbf{P}reference-\\textbf{C}onditioned \\textbf{I}nversion (PCI) framework, efficiently ``inverting'' a pre-trained surrogate oracle under the guidance of a non-dominated gradient, to generate candidate Pareto optimal molecules over preference-conditioned distributions. Additionally, we provide theoretical guarantees for PCI's capability in converging to preference-conditioned solutions. This unique characteristic enables PCI to search the full Pareto front approximately, thereby assisting in the discovery of diverse molecules with varying ratios of properties. Comprehensive experimental evaluations show that our model significantly outperforms state-of-the-art baselines in multi-objective molecular optimization settings.", "keywords": "Molecular Optimization;Multiple Properties", "primary_area": "applications to physical sciences (physics, chemistry, biology, etc.)", "supplementary_material": "", "author": "Yifan Niu;Ziqi Gao;Tingyang Xu;Yatao Bian;Yu Rong;Jia Li", "authorids": "~Yifan_Niu1;~Ziqi_Gao1;~Tingyang_Xu1;~Yatao_Bian1;~Yu_Rong1;~Jia_Li4", "gender": "Non-Binary;;M;M;M;M", "homepage": "https://nyf0808.github.io/;;;https://royrong.me/;https://sites.google.com/view/lijia;https://yataobian.com", "dblp": ";;157/0940;24/10036-1;23/6950-9;222/2694", "google_scholar": ";https://scholar.google.com.hk/citations?user=UHwNFy8AAAAJ;6gIs5YMAAAAJ;https://scholar.google.com.hk/citations?user=itezhEMAAAAJ;1gSbcYoAAAAJ;oZBTlBkAAAAJ", "orcid": ";;0009-0002-0106-8376;0000-0001-7387-302X;0000-0002-6362-4385;0000-0002-2368-4084", "linkedin": ";;;;;", "or_profile": "~Yifan_Niu1;~Ziqi_Gao1;~Tingyang_Xu1;~Yu_Rong1;~Jia_Li4;~An_Bian1", "aff": "Hong Kong University of Science and Technology;Hong Kong University of Science and Technology;Tencent AI Lab;Tencent AI Lab;Hong Kong University of Science and Technology (Guangzhou);Tencent AI Lab", "aff_domain": "connect.hkust-gz.edu.cn;ust.hk;tencent.com;tencent.com;ust.hk;tencent.com", "position": "PhD student;PhD student;Researcher;Principal Researcher;Assistant Professor;Senior researcher ", "bibtex": "@misc{\nniu2024tradingoff,\ntitle={Trading-off Multiple Properties for Molecular Optimization},\nauthor={Yifan Niu and Ziqi Gao and Tingyang Xu and Yatao Bian and Yu Rong and Jia Li},\nyear={2024},\nurl={https://openreview.net/forum?id=7ezBaMwOqY}\n}", "github": "", "project": "", "reviewers": "8aLW;dF44;xqpc;xC4n", "site": "https://openreview.net/forum?id=7ezBaMwOqY", "pdf_size": 1983659, "rating": "3;5;5;6", "confidence": "4;4;4;2", "soundness": "2;3;3;3", "contribution": "2;3;3;3", "presentation": "3;3;3;2", "wc_summary": "114;221;132;50", "wc_strengths": "31;202;165;23", "wc_weaknesses": "269;249;372;88", "wc_questions": "31;182;10;53", "wc_review": "445;854;679;214", "wc_reply_reviewers": "363;308;85;0", "wc_reply_authors": "653;1056;863;579", "reply_reviewers": "1;1;1;0", "reply_authors": "1;3;2;2", "rating_avg": [ 4.75, 1.0897247358851685 ], "confidence_avg": [ 3.5, 0.8660254037844386 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 129.25, 61.11208963863042 ], "wc_strengths_avg": [ 105.25, 79.38631809071384 ], "wc_weaknesses_avg": [ 244.5, 101.69685344198217 ], "wc_questions_avg": [ 69.0, 66.9888050348713 ], "wc_review_avg": [ 548.0, 241.33068598916302 ], "wc_reply_reviewers_avg": [ 189.0, 150.8094824604872 ], "wc_reply_authors_avg": [ 787.75, 186.65124564277625 ], 
"reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 2.0, 0.7071067811865476 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.6622661785325219, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:__VbIQAApc8J:scholar.google.com/&scioq=Trading-off+Multiple+Properties+for+Molecular+Optimization&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;1;1;0;1", "aff_unique_norm": "Hong Kong University of Science and Technology;Tencent", "aff_unique_dep": ";Tencent AI Lab", "aff_unique_url": "https://www.ust.hk;https://ai.tencent.com", "aff_unique_abbr": "HKUST;Tencent AI Lab", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Hong Kong SAR;", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "China" }, { "id": "7ffJo4vtTY", "title": "Robust multimodal models have outlier features and encode more concepts", "track": "main", "status": "Reject", "tldr": "", "abstract": "What distinguishes robust models from non-robust ones? This question has gained traction with the appearance of large-scale multimodal models, such as CLIP. These models have demonstrated unprecedented robustness with respect to natural distribution shifts. While it has been shown that such differences in robustness can be traced back to differences in training data, so far it is not known what that translates to in terms of what the model has learned. In this work, we bridge this gap by probing the representation spaces of 12 robust multimodal models with various backbones (ResNets and ViTs) and pretraining sets (OpenAI, LAION-400M, LAION-2B, YFCC15M, CC12M and DataComp). We find two signatures of robustness in the representation spaces of these models: (1) Robust models exhibit outlier features characterized by their activations, with some being several orders of magnitude above average. These outlier features induce privileged directions in the model's representation space. We demonstrate that these privileged directions explain most of the predictive power of the model by pruning up to $80 \\\\%$ of the least important representation space directions without negative impacts on model accuracy and robustness; (2) Robust models encode substantially more concepts in their representation space. While this superposition of concepts allows robust models to store much information, it also results in highly polysemantic features, which makes their interpretation challenging. 
We discuss how these insights pave the way for future research in various fields, such as model pruning and mechanistic interpretability.", "keywords": "interpretability;explainability;robustness", "primary_area": "visualization or interpretation of learned representations", "supplementary_material": "", "author": "Jonathan Crabb\u00e9;Pau Rodriguez;Vaishaal Shankar;Luca Zappella;Arno Blaas", "authorids": "~Jonathan_Crabb\u00e91;~Pau_Rodriguez2;~Vaishaal_Shankar1;~Luca_Zappella1;~Arno_Blaas1", "gender": "M;M;;;M", "homepage": "https://jonathancrabbe.github.io/;http://www.cis.jhu.edu/~luca/;https://github.com/arblox/;https://prlz77.github.io;http://vaishaal.com", "dblp": "278/8353.html;38/2520;;190/7735;159/3628", "google_scholar": "Y_Nmd2sAAAAJ;bmh6mxAAAAAJ;;https://scholar.google.es/citations?user=IwBx73wAAAAJ;", "orcid": "0000-0002-0341-7712;;;0000-0002-1689-8084;", "linkedin": "jonathan-crabb%C3%A9-4ab5701a5/;zappella?trk=people-guest_profile-result-card_result-card_full-click;;;", "or_profile": "~Jonathan_Crabb\u00e91;~Luca_Zappella1;~Arno_Blaas1;~Pau_Rodriguez_Lopez1;~vaishaal_naanny_shankar1", "aff": "University of Cambridge;Apple;Apple;Apple;Apple", "aff_domain": "cam.ac.uk;apple.com;apple.com;apple.com;apple.com", "position": "PhD student;Principal Researcher;Researcher;Researcher;Researcher", "bibtex": "@misc{\ncrabb{\\'e}2024robust,\ntitle={Robust multimodal models have outlier features and encode more concepts},\nauthor={Jonathan Crabb{\\'e} and Pau Rodriguez and Vaishaal Shankar and Luca Zappella and Arno Blaas},\nyear={2024},\nurl={https://openreview.net/forum?id=7ffJo4vtTY}\n}", "github": "", "project": "", "reviewers": "8h4M;KW5N;qBSE;YHoY", "site": "https://openreview.net/forum?id=7ffJo4vtTY", "pdf_size": 2238262, "rating": "5;5;6;8", "confidence": "3;1;3;4", "soundness": "1;2;3;4", "contribution": "2;2;2;3", "presentation": "3;2;3;3", "wc_summary": "103;25;163;63", "wc_strengths": "161;30;297;94", "wc_weaknesses": "649;90;245;64", "wc_questions": "105;2;143;90", "wc_review": "1018;147;848;311", "wc_reply_reviewers": "187;0;66;0", "wc_reply_authors": "2177;959;2389;940", "reply_reviewers": "1;0;2;0", "reply_authors": "5;3;6;2", "rating_avg": [ 6.0, 1.224744871391589 ], "confidence_avg": [ 2.75, 1.0897247358851685 ], "soundness_avg": [ 2.5, 1.118033988749895 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 88.5, 51.09549882328188 ], "wc_strengths_avg": [ 145.5, 98.97600719366285 ], "wc_weaknesses_avg": [ 262.0, 233.9048952031573 ], "wc_questions_avg": [ 85.0, 51.66720429827803 ], "wc_review_avg": [ 581.0, 361.7713366202469 ], "wc_reply_reviewers_avg": [ 63.25, 76.35893857303151 ], "wc_reply_authors_avg": [ 1616.25, 670.9833734899845 ], "reply_reviewers_avg": [ 0.75, 0.82915619758885 ], "reply_authors_avg": [ 4.0, 1.5811388300841898 ], "replies_avg": [ 26, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.7492686492653551, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=1179695393162082103&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 2, "aff_unique_index": "0;1;1;1;1", "aff_unique_norm": "University of Cambridge;Apple", "aff_unique_dep": ";Apple Inc.", "aff_unique_url": "https://www.cam.ac.uk;https://www.apple.com", "aff_unique_abbr": "Cambridge;Apple", "aff_campus_unique_index": "0", "aff_campus_unique": "Cambridge;", "aff_country_unique_index": "0;1;1;1;1", "aff_country_unique": "United Kingdom;United States" }, { "id": "7fwzPsn1lJ", "title": "LLark: A 
Multimodal Foundation Model for Music", "track": "main", "status": "Reject", "tldr": "", "abstract": "Music has a unique and complex structure which is challenging for both expert humans and existing AI systems to understand, and presents unique challenges relative to other forms of audio. \nWe present LLark, an instruction-tuned multimodal model for music understanding. We detail our process for dataset creation, which involves augmenting the annotations of diverse open-source music datasets and converting them to a unified instruction-tuning format. We propose a multimodal architecture for LLark, integrating a pretrained generative model for music with a pretrained language model. \nIn evaluations on three types of tasks (music understanding, captioning, and reasoning), we show that our model outperforms existing baselines in zero-shot generalization for music understanding, and that humans show a high degree of agreement with the model's responses in captioning and reasoning tasks. LLark is trained entirely from open-source music data and models, and we make our training code available along with the release of this paper.\nAdditional results and audio examples are at https://bit.ly/3ZyzbGG .", "keywords": "multimodal;music;MIR;music captioning", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/7e2f04752908ad969e6f6b23cea8a9708cfdfe76.zip", "author": "Joshua P Gardner;Simon Durand;Daniel Stoller;Rachel M Bittner", "authorids": "~Joshua_P_Gardner1;~Simon_Durand1;~Daniel_Stoller1;~Rachel_M_Bittner1", "gender": ";M;;", "homepage": ";https://scholar.google.com/citations?user=N2oBCKkAAAAJ&hl=en&oi=ao;;", "dblp": ";;;", "google_scholar": ";;;pXn1kQEAAAAJ", "orcid": ";;;", "linkedin": ";;;", "or_profile": "~Joshua_P_Gardner1;~Simon_Durand1;~Daniel_Stoller1;~Rachel_M_Bittner1", "aff": ";;Queen Mary University London;Spotify", "aff_domain": ";;qmul.ac.uk;spotify.com", "position": ";;PhD student;Researcher", "bibtex": "@misc{\ngardner2024llark,\ntitle={{LL}ark: A Multimodal Foundation Model for Music},\nauthor={Joshua P Gardner and Simon Durand and Daniel Stoller and Rachel M Bittner},\nyear={2024},\nurl={https://openreview.net/forum?id=7fwzPsn1lJ}\n}", "github": "", "project": "", "reviewers": "p6wE;JrBS;zBmL;gHco", "site": "https://openreview.net/forum?id=7fwzPsn1lJ", "pdf_size": 1290670, "rating": "5;6;6;6", "confidence": "5;4;4;4", "soundness": "2;3;3;3", "contribution": "2;3;4;2", "presentation": "2;4;3;3", "wc_summary": "138;47;72;105", "wc_strengths": "88;50;88;30", "wc_weaknesses": "1082;352;709;24", "wc_questions": "180;38;209;28", "wc_review": "1488;487;1078;187", "wc_reply_reviewers": "554;49;0;0", "wc_reply_authors": "3677;1229;3454;1624", "reply_reviewers": "1;1;0;0", "reply_authors": "8;4;7;5", "rating_avg": [ 5.75, 0.4330127018922193 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.82915619758885 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 90.5, 34.2819194328439 ], "wc_strengths_avg": [ 64.0, 25.019992006393608 ], "wc_weaknesses_avg": [ 541.75, 394.94073922551974 ], "wc_questions_avg": [ 113.75, 81.47507287508247 ], "wc_review_avg": [ 810.0, 505.9560257571798 ], "wc_reply_reviewers_avg": [ 150.75, 233.67431929931882 ], "wc_reply_authors_avg": [ 2496.0, 1081.4571188909897 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 6.0, 1.5811388300841898 ], "replies_avg": [ 33, 0 ], 
"authors#_avg": [ 4, 0 ], "corr_rating_confidence": -1.0, "gs_citation": 33, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10782095578294234543&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 0, "aff_unique_index": "0;1", "aff_unique_norm": "Queen Mary University of London;Spotify", "aff_unique_dep": ";", "aff_unique_url": "https://www.qmul.ac.uk;https://www.spotify.com", "aff_unique_abbr": "QMUL;Spotify", "aff_campus_unique_index": "0", "aff_campus_unique": "London;", "aff_country_unique_index": "0;1", "aff_country_unique": "United Kingdom;Sweden" }, { "id": "7fxzVTSgZC", "title": "Offline Imitation Learning without Auxiliary High-quality Behavior Data", "track": "main", "status": "Reject", "tldr": "", "abstract": "In this work, we study the problem of Offline Imitation Learning (OIL), where an agent aims to learn from the demonstrations composed of expert behaviors and sub-optimal behaviors without additional online environment interactions. Previous studies typically assume that there is high-quality behavioral data mixed in the auxiliary offline data and seriously degrades when only low-quality data from an off-policy distribution is available. In this work, we break through the bottleneck of OIL relying on auxiliary high-quality behavior data and make the first attempt to demonstrate that low-quality data is also helpful for OIL. Specifically, we utilize the transition information from offline data to maximize the policy transition probability towards expert-observed states. This guidance can improve long-term returns on states that are not observed by experts when reward signals are not available, ultimately enabling imitation learning to benefit from low-quality data. We instantiate our proposition in a simple but effective algorithm, Behavioral Cloning with Dynamic Programming (BCDP), which involves executing behavioral cloning on the expert data and dynamic programming on the unlabeled offline data respectively. 
In the experiments on benchmark tasks, unlike most existing offline imitation learning methods that do not utilize low-quality data sufficiently, our BCDP algorithm can still achieve an average performance gain of more than 40\\% even when the offline data is purely random exploration.", "keywords": "imitation learning;offline imitation learning;offline reinforcement learning", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/3d5912eba6101f92028da8bad15680f502afd76a.zip", "author": "Jie-Jing Shao;Hao-Sen Shi;Tian Xu;Lan-Zhe Guo;Yang Yu;Yu-Feng Li", "authorids": "~Jie-Jing_Shao1;~Hao-Sen_Shi1;~Tian_Xu2;~Lan-Zhe_Guo2;~Yang_Yu5;~Yu-Feng_Li1", "gender": "M;M;M;M;M;M", "homepage": "http://www.lamda.nju.edu.cn/shaojj/;http://www.lamda.nju.edu.cn/xut/;http://www.lamda.nju.edu.cn/guolz;https://www.lamda.nju.edu.cn/shihs/;http://www.lamda.nju.edu.cn/yuy;https://cs.nju.edu.cn/liyf/index.htm", "dblp": "299/4982;07/2985-3;216/4845;;46/2181-1;57/413", "google_scholar": "k1tEDpQAAAAJ;e5mnk1wAAAAJ;dpunvqgAAAAJ;;PG2lDSwAAAAJ;https://scholar.google.com/citations?hl=en", "orcid": "0000-0001-8107-114X;;;;;0000-0002-2220-5248", "linkedin": ";;;;;", "or_profile": "~Jie-Jing_Shao1;~Tian_Xu2;~Lan-Zhe_Guo2;~Haosen_Shi2;~Yang_Yu2;~Yu-feng_Li2", "aff": "Nanjing University;Nanjing University;Nanjing University;Nanjing University;Nanjing University;Nanjing University", "aff_domain": "nju.edu.cn;nju.edu.cn;nju.edu.cn;nju.edu.cn;nju.edu.cn;nju.edu.cn", "position": "PhD student;PhD student;Assistant Professor;MS student;Professor;Assistant Professor", "bibtex": "@misc{\nshao2024offline,\ntitle={Offline Imitation Learning without Auxiliary High-quality Behavior Data},\nauthor={Jie-Jing Shao and Hao-Sen Shi and Tian Xu and Lan-Zhe Guo and Yang Yu and Yu-Feng Li},\nyear={2024},\nurl={https://openreview.net/forum?id=7fxzVTSgZC}\n}", "github": "", "project": "", "reviewers": "K5Tt;uGnS;Yds8;Xzkb", "site": "https://openreview.net/forum?id=7fxzVTSgZC", "pdf_size": 4346384, "rating": "5;6;6;8", "confidence": "4;3;4;4", "soundness": "2;3;3;3", "contribution": "2;3;3;3", "presentation": "2;3;3;4", "wc_summary": "90;105;133;89", "wc_strengths": "14;61;238;106", "wc_weaknesses": "479;316;27;168", "wc_questions": "124;129;59;13", "wc_review": "707;611;457;376", "wc_reply_reviewers": "386;56;28;0", "wc_reply_authors": "2060;946;234;91", "reply_reviewers": "2;1;1;0", "reply_authors": "4;2;1;1", "rating_avg": [ 6.25, 1.0897247358851685 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 104.25, 17.76759691123141 ], "wc_strengths_avg": [ 104.75, 83.5265676297069 ], "wc_weaknesses_avg": [ 247.5, 168.2446135839124 ], "wc_questions_avg": [ 81.25, 48.11639533464659 ], "wc_review_avg": [ 537.75, 129.1266335811478 ], "wc_reply_reviewers_avg": [ 117.5, 156.2777975273519 ], "wc_reply_authors_avg": [ 832.75, 779.0479365867033 ], "reply_reviewers_avg": [ 1.0, 0.7071067811865476 ], "reply_authors_avg": [ 2.0, 1.224744871391589 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.13245323570650439, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10838255184797337773&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 0, "aff_unique_index": "0;0;0;0;0;0", "aff_unique_norm": "Nanjing University", "aff_unique_dep": "", "aff_unique_url": "https://www.nju.edu.cn", "aff_unique_abbr": "Nanjing U", 
"aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "China" }, { "title": "Belief-Enriched Pessimistic Q-Learning against Adversarial State Perturbations", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19351", "id": "7gDENzTzw1", "author_site": "Xiaolin Sun, Zizhan Zheng", "tldr": "", "abstract": "Reinforcement learning (RL) has achieved phenomenal success in various domains. However, its data-driven nature also introduces new vulnerabilities that can be exploited by malicious opponents. Recent work shows that a well-trained RL agent can be easily manipulated by strategically perturbing its state observations at the test stage. Existing solutions either introduce a regularization term to improve the smoothness of the trained policy against perturbations or alternatively train the agent's policy and the attacker's policy. However, the former does not provide sufficient protection against strong attacks, while the latter is computationally prohibitive for large environments. In this work, we propose a new robust RL algorithm for deriving a pessimistic policy to safeguard against an agent's uncertainty about true states. This approach is further enhanced with belief state inference and diffusion-based state purification to reduce uncertainty. Empirical results show that our approach obtains superb performance under strong attacks and has a comparable training overhead with regularization-based methods. Our code is available at https://github.com/SliencerX/Belief-enriched-robust-Q-learning.", "keywords": "Reinforcement Learning;Robustness;Adversarial Attack;Adversarial Defense", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/fc5a3b1becca02090173a605a76086e275a0e612.zip", "author": "Xiaolin Sun;Zizhan Zheng", "authorids": "~Xiaolin_Sun1;~Zizhan_Zheng1", "gender": "M;M", "homepage": "https://xsun01.wixsite.com/mysite-1;https://www.cs.tulane.edu/~zzheng3/", "dblp": "26/;23/286", "google_scholar": "6VM5rAYAAAAJ;B1v2AUYAAAAJ", "orcid": ";", "linkedin": ";", "or_profile": "~Xiaolin_Sun1;~Zizhan_Zheng1", "aff": "Tulane University;Tulane University", "aff_domain": "tulane.edu;tulane.edu", "position": "PhD student;Associate Professor", "bibtex": "@inproceedings{\nsun2024beliefenriched,\ntitle={Belief-Enriched Pessimistic Q-Learning against Adversarial State Perturbations},\nauthor={Xiaolin Sun and Zizhan Zheng},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=7gDENzTzw1}\n}", "github": "", "project": "", "reviewers": "achV;cDHy;GsDy;QHWx", "pdf_size": 663907, "rating": "5;6;6;8", "confidence": "4;2;2;4", "soundness": "2;3;3;3", "contribution": "3;3;2;4", "presentation": "3;3;3;3", "wc_summary": "64;46;76;64", "wc_strengths": "55;19;47;28", "wc_weaknesses": "112;12;40;57", "wc_questions": "39;130;66;2", "wc_review": "270;207;229;151", "wc_reply_reviewers": "131;0;21;21", "wc_reply_authors": "1224;989;480;406", "reply_reviewers": "1;0;1;1", "reply_authors": "3;3;2;1", "rating_avg": [ 6.25, 1.0897247358851685 ], "confidence_avg": [ 3.0, 1.0 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 3.0, 0.7071067811865476 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 62.5, 10.712142642814275 ], "wc_strengths_avg": [ 37.25, 14.394009170484782 ], "wc_weaknesses_avg": [ 55.25, 36.49229370702806 ], "wc_questions_avg": [ 59.25, 46.74064077438391 ], "wc_review_avg": [ 
214.25, 42.949825377991935 ], "wc_reply_reviewers_avg": [ 43.25, 51.38275488916491 ], "wc_reply_authors_avg": [ 774.75, 342.9951712488093 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 2.25, 0.82915619758885 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.2294157338705618, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:PeTPByT4qxQJ:scholar.google.com/&scioq=Belief-Enriched+Pessimistic+Q-Learning+against+Adversarial+State+Perturbations&hl=en&as_sdt=0,33", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=7gDENzTzw1", "pdf": "https://openreview.net/pdf?id=7gDENzTzw1", "email": "tulane.edu;tulane.edu", "author_num": 2, "aff_unique_index": "0;0", "aff_unique_norm": "Tulane University", "aff_unique_dep": "", "aff_unique_url": "https://www.tulane.edu", "aff_unique_abbr": "Tulane", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "title": "Proper Laplacian Representation Learning", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19350", "id": "7gLfQT52Nn", "author_site": "Diego Gomez, Michael Bowling, Marlos C. Machado", "tldr": "", "abstract": "The ability to learn good representations of states is essential for solving large reinforcement learning problems, where exploration, generalization, and transfer are particularly challenging. The _Laplacian representation_ is a promising approach to address these problems by inducing informative state encoding and intrinsic rewards for temporally-extended action discovery and reward shaping. To obtain the Laplacian representation one needs to compute the eigensystem of the graph Laplacian, which is often approximated through optimization objectives compatible with deep learning approaches. These approximations, however, depend on hyperparameters that are impossible to tune efficiently, converge to arbitrary rotations of the desired eigenvectors, and are unable to accurately recover the corresponding eigenvalues. In this paper we introduce a theoretically sound objective and corresponding optimization algorithm for approximating the Laplacian representation. Our approach naturally recovers both the true eigenvectors and eigenvalues while eliminating the hyperparameter dependence of previous approximations. We provide theoretical guarantees for our method and we show that those results translate empirically into robust learning across multiple environments.", "keywords": "Reinforcement learning;Graph Laplacian;Representation learning;Augmented Lagrangian optimization;Hyperparameter robustness", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Diego Gomez;Michael Bowling;Marlos C. 
Machado", "authorids": "~Diego_Gomez1;~Michael_Bowling1;~Marlos_C._Machado1", "gender": "M;M;M", "homepage": ";https://webdocs.cs.ualberta.ca/~bowling/;https://webdocs.cs.ualberta.ca/~machado/", "dblp": ";71/5161;21/10949", "google_scholar": "wj8Edy4AAAAJ;https://scholar.google.ca/citations?user=PYtPCHoAAAAJ;https://scholar.google.ca/citations?user=xf_n4xUAAAAJ", "orcid": "0000-0002-4625-233X;;", "linkedin": ";;cholodovskis/", "or_profile": "~Diego_Gomez1;~Michael_Bowling1;~Marlos_C._Machado1", "aff": "University of Alberta;Department of Computing Science, University of Alberta;University of Alberta", "aff_domain": "ualberta.ca;cs.ualberta.ca;ualberta.ca", "position": "Researcher;Full Professor;Assistant Professor", "bibtex": "@inproceedings{\ngomez2024proper,\ntitle={Proper Laplacian Representation Learning},\nauthor={Diego Gomez and Michael Bowling and Marlos C. Machado},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=7gLfQT52Nn}\n}", "github": "", "project": "", "reviewers": "DES2;tVNo;Fii6;nARE", "pdf_size": 5740877, "rating": "5;6;6;6", "confidence": "3;4;1;3", "soundness": "3;4;3;3", "contribution": "2;3;3;3", "presentation": "3;4;3;3", "wc_summary": "66;78;85;56", "wc_strengths": "70;112;11;57", "wc_weaknesses": "143;197;12;21", "wc_questions": "3;43;41;91", "wc_review": "282;430;149;225", "wc_reply_reviewers": "0;284;0;109", "wc_reply_authors": "18;743;172;710", "reply_reviewers": "0;1;0;1", "reply_authors": "1;1;1;1", "rating_avg": [ 5.75, 0.4330127018922193 ], "confidence_avg": [ 2.75, 1.0897247358851685 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 71.25, 11.121488209767612 ], "wc_strengths_avg": [ 62.5, 36.01735692690401 ], "wc_weaknesses_avg": [ 93.25, 79.15293740601166 ], "wc_questions_avg": [ 44.5, 31.22098653149833 ], "wc_review_avg": [ 271.5, 102.95751551003939 ], "wc_reply_reviewers_avg": [ 98.25, 116.10851605287185 ], "wc_reply_authors_avg": [ 410.75, 320.62234404358037 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.13245323570650439, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=15160893217759249782&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=7gLfQT52Nn", "pdf": "https://openreview.net/pdf?id=7gLfQT52Nn", "email": "ualberta.ca;cs.ualberta.ca;ualberta.ca", "author_num": 3, "aff_unique_index": "0;0;0", "aff_unique_norm": "University of Alberta", "aff_unique_dep": "", "aff_unique_url": "https://www.ualberta.ca", "aff_unique_abbr": "UAlberta", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "Canada" }, { "id": "7gUmlgc9q0", "title": "Towards More Accurate Diffusion Model Acceleration with A Timestep Aligner", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "A diffusion model, which is formulated to produce an image using thousands of denoising steps, usually suffers from a slow inference speed. Existing acceleration algorithms simplify the sampling by skipping most steps yet observe considerable performance degradation. 
By viewing the generation of diffusion models as a discretized integrating process, we argue that the quality drop is partly caused by applying an inaccurate integral direction to a timestep interval. To rectify such inaccuracy, we propose a \\textbf{timestep aligner} that helps find a more accurate integral direction for a particular interval at the minimum cost. Specifically, at each denoising step, we replace the original parameterization by conditioning the network on a new timestep, which is obtained by aligning the sampling distribution to the real distribution. Extensive experiments show that our plug-in design can be trained efficiently and boost the inference performance of various state-of-the-art acceleration methods, especially for the one with few denoising steps. For example, when using 10 denoising steps on the popular LSUN Bedroom dataset, we improve the FID of DDIM from 9.65 to 6.07, simply by adopting our method for a more appropriate set of timesteps. Code will be made publicly available.", "keywords": "Generative model;diffusion model", "primary_area": "generative models", "supplementary_material": "", "author": "Mengfei Xia;Yujun Shen;Changsong Lei;Yu Zhou;Ran Yi;Deli Zhao;Wenping Wang;Yong-jin Liu", "authorids": "~Mengfei_Xia1;~Yujun_Shen1;~Changsong_Lei2;~Yu_Zhou17;~Ran_Yi1;~Deli_Zhao1;~Wenping_Wang1;~Yong-jin_Liu1", "gender": "M;;M;M;F;M;M;M", "homepage": "https://thuxmf.github.io/;;https://github.com/lcshhh;https://scholar.google.com/citations?hl=zh-CN&user=pMXjhxkAAAAJ;https://yiranran.github.io/;https://zhaodeli.github.io;https://engineering.tamu.edu/cse/profiles/Wang-Wenping.html;https://cg.cs.tsinghua.edu.cn/people/~Yongjin/Yongjin.htm", "dblp": "301/3569;;;;136/5469;77/1992;;27/2098", "google_scholar": "jmOlxQ0AAAAJ;;;;https://scholar.google.com.hk/citations?user=y68DLo4AAAAJ;https://scholar.google.com/citations?hl=en;28shvv0AAAAJ;https://scholar.google.com.tw/citations?user=GNDtwWQAAAAJ", "orcid": ";;;;0000-0003-1858-3358;0000-0002-8838-578X;0000-0002-2284-3952;0000-0001-5774-1916", "linkedin": ";;;;;;;", "or_profile": "~Mengfei_Xia1;~Yujun_Shen1;~Changsong_Lei2;~Yu_Zhou17;~Ran_Yi1;~Deli_Zhao1;~Wenping_Wang1;~Yong-jin_Liu1", "aff": "Tsinghua University;;Tsinghua University;Tsinghua University;Shanghai Jiaotong University;Alibaba Group;Texas A&M University - College Station;Tsinghua University", "aff_domain": "tsinghua.edu.cn;;tsinghua.edu.cn;tsinghua.edu.cn;sjtu.edu.cn;alibaba-inc.com;tamu.edu;tsinghua.edu.cn", "position": "PhD student;;PhD student;Undergrad student;Assistant Professor;Director;Full Professor;Full Professor", "bibtex": "@misc{\nxia2024towards,\ntitle={Towards More Accurate Diffusion Model Acceleration with A Timestep Aligner},\nauthor={Mengfei Xia and Yujun Shen and Changsong Lei and Yu Zhou and Ran Yi and Deli Zhao and Wenping Wang and Yong-jin Liu},\nyear={2024},\nurl={https://openreview.net/forum?id=7gUmlgc9q0}\n}", "github": "", "project": "", "reviewers": "koqD;n1ad;j67R", "site": "https://openreview.net/forum?id=7gUmlgc9q0", "pdf_size": 3979255, "rating": "3;3;5", "confidence": "4;4;2", "soundness": "2;2;3", "contribution": "1;2;2", "presentation": "2;3;3", "wc_summary": "75;67;49", "wc_strengths": "20;59;25", "wc_weaknesses": "424;251;114", "wc_questions": "2;39;3", "wc_review": "521;416;191", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 3.6666666666666665, 0.9428090415820634 ], "confidence_avg": [ 3.3333333333333335, 0.9428090415820634 ], 
"soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 1.6666666666666667, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 63.666666666666664, 10.873004286866726 ], "wc_strengths_avg": [ 34.666666666666664, 17.326921891156033 ], "wc_weaknesses_avg": [ 263.0, 126.8411079526928 ], "wc_questions_avg": [ 14.666666666666666, 17.21110752456745 ], "wc_review_avg": [ 376.0, 137.65899897936205 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 3, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": -1.0, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10405448026401765017&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "aff_unique_index": "0;0;0;1;2;3;0", "aff_unique_norm": "Tsinghua University;Shanghai Jiao Tong University;Alibaba Group;Texas A&M University", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.tsinghua.edu.cn;https://www.sjtu.edu.cn;https://www.alibaba.com;https://www.tamu.edu", "aff_unique_abbr": "THU;SJTU;Alibaba;TAMU", "aff_campus_unique_index": "1", "aff_campus_unique": ";College Station", "aff_country_unique_index": "0;0;0;0;0;1;0", "aff_country_unique": "China;United States" }, { "title": "EQA-MX: Embodied Question Answering using Multimodal Expression", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19349", "id": "7gUrYE50Rb", "author_site": "Md Mofijul Islam, Alexi Gladstone, Riashat Islam, Tariq Iqbal", "tldr": "", "abstract": "Humans predominantly use verbal utterances and nonverbal gestures (e.g., eye gaze and pointing gestures) in their natural interactions. For instance, pointing gestures and verbal information is often required to comprehend questions such as \"what object is that?\" Thus, this question-answering (QA) task involves complex reasoning of multimodal expressions (verbal utterances and nonverbal gestures). However, prior works have explored QA tasks in non-embodied settings, where questions solely contain verbal utterances from a single verbal and visual perspective. In this paper, we have introduced 8 novel embodied question answering (EQA) tasks to develop learning models to comprehend embodied questions with multimodal expressions. We have developed a novel large-scale dataset, EQA-MX, with over 8 million diverse embodied QA data samples involving multimodal expressions from multiple visual and verbal perspectives. To learn salient multimodal representations from discrete verbal embeddings and continuous wrapping of multiview visual representations, we propose a vector-quantization (VQ) based multimodal representation learning model, VQ-Fusion, for the EQA tasks. 
Our extensive experimental results suggest that VQ-Fusion can improve the performance of existing state-of-the-art visual-language models up to 13% across EQA tasks.", "keywords": "multimodal representation learning;visual-language models;embodied question answering", "primary_area": "datasets and benchmarks", "supplementary_material": "", "author": "Md Mofijul Islam;Alexi Gladstone;Riashat Islam;Tariq Iqbal", "authorids": "~Md_Mofijul_Islam1;~Alexi_Gladstone1;~Riashat_Islam1;~Tariq_Iqbal1", "gender": "M;M;M;", "homepage": "http://mmiakashs.github.io;https://alexiglad.github.io/;https://riashat.github.io/;http://www.tiqbal.com", "dblp": "271/8379;346/0923;198/0459;159/0463", "google_scholar": "FYy4ZxYAAAAJ;j9Cx6PcAAAAJ;https://scholar.google.ca/citations?user=2_4Rs44AAAAJ;t_ndTI4AAAAJ", "orcid": ";;;", "linkedin": "beingmiakashs;alexiglad/;;", "or_profile": "~Md_Mofijul_Islam1;~Alexi_Gladstone1;~Riashat_Islam1;~Tariq_Iqbal1", "aff": "Amazon;University of Virginia, Charlottesville;Saudi Data and AI Authority, Saudi Data and AI Authority;University of Virginia", "aff_domain": "amazon.com;virginia.edu;sdaia.gov.sa;virginia.edu", "position": "Applied Scientist;Undergrad student;Researcher;Assistant Professor", "bibtex": "@inproceedings{\nislam2024eqamx,\ntitle={{EQA}-{MX}: Embodied Question Answering using Multimodal Expression},\nauthor={Md Mofijul Islam and Alexi Gladstone and Riashat Islam and Tariq Iqbal},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=7gUrYE50Rb}\n}", "github": "", "project": "", "reviewers": "BG1y;4CbJ;9x3E;7hsY", "pdf_size": 23982438, "rating": "8;8;8;8", "confidence": "3;4;4;4", "soundness": "4;4;2;3", "contribution": "4;3;3;3", "presentation": "4;2;2;4", "wc_summary": "82;56;83;125", "wc_strengths": "99;99;96;127", "wc_weaknesses": "121;142;627;154", "wc_questions": "77;2;255;21", "wc_review": "379;299;1061;427", "wc_reply_reviewers": "36;72;419;30", "wc_reply_authors": "1135;960;4566;1050", "reply_reviewers": "1;1;2;1", "reply_authors": "7;6;14;5", "rating_avg": [ 8.0, 0.0 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 3.25, 0.82915619758885 ], "contribution_avg": [ 3.25, 0.4330127018922193 ], "presentation_avg": [ 3.0, 1.0 ], "wc_summary_avg": [ 86.5, 24.72347063015223 ], "wc_strengths_avg": [ 105.25, 12.616952880945542 ], "wc_weaknesses_avg": [ 261.0, 211.64002457002314 ], "wc_questions_avg": [ 88.75, 99.86584751555459 ], "wc_review_avg": [ 541.5, 303.39866512560667 ], "wc_reply_reviewers_avg": [ 139.25, 162.31046639080304 ], "wc_reply_authors_avg": [ 1927.75, 1524.450782249135 ], "reply_reviewers_avg": [ 1.25, 0.4330127018922193 ], "reply_authors_avg": [ 8.0, 3.5355339059327378 ], "replies_avg": [ 43, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 10, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=16387022272988085046&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 2, "openreview": "https://openreview.net/forum?id=7gUrYE50Rb", "pdf": "https://openreview.net/pdf?id=7gUrYE50Rb", "email": "amazon.com;virginia.edu;sdaia.gov.sa;virginia.edu", "author_num": 4, "aff_unique_index": "0;1;2;1", "aff_unique_norm": "Amazon;University of Virginia;Saudi Data and AI Authority", "aff_unique_dep": "Amazon.com, Inc.;;", "aff_unique_url": "https://www.amazon.com;https://www.virginia.edu;https://sdaia.gov.sa", "aff_unique_abbr": "Amazon;UVA;SDAIA", "aff_campus_unique_index": "1", "aff_campus_unique": ";Charlottesville", 
"aff_country_unique_index": "0;0;1;0", "aff_country_unique": "United States;Saudi Arabia" }, { "id": "7gVX2LxE7A", "title": "SpecAR-Net: Spectrogram Analysis and Representation Network for Time Series", "track": "main", "status": "Reject", "tldr": "", "abstract": "Time series analysis involves modeling time series to extract valuable information, which finds broad applications in domains such as device malfunction diagnosis, human activity recognition, and medical-assisted diagnosis. Representing temporal-structured samples is crucial for time series analysis tasks. Recently, several advanced deep learning models, i.e., recurrent neural networks, convolutional neural networks, and transformer-style models, have been successively applied in the field of temporal data representation, yielding notable results. Those existing methods primarily model and represent the variation patterns within time series solely in time domain. However, as a highly abstracted information entity, time series data is formed by the coupling of various patterns such as trends, seasonality, and dramatic changes (instantaneous high dynamic), it is difficult to exploit these highly coupled properties only by means of analysis in the time domain. Consequently, it would be insufficient for time-domain dependent only methods to overcome the semantic representation bottleneck or construct comprehensive feature representations of 1D time series. To this end, we present Spectrum Analysis and Representation Network (SpecAR-Net). SpecAR-Net aims at learning more comprehensive representations by modeling raw time series in time-frequency domain, where an efficient joint extraction of time-frequency features is achieved through a group of learnable 2D multi-scale parallel complex convolution blocks. 
Experimental results show that the SpecAR-Net achieves excellent performance in five major downstream tasks of time series analysis i.e., classification, anomaly detection, imputation, long- and short-term series forecasting.", "keywords": "Time series analysis;time series representation;time-frequency transformation;complex convolution", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/e39cdbb7be7beb449f1098b31f8d10e2b35451ae.pdf", "author": "Y Dong;Liwen Zhang;Youcheng Zhang;Shi Peng;Wen Chen;Zhe Ma;Xuhui Huang", "authorids": "~Y_Dong1;~Liwen_Zhang5;~Youcheng_Zhang1;~Shi_Peng2;~Wen_Chen7;~Zhe_Ma2;~Xuhui_Huang1", "gender": "M;M;F;;;M;M", "homepage": ";;;;https://scholar.google.com/citations?user=wZWfbLUAAAAJ&hl=zh-CN;https://dblp.org/pid/22/6672;", "dblp": ";94/905;;;;22/6672-1;", "google_scholar": "mb6jJaQAAAAJ;;;Z5UHCdUAAAAJ;;;https://scholar.google.com/citations?hl=en", "orcid": ";0000-0001-8457-2943;0000-0001-9762-7966;;;;", "linkedin": ";;;;;;", "or_profile": "~Y_Dong1;~Liwen_Zhang5;~Youcheng_Zhang1;~Shi_Peng2;~Wen_Chen7;~Zhe_Ma2;~Xuhui_Huang1", "aff": ";Harbin Institute of Technology;Intelligent Science and Technology Academy of CASIC;;;Intelligent science and technology academy limited of CASIC;Intelligent Science and Technology Academy of CASIC", "aff_domain": ";hit.edu.cn;casic.com.cn;;;casic.com;casic.com.cn", "position": ";Researcher;Engineer;;;Full Professor;Full Professor", "bibtex": "@misc{\ndong2024specarnet,\ntitle={Spec{AR}-Net: Spectrogram Analysis and Representation Network for Time Series},\nauthor={Y Dong and Liwen Zhang and Youcheng Zhang and Shi Peng and Wen Chen and Zhe Ma and Xuhui Huang},\nyear={2024},\nurl={https://openreview.net/forum?id=7gVX2LxE7A}\n}", "github": "", "project": "", "reviewers": "13Yj;forZ;hAhz", "site": "https://openreview.net/forum?id=7gVX2LxE7A", "pdf_size": 543364, "rating": "3;3;5", "confidence": "3;4;3", "soundness": "1;2;2", "contribution": "2;2;1", "presentation": "2;2;2", "wc_summary": "37;67;56", "wc_strengths": "18;31;45", "wc_weaknesses": "160;179;196", "wc_questions": "179;53;42", "wc_review": "394;330;339", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 3.6666666666666665, 0.9428090415820634 ], "confidence_avg": [ 3.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 1.6666666666666667, 0.4714045207910317 ], "contribution_avg": [ 1.6666666666666667, 0.4714045207910317 ], "presentation_avg": [ 2.0, 0.0 ], "wc_summary_avg": [ 53.333333333333336, 12.39175353029407 ], "wc_strengths_avg": [ 31.333333333333332, 11.025223605694151 ], "wc_weaknesses_avg": [ 178.33333333333334, 14.704496666741854 ], "wc_questions_avg": [ 91.33333333333333, 62.15214307559224 ], "wc_review_avg": [ 354.3333333333333, 28.288199345702832 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.5, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:R06JdPgvNxkJ:scholar.google.com/&scioq=SpecAR-Net:+Spectrogram+Analysis+and+Representation+Network+for+Time+Series&hl=en&as_sdt=0,33", "gs_version_total": 3, "aff_unique_index": "0;1;1;1", "aff_unique_norm": "Harbin Institute of Technology;China Aerospace Science and Industry Corporation", "aff_unique_dep": ";Intelligent Science and Technology 
Academy", "aff_unique_url": "http://www.hit.edu.cn/;http://www.casic.com.cn/", "aff_unique_abbr": "HIT;CASIC", "aff_campus_unique_index": "0", "aff_campus_unique": "Harbin;", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "China" }, { "id": "7gg2PcT4HJ", "title": "Hybrid Representation Learning Via Epistemic Graph", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "In recent years, deep models have achieved remarkable success in many vision tasks. Unfortunately, their performance largely depends on intensive training samples. In contrast, human beings typically perform hybrid learning, e.g., spontaneously integrating structured knowledge for cross-domain recognition or on a much smaller amount of data samples for few-shot learning. Thus it is very attractive to extend hybrid learning for the computer vision tasks by seamlessly integrating structured knowledge with data samples to achieve more effective representation learning. However, such a hybrid learning approach remains a great challenge due to the huge gap between the structured knowledge and the deep features (learned from data samples) on both dimensions and knowledge granularity. In this paper, a novel Epistemic Graph Layer (EGLayer) is developed to enable hybrid learning, such that the information can be exchanged more effectively between the deep features and a structured knowledge graph. Our EGLayer is composed of three major parts: (a) a local graph module to establish a local prototypical graph through the learned deep features, i.e., aligning the deep features with the structured knowledge graph at the same granularity; (b) a query aggregation model to aggregate useful information from the local graphs, and using such representations to compute their similarity with global node embeddings for final prediction; and (c) a novel correlation alignment loss function to constrain the linear consistency between the local and global adjacency matrices from both cosine similarity and Euclidean space. EGLayer is a plug-and-play module that can replace the standard linear classifier, significantly improving the performance of deep models. 
Extensive experiments have demonstrated that EGLayer can greatly enhance representation learning for the tasks of cross-domain recognition and few-shot learning, and the visualization of knowledge graphs can aid in model interpretation.", "keywords": "Representation Learning;Graph Network;Hybrid Learning", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/3c40121da7316595f08288db1e08056fe8e1939f.zip", "author": "Jin Yuan;Yang Zhang;Yangzhou Du;zhongchao shi;Xin Geng;Jianping Fan;Yong Rui", "authorids": "~Jin_Yuan2;~Yang_Zhang23;~Yangzhou_Du2;~zhongchao_shi1;~Xin_Geng1;~Jianping_Fan4;~Yong_Rui2", "gender": "M;M;M;M;M;M;M", "homepage": "https://www.researchgate.net/profile/Jin-Yuan-19;;;;http://palm.seu.edu.cn/xgeng/index.htm;;", "dblp": "98/609.html;06/6785-2;40/951.html;45/5323;;69/2360.html;r/YongRui", "google_scholar": "https://scholar.google.com.hk/citations?user=S1JGPCMAAAAJ;https://scholar.google.com/citations?hl=zh-CN;;GASgQxEAAAAJ;ZOCxkIcAAAAJ;;rCGsLtcAAAAJ", "orcid": "0000-0002-9954-0693;;;;;;", "linkedin": ";;;;;;", "or_profile": "~Jin_Yuan2;~Yang_Zhang23;~Yangzhou_Du2;~zhongchao_shi1;~Xin_Geng1;~Jianping_Fan4;~Yong_Rui2", "aff": "Southeast University, Tsinghua University;Lenovo Research, AI Lab;Lenovo;Lenovo Research;Southeast University, China;Northwest University;Lenovo", "aff_domain": "seu.edu.cn;lenovo.com;lenovo.com;lenovo.com;seu.edu.cn;nwu.edu.cn;lenovo.com", "position": "PhD student;Researcher;Researcher;Research Scientist;Professor;Full Professor;Full Professor", "bibtex": "@misc{\nyuan2024hybrid,\ntitle={Hybrid Representation Learning Via Epistemic Graph},\nauthor={Jin Yuan and Yang Zhang and Yangzhou Du and zhongchao shi and Xin Geng and Jianping Fan and Yong Rui},\nyear={2024},\nurl={https://openreview.net/forum?id=7gg2PcT4HJ}\n}", "github": "", "project": "", "reviewers": "EhZr;rxaN;kGHn", "site": "https://openreview.net/forum?id=7gg2PcT4HJ", "pdf_size": 664169, "rating": "3;3;5", "confidence": "5;3;4", "soundness": "2;2;3", "contribution": "1;1;2", "presentation": "2;1;1", "wc_summary": "61;64;50", "wc_strengths": "48;44;32", "wc_weaknesses": "121;177;177", "wc_questions": "5;148;127", "wc_review": "235;433;386", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 3.6666666666666665, 0.9428090415820634 ], "confidence_avg": [ 4.0, 0.816496580927726 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 1.3333333333333333, 0.4714045207910317 ], "presentation_avg": [ 1.3333333333333333, 0.4714045207910317 ], "wc_summary_avg": [ 58.333333333333336, 6.018490028422596 ], "wc_strengths_avg": [ 41.333333333333336, 6.79869268479038 ], "wc_weaknesses_avg": [ 158.33333333333334, 26.398653164297777 ], "wc_questions_avg": [ 93.33333333333333, 63.04671989000609 ], "wc_review_avg": [ 351.3333333333333, 84.46827149225257 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 3, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:PZfZqTSX1KcJ:scholar.google.com/&scioq=Hybrid+Representation+Learning+Via+Epistemic+Graph&hl=en&as_sdt=0,33", "gs_version_total": 2, "aff_unique_index": "0;1;2;3;0;4;2", "aff_unique_norm": "Southeast University;Lenovo Research;Lenovo Group Limited;Lenovo;Northwest 
University", "aff_unique_dep": ";AI Lab;;Research;", "aff_unique_url": "https://www.seu.edu.cn/;https://www.lenovo.com;https://www.lenovo.com;https://www.lenovo.com;https://www.nwu.edu.cn", "aff_unique_abbr": "SEU;Lenovo;Lenovo;Lenovo;NWU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0;0", "aff_country_unique": "China" }, { "id": "7hqNl9nP81", "title": "On Memorization and Privacy Risks of Sharpness Aware Minimization", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "In many recent works, there is an increased focus on designing algorithms that seek flatter optima for neural network loss optimization as there is empirical evidence that it leads to better generalization performance in many datasets. In this work, we dissect these performance gains through the lens of data memorization in overparameterized models. We define a new metric that helps us identify which data points specifically do algorithms seeking flatter optima do better when compared to vanilla SGD. We find that the generalization gains achieved by Sharpness Aware Minimization (SAM) are particularly pronounced for atypical data points, which necessitate memorization. This insight helps us unearth higher privacy risks associated with SAM, which we verify through exhaustive empirical evaluations. Finally, we propose mitigation strategies to achieve a more desirable accuracy vs privacy tradeoff.", "keywords": "SAM;privacy;memorization;generalization;sharpness aware minimization;flat minima;wider minima;sharper minima;membership inference attack", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/8936d8989ca8947a90720a34402c720b5d68dd5c.pdf", "author": "Young In Kim;Pratiksha Agrawal;Johannes Royset;Rajiv Khanna", "authorids": "~Young_In_Kim1;~Pratiksha_Agrawal2;~Johannes_Royset1;~Rajiv_Khanna1", "gender": "M;;;M", "homepage": ";;https://faculty.nps.edu/joroyset/;http://rjvak7.github.io/", "dblp": ";;;31/4624", "google_scholar": ";;vdegcWUAAAAJ;523w4w8AAAAJ", "orcid": ";;;0000-0003-1314-3126", "linkedin": "https://linkedin.com/in/kim-young-in-8034a3276/;pratiksha-agrawal-9696b5127/;;", "or_profile": "~Young_In_Kim1;~Pratiksha_Agrawal2;~Johannes_Royset1;~Rajiv_Khanna1", "aff": "Vanderbilt University;;Naval Postgraduate School;Purdue University", "aff_domain": "vanderbilt.edu;;nps.edu;purdue.edu", "position": "Undergrad student;;Full Professor;Assistant Professor", "bibtex": "@misc{\nkim2024on,\ntitle={On Memorization and Privacy Risks of Sharpness Aware Minimization},\nauthor={Young In Kim and Pratiksha Agrawal and Johannes Royset and Rajiv Khanna},\nyear={2024},\nurl={https://openreview.net/forum?id=7hqNl9nP81}\n}", "github": "", "project": "", "reviewers": "3uQd;gjgb;Dp9T;AV1Z;mP5k", "site": "https://openreview.net/forum?id=7hqNl9nP81", "pdf_size": 2034846, "rating": "3;3;5;5;5", "confidence": "4;4;3;2;3", "soundness": "2;2;2;2;2", "contribution": "3;2;2;2;2", "presentation": "1;2;3;2;3", "wc_summary": "46;135;53;104;96", "wc_strengths": "72;51;51;61;19", "wc_weaknesses": "586;448;191;113;129", "wc_questions": "2;128;2;115;16", "wc_review": "706;762;297;393;260", "wc_reply_reviewers": "0;0;0;0;0", "wc_reply_authors": "0;0;0;0;0", "reply_reviewers": "0;0;0;0;0", "reply_authors": "0;0;0;0;0", "rating_avg": [ 4.2, 0.9797958971132712 ], "confidence_avg": [ 3.2, 0.7483314773547882 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 2.2, 0.39999999999999997 ], "presentation_avg": [ 2.2, 0.7483314773547882 
], "wc_summary_avg": [ 86.8, 33.19879515886081 ], "wc_strengths_avg": [ 50.8, 17.690675509996783 ], "wc_weaknesses_avg": [ 293.4, 189.51158275947145 ], "wc_questions_avg": [ 52.6, 56.63779656731007 ], "wc_review_avg": [ 483.6, 209.75852783617643 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.8728715609439696, "gs_citation": 4, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11624328370537611340&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 4, "aff_unique_index": "0;1;2", "aff_unique_norm": "Vanderbilt University;Naval Postgraduate School;Purdue University", "aff_unique_dep": ";;", "aff_unique_url": "https://www.vanderbilt.edu;https://www.nps.edu;https://www.purdue.edu", "aff_unique_abbr": "Vanderbilt;NPS;Purdue", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "title": "Continuous-Multiple Image Outpainting in One-Step via Positional Query and A Diffusion-based Approach", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19348", "id": "7hxoYxKDTV", "author_site": "Shaofeng Zhang, Jinfa Huang, Qiang Zhou, zhibin wang, Fan Wang, Jiebo Luo, Junchi Yan", "tldr": "", "abstract": "Image outpainting aims to generate the content of an input sub-image beyond its original boundaries. It is an important task in content generation yet remains an open problem for generative models. This paper pushes the technical frontier of image outpainting in two directions that have not been resolved in literature: 1) outpainting with arbitrary and continuous multiples (without restriction), and 2) outpainting in a single step (even for large expansion multiples). Moreover, we develop a method that does not depend on a pre-trained backbone network, which is in contrast commonly required by the previous SOTA outpainting methods. The arbitrary multiple outpainting is achieved by utilizing randomly cropped views from the same image during training to capture arbitrary relative positional information. Specifically, by feeding one view and positional embeddings as queries, we can reconstruct another view. At inference, we generate images with arbitrary expansion multiples by inputting an anchor image and its corresponding positional embeddings. The one-step outpainting ability here is particularly noteworthy in contrast to previous methods that need to be performed for $N$ times to obtain a final multiple which is $N$ times of its basic and fixed multiple. We evaluate the proposed approach (called PQDiff as we adopt a diffusion-based generator as our embodiment, under our proposed \\textbf{P}ositional \\textbf{Q}uery scheme) on public benchmarks, demonstrating its superior performance over state-of-the-art approaches. Specifically, PQDiff achieves state-of-the-art FID scores on the Scenery (\\textbf{21.512}), Building Facades (\\textbf{25.310}), and WikiArts (\\textbf{36.212}) datasets. 
Furthermore, under the 2.25x, 5x and 11.7x outpainting settings, PQDiff only takes \\textbf{40.6\\%}, \\textbf{20.3\\%} and \\textbf{10.2\\%} of the time of the benchmark state-of-the-art (SOTA) method.", "keywords": "Diffusion models;image outpainting", "primary_area": "generative models", "supplementary_material": "", "author": "Shaofeng Zhang;Jinfa Huang;Qiang Zhou;zhibin wang;Fan Wang;Jiebo Luo;Junchi Yan", "authorids": "~Shaofeng_Zhang1;~Jinfa_Huang2;~Qiang_Zhou8;~zhibin_wang2;~Fan_Wang6;~Jiebo_Luo1;~Junchi_Yan2", "gender": "M;M;M;F;M;M;M", "homepage": "https://sherrylone.github.io;https://github.com/inFaaa;https://mightyzau.github.io/;;https://www.cs.rochester.edu/u/jluo/;http://thinklab.sjtu.edu.cn/;", "dblp": "132/2540;39/9426;;;25/5545;60/7949.html;", "google_scholar": "VoVVJIgAAAAJ;https://scholar.google.com/citations?hl=en;;WCRGTHsAAAAJ;CcbnBvgAAAAJ;ga230VoAAAAJ;YHzKee8AAAAJ", "orcid": ";;0000-0003-3697-9348;0000-0001-7320-1119;0000-0002-4516-9729;0000-0001-9639-7679;0000-0001-7618-7973", "linkedin": ";;;;jieboluo/;;", "or_profile": "~Shaofeng_Zhang1;~Jinfa_Huang2;~Qiang_Zhou8;~Fan_Wang6;~Jiebo_Luo3;~Junchi_Yan1;~Zhibin_Wang1", "aff": "Shanghai Jiaotong University;University of Rochester;Alibaba Group;Alibaba Group;University of Rochester;Shanghai Jiaotong University;INF Tech", "aff_domain": "sjtu.edu.cn;rochester.edu;alibaba-inc.com;alibaba-inc.com;rochester.edu;sjtu.edu.cn;inftech.ai", "position": "PhD student;PhD student;Researcher;Senior Staff Algorithm Engineer;Full Professor;Full Professor;Researcher", "bibtex": "@inproceedings{\nzhang2024continuousmultiple,\ntitle={Continuous-Multiple Image Outpainting in One-Step via Positional Query and A Diffusion-based Approach},\nauthor={Shaofeng Zhang and Jinfa Huang and Qiang Zhou and zhibin wang and Fan Wang and Jiebo Luo and Junchi Yan},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=7hxoYxKDTV}\n}", "github": "", "project": "", "reviewers": "xgEg;HK74;urTZ", "pdf_size": 4340389, "rating": "6;6;8", "confidence": "5;4;4", "soundness": "3;3;3", "contribution": "3;3;4", "presentation": "2;3;3", "wc_summary": "44;63;47", "wc_strengths": "36;118;52", "wc_weaknesses": "340;27;30", "wc_questions": "31;21;178", "wc_review": "451;229;307", "wc_reply_reviewers": "61;0;58", "wc_reply_authors": "974;230;439", "reply_reviewers": "1;0;1", "reply_authors": "3;1;2", "rating_avg": [ 6.666666666666667, 0.9428090415820634 ], "confidence_avg": [ 4.333333333333333, 0.4714045207910317 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 3.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 51.333333333333336, 8.339997335464536 ], "wc_strengths_avg": [ 68.66666666666667, 35.490217744549774 ], "wc_weaknesses_avg": [ 132.33333333333334, 146.84761565044977 ], "wc_questions_avg": [ 76.66666666666667, 71.76969338717345 ], "wc_review_avg": [ 329.0, 91.9565114605812 ], "wc_reply_reviewers_avg": [ 39.666666666666664, 28.075295585660754 ], "wc_reply_authors_avg": [ 547.6666666666666, 313.3053178964925 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 2.0, 0.816496580927726 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.4999999999999999, "gs_citation": 13, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=8223303092029418712&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "openreview": 
"https://openreview.net/forum?id=7hxoYxKDTV", "pdf": "https://openreview.net/pdf?id=7hxoYxKDTV", "email": "sjtu.edu.cn;rochester.edu;alibaba-inc.com;alibaba-inc.com;rochester.edu;sjtu.edu.cn;inftech.ai", "author_num": 7, "aff_unique_index": "0;1;2;2;1;0;3", "aff_unique_norm": "Shanghai Jiao Tong University;University of Rochester;Alibaba Group;INF Tech", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.sjtu.edu.cn;https://www.rochester.edu;https://www.alibaba.com;", "aff_unique_abbr": "SJTU;U of R;Alibaba;", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;0;0;1;0", "aff_country_unique": "China;United States;" }, { "id": "7iCUSBlOgh", "title": "Toward Generalizability of Graph-based Imputation on Bio-Medical Missing Data", "track": "main", "status": "Reject", "tldr": "", "abstract": "Recent work on graph-based imputation methods for missing features has garnered significant attention, largely due to the effectiveness of their ability to aggregate and propagate information through graph structures. However, these methods generally assume that the graph structure is readily available and manually mask the original features to simulate the scenario of missing features. This set of assumptions narrows the applicability of such techniques to real-world tabular data, where graph structure is not readily available and missing data is a prevalent issue, such as in cases involving confidential patient information. In light of this situation, and with the aim of enhancing generalizability, we propose GRASS that bridges the gap between recent graph-based imputation methods and real-world scenarios involving missing data in their initial states. Specifically, our approach begins with tabular data and employs a simple Multi-Layer Perceptron (MLP) layer to extract feature gradient, which serves as an additional resource for generating graph structures. Leveraging these gradients, we construct a graph from a feature (i.e., column) perspective and carry out column-wise feature propagation to impute missing values based on their similarity to other features. Once the feature matrix is imputed, we generate a second graph, but this time from a sample-oriented (i.e., row) perspective, which serves as the input for existing graph-based imputation models. 
We evaluate GRASS using real-world medical and bio-domain datasets, demonstrating their effectiveness and generalizability in handling versatile missing scenarios.", "keywords": "Missing Features;Graph-based Imputation;Tabular data", "primary_area": "applications to physical sciences (physics, chemistry, biology, etc.)", "supplementary_material": "", "author": "Sukwon Yun;Yunhak Oh;Junseok Lee;Xin Liu;Tsuyoshi Murata;Dongmin Hyun;Sein Kim;Tianlong Chen;Chanyoung Park", "authorids": "~Sukwon_Yun1;~Yunhak_Oh1;~Junseok_Lee1;~Xin_Liu24;~Tsuyoshi_Murata1;~Dongmin_Hyun2;~Sein_Kim1;~Tianlong_Chen1;~Chanyoung_Park1", "gender": "M;M;M;;M;;;M;M", "homepage": "https://sukwonyun.github.io/;https://yunhak0.github.io;;;https://www.net.comp.isct.ac.jp/murata.html;;http://dsail.kaist.ac.kr;https://tianlong-chen.github.io;https://dsail.kaist.ac.kr/", "dblp": "327/3464;317/6968;77/3729-2;;77/1703;;334/3935;;170/5430.html", "google_scholar": "AgqvtZkAAAAJ;SYoXjKMAAAAJ;Vn0aynYAAAAJ;;https://scholar.google.co.jp/citations?user=ws2fHhsAAAAJ;;https://scholar.google.co.kr/citations?user=qD5z_WkAAAAJ;LE3ctn0AAAAJ;lWk2LtQAAAAJ", "orcid": "0000-0002-5186-6563;0000-0002-9110-3042;0000-0003-3874-1667;;0000-0002-3818-7830;;0009-0009-9088-9491;0000-0001-7774-8197;0000-0002-5957-5816", "linkedin": ";;;;;;;tianlong-chen-783862167/;", "or_profile": "~Sukwon_Yun1;~Yunhak_Oh1;~Junseok_Lee1;~Xin_Liu24;~Tsuyoshi_Murata1;~Dongmin_Hyun2;~Sein_Kim1;~Tianlong_Chen1;~Chanyoung_Park1", "aff": "University of North Carolina at Chapel Hill;Korea Advanced Institute of Science & Technology;University of Texas Health Center at Houson;;Tokyo Institute of Technology;;Korea Advanced Institute of Science & Technology;Harvard University;Korea Advanced Institute of Science & Technology", "aff_domain": "cs.unc.edu;kaist.ac.kr;uth.tmc.edu;;titech.ac.jp;;kaist.ac.kr;harvard.edu;kaist.ac.kr", "position": "PhD student;PhD student;Researcher;;Full Professor;;PhD student;Postdoc;Assistant Professor", "bibtex": "@misc{\nyun2024toward,\ntitle={Toward Generalizability of Graph-based Imputation on Bio-Medical Missing Data},\nauthor={Sukwon Yun and Yunhak Oh and Junseok Lee and Xin Liu and Tsuyoshi Murata and Dongmin Hyun and Sein Kim and Tianlong Chen and Chanyoung Park},\nyear={2024},\nurl={https://openreview.net/forum?id=7iCUSBlOgh}\n}", "github": "", "project": "", "reviewers": "4SJf;r66i;T1VM;JSNu;Cqu6", "site": "https://openreview.net/forum?id=7iCUSBlOgh", "pdf_size": 2312914, "rating": "3;5;6;6;6", "confidence": "3;5;5;4;3", "soundness": "1;2;3;3;3", "contribution": "2;2;3;3;3", "presentation": "1;1;3;4;2", "wc_summary": "50;117;81;86;71", "wc_strengths": "15;96;13;42;76", "wc_weaknesses": "160;94;1092;147;133", "wc_questions": "15;164;40;74;3", "wc_review": "240;471;1226;349;283", "wc_reply_reviewers": "0;28;165;0;0", "wc_reply_authors": "949;3064;4788;1978;616", "reply_reviewers": "0;1;2;0;0", "reply_authors": "3;6;10;4;2", "rating_avg": [ 5.2, 1.16619037896906 ], "confidence_avg": [ 4.0, 0.8944271909999159 ], "soundness_avg": [ 2.4, 0.8 ], "contribution_avg": [ 2.6, 0.4898979485566356 ], "presentation_avg": [ 2.2, 1.16619037896906 ], "wc_summary_avg": [ 81.0, 21.82658928921328 ], "wc_strengths_avg": [ 48.4, 32.97635516548183 ], "wc_weaknesses_avg": [ 325.2, 384.0371856995101 ], "wc_questions_avg": [ 59.2, 57.762963912874135 ], "wc_review_avg": [ 513.8, 364.5421237662392 ], "wc_reply_reviewers_avg": [ 38.6, 64.12363058966639 ], "wc_reply_authors_avg": [ 2279.0, 1518.971757472798 ], "reply_reviewers_avg": [ 0.6, 0.7999999999999999 ], 
"reply_authors_avg": [ 5.0, 2.8284271247461903 ], "replies_avg": [ 36, 0 ], "authors#_avg": [ 9, 0 ], "corr_rating_confidence": 0.3834824944236852, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:6FqY728RwdUJ:scholar.google.com/&scioq=Toward+Generalizability+of+Graph-based+Imputation+on+Bio-Medical+Missing+Data&hl=en&as_sdt=0,5", "gs_version_total": 2, "aff_unique_index": "0;1;2;3;1;4;1", "aff_unique_norm": "University of North Carolina;Korea Advanced Institute of Science and Technology;University of Texas Health Science Center at Houston;Tokyo Institute of Technology;Harvard University", "aff_unique_dep": ";;;;", "aff_unique_url": "https://www.unc.edu;https://www.kaist.ac.kr;https://www.uth.edu;https://www.titech.ac.jp;https://www.harvard.edu", "aff_unique_abbr": "UNC;KAIST;UTHealth;Titech;Harvard", "aff_campus_unique_index": "0;2", "aff_campus_unique": "Chapel Hill;;Houston", "aff_country_unique_index": "0;1;0;2;1;0;1", "aff_country_unique": "United States;South Korea;Japan" }, { "id": "7ipjMIHVJt", "title": "DASFormer: Self-supervised Pretraining for Earthquake Monitoring", "track": "main", "status": "Reject", "tldr": "", "abstract": "Earthquake monitoring is a fundamental task to unravel the underlying physics of earthquakes and mitigate associated hazards for public safety. Distributed acoustic sensing, or DAS, which transforms pre-existing telecommunication cables into ultra-dense seismic networks, offers a cost-effective and scalable solution for next-generation earthquake monitoring. However, current approaches for earthquake monitoring primarily rely on supervised learning, while manually labeled DAS data is quite limited and it is difficult to obtain more annotated datasets. In this paper, we present DASFormer, a novel self-supervised pretraining technique on DAS data with a coarse-to-fine framework that models spatial-temporal signal correlation. Given the pretrained DASFormer, we treat earthquake monitoring as an anomaly detection task and demonstrate that the pretrained DASFormer can be successfully utilized as a seismic phase detector. 
Experimental results demonstrate that DASFormer is effective in terms of several evaluation metrics and outperforms state-of-the-art time-series forecasting, anomaly detection, and foundation models on several datasets in the seismic detection tasks.", "keywords": "deep learning;self-supervised learning;time series analysis;anomaly detection;earthquake monitoring", "primary_area": "applications to physical sciences (physics, chemistry, biology, etc.)", "supplementary_material": "", "author": "Qianggang Ding;Zhichao Shen;Weiqiang Zhu;Bang Liu", "authorids": "~Qianggang_Ding1;~Zhichao_Shen1;~Weiqiang_Zhu1;~Bang_Liu1", "gender": "M;M;;M", "homepage": "http://www.mrdqg.com/;https://www.whoi.edu/profile/zhichao.shen/;;http://www-labs.iro.umontreal.ca/~liubang/", "dblp": "247/1295;;;", "google_scholar": "ga3j4_oAAAAJ;oWmPQzUAAAAJ;ApsNeMkAAAAJ;lmfAnP4AAAAJ", "orcid": ";0000-0003-0458-5264;;0000-0002-9483-8984", "linkedin": ";;;bang-liu-12b66789/?originalSubdomain=ca", "or_profile": "~Qianggang_Ding1;~Zhichao_Shen1;~Weiqiang_Zhu1;~Bang_Liu1", "aff": "Universit\u00e9 de Montr\u00e9al;Woods Hole Oceanographic Institution;University of California, Berkeley;University of Montreal", "aff_domain": "umontreal.ca;whoi.edu;berkeley.edu;umontreal.ca", "position": "PhD student;Postdoc;Assistant Professor;Assistant Professor", "bibtex": "@misc{\nding2024dasformer,\ntitle={{DASF}ormer: Self-supervised Pretraining for Earthquake Monitoring},\nauthor={Qianggang Ding and Zhichao Shen and Weiqiang Zhu and Bang Liu},\nyear={2024},\nurl={https://openreview.net/forum?id=7ipjMIHVJt}\n}", "github": "", "project": "", "reviewers": "Hht1;RSrX;8ntH;gsBc", "site": "https://openreview.net/forum?id=7ipjMIHVJt", "pdf_size": 9282097, "rating": "5;5;5;6", "confidence": "4;3;5;3", "soundness": "3;3;3;2", "contribution": "2;2;3;3", "presentation": "3;3;3;3", "wc_summary": "65;20;112;79", "wc_strengths": "31;50;73;71", "wc_weaknesses": "283;83;538;459", "wc_questions": "192;75;5;98", "wc_review": "571;228;728;707", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "1160;732;1829;1037", "reply_reviewers": "0;0;0;0", "reply_authors": "2;1;3;2", "rating_avg": [ 5.25, 0.4330127018922193 ], "confidence_avg": [ 3.75, 0.82915619758885 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 69.0, 33.03785707336358 ], "wc_strengths_avg": [ 56.25, 17.137313091613866 ], "wc_weaknesses_avg": [ 340.75, 175.11478378480786 ], "wc_questions_avg": [ 92.5, 66.88235940814289 ], "wc_review_avg": [ 558.5, 200.10559712311897 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 1189.5, 400.74711477439234 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 2.0, 0.7071067811865476 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.5222329678670935, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:34S76So_WW0J:scholar.google.com/&scioq=DASFormer:+Self-supervised+Pretraining+for+Earthquake+Monitoring&hl=en&as_sdt=0,47", "gs_version_total": 0, "aff_unique_index": "0;1;2;3", "aff_unique_norm": "Universit\u00e9 de Montr\u00e9al;Woods Hole Oceanographic Institution;University of California, Berkeley;University of Montreal", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.umontreal.ca;https://www.whoi.edu;https://www.berkeley.edu;https://www.umontreal.ca", "aff_unique_abbr": "UdeM;WHOI;UC Berkeley;UM", "aff_campus_unique_index": "1", "aff_campus_unique": ";Berkeley",
"aff_country_unique_index": "0;1;1;0", "aff_country_unique": "Canada;United States" }, { "id": "7iuFxx9Ccx", "title": "Resource Efficient Test-Time Training with Slimmable Network", "track": "main", "status": "Reject", "tldr": "", "abstract": "Test-Time Training (TTT), an innovative paradigm for enhancing a model's generalization in a specific future scenario, commonly leverages self-supervised learning to adapt the model to the unlabeled test data under distribution shifts. However, previous TTT methods tend to disregard resource constraints during the deployment phase in real-world scenarios and have two fundamental shortcomings. Firstly, they are obligated to retrain adapted models when deploying across multiple devices with diverse resource limitations, causing considerable resource inefficiency. Secondly, they are incapable of coping with computational budget variations during the testing stage. To tackle these issues, we propose a resource-adaptive test-time training framework called SlimTTT, which allows for the seamless switching of different sub-networks for adaptive inference. Furthermore, we discover that different width of sub-networks can capture different views of images and these views are complementary and beneficial to the ones created by data augmentation, which is widely used in TTT. To utilize these views, we introduce Width-enhance Contrastive Learning (WCL), Logits Consistency Regularization (LCR) and Global Feature Alignment (GFA) to promote representation consistency at both feature and prediction space in a self-supervised manner, enabling networks of different widths to excel in TTT tasks. Our proposed method, SlimTTT, has achieved state-of-the-art (SOTA) results across a variety of adaptation methods and four different datasets with varying backbones. 
Remarkably, despite a significant reduction in computational complexity - over 70% less than the current SOTA method - SlimTTT continues to deliver competitive performance, rendering it highly conducive for adoption in practice.", "keywords": "Test-Time Training;Resource Efficient;Slimmable Neural Network", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/0decffc758dac0536859f1845c9bc589cdf1d853.zip", "author": "Lincan Cai;Shuang Li;Wenxuan Ma;Ling Liu", "authorids": "~Lincan_Cai1;~Shuang_Li6;~Wenxuan_Ma2;~Ling_Liu8", "gender": ";M;M;F", "homepage": "https://github.com/cailincan0129;https://shuangli.xyz;;https://github.com/llada60", "dblp": ";43/6294-8;289/0784-1;", "google_scholar": "wH-dNbAAAAAJ;VXCiAc4AAAAJ;u7aJOt8AAAAJ;", "orcid": ";0000-0001-6807-9905;0000-0001-5402-6028;", "linkedin": ";;;", "or_profile": "~Lincan_Cai1;~Shuang_Li6;~Wenxuan_Ma2;~Ling_Liu8", "aff": "Beijing Institute of Technology;Beijing Institute of Technology;Beijing Institute of Technology;Beijing Institute of Technology", "aff_domain": "bit.edu.cn;bit.edu.cn;bit.edu.cn;bit.edu.cn", "position": "MS student;Associate Professor;MS student;Undergrad student", "bibtex": "@misc{\ncai2024resource,\ntitle={Resource Efficient Test-Time Training with Slimmable Network},\nauthor={Lincan Cai and Shuang Li and Wenxuan Ma and Ling Liu},\nyear={2024},\nurl={https://openreview.net/forum?id=7iuFxx9Ccx}\n}", "github": "", "project": "", "reviewers": "yJHx;by2E;1QhS;aCQv", "site": "https://openreview.net/forum?id=7iuFxx9Ccx", "pdf_size": 765386, "rating": "5;5;6;8", "confidence": "4;4;4;3", "soundness": "1;2;3;4", "contribution": "2;2;3;3", "presentation": "3;2;3;2", "wc_summary": "92;58;332;110", "wc_strengths": "61;29;163;55", "wc_weaknesses": "152;180;169;94", "wc_questions": "12;5;67;183", "wc_review": "317;272;731;442", "wc_reply_reviewers": "0;138;222;22", "wc_reply_authors": "1404;3521;2910;1669", "reply_reviewers": "0;1;2;1", "reply_authors": "2;6;4;4", "rating_avg": [ 6.0, 1.224744871391589 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.5, 1.118033988749895 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 148.0, 107.86102168995063 ], "wc_strengths_avg": [ 77.0, 51.088159097779204 ], "wc_weaknesses_avg": [ 148.75, 33.14645531576491 ], "wc_questions_avg": [ 66.75, 71.28244875142829 ], "wc_review_avg": [ 440.5, 178.9112908678488 ], "wc_reply_reviewers_avg": [ 95.5, 89.90411558988832 ], "wc_reply_authors_avg": [ 2376.0, 871.8964961507759 ], "reply_reviewers_avg": [ 1.0, 0.7071067811865476 ], "reply_authors_avg": [ 4.0, 1.4142135623730951 ], "replies_avg": [ 27, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.9428090415820632, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:MVLhjDRX0kMJ:scholar.google.com/&scioq=Resource+Efficient+Test-Time+Training+with+Slimmable+Network&hl=en&as_sdt=0,44", "gs_version_total": 0, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "Beijing Institute of Technology", "aff_unique_dep": "", "aff_unique_url": "http://www.bit.edu.cn/", "aff_unique_abbr": "BIT", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "China" }, { "id": "7j5KWl7VtF", "title": "Exploring the Edge of Stability: Insights from a Fine-Grained Analysis of Gradient Descent in Shallow ReLU Networks", "track": "main", "status": "Withdraw", "tldr": "", "abstract": 
"Gradient descent (GD) in modern neural networks initially sharpens the loss landscape by increasing the top Hessian eigenvalues until the step size becomes unstable. Subsequently, it enters the ``Edge of Stability'' (EoS) regime, characterized by unstable step size and non-monotonic loss reduction. EoS regime challenges conventional step size wisdom, sparking recent intensive research. However, a detailed characterization of EoS within the fine-grained GD neural network training dynamics remains under-explored. This paper provides a comprehensive analysis of both the sharpening phase and the EoS regime throughout the entire GD dynamics, focusing on shallow ReLU networks with squared loss on orthogonal inputs. Our theory characterizes the evolution of the top Hessian eigenvalues and elucidates the mechanisms behind EoS training. Leveraging this analysis, we present empirical validations of our predictions regarding sharpening and EoS dynamics, contributing to a deeper understanding of neural network training processes.", "keywords": "gradient descent;edge of stability", "primary_area": "optimization", "supplementary_material": "", "author": "Junghwan Kim;Michelle YoungJin Kim;Barzan Mozafari", "authorids": "~Junghwan_Kim1;~Michelle_YoungJin_Kim1;~Barzan_Mozafari1", "gender": "M;M;F", "homepage": ";https://web.eecs.umich.edu/~mozafari/;https://cozymichelle.github.io/", "dblp": ";;", "google_scholar": "msafJ3UAAAAJ;;", "orcid": ";;", "linkedin": ";;", "or_profile": "~Junghwan_Kim1;~Barzan_Mozafari1;~Michelle_Kim2", "aff": "University of Michigan - Ann Arbor;University of Michigan;Michigan State University", "aff_domain": "umich.edu;umich.edu;msu.edu", "position": "PhD student;Associate Professor;PhD student", "bibtex": "@misc{\nkim2024exploring,\ntitle={Exploring the Edge of Stability: Insights from a Fine-Grained Analysis of Gradient Descent in Shallow Re{LU} Networks},\nauthor={Junghwan Kim and Michelle YoungJin Kim and Barzan Mozafari},\nyear={2024},\nurl={https://openreview.net/forum?id=7j5KWl7VtF}\n}", "github": "", "project": "", "reviewers": "QK5F;CLYU;xPNL;5wmW", "site": "https://openreview.net/forum?id=7j5KWl7VtF", "pdf_size": 608370, "rating": "1;3;3;3", "confidence": "3;4;5;4", "soundness": "1;1;2;1", "contribution": "2;1;1;1", "presentation": "2;2;2;1", "wc_summary": "55;56;36;188", "wc_strengths": "36;37;43;2", "wc_weaknesses": "121;319;202;2", "wc_questions": "166;8;1;7", "wc_review": "378;420;282;199", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 2.5, 0.8660254037844386 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 1.25, 0.4330127018922193 ], "contribution_avg": [ 1.25, 0.4330127018922193 ], "presentation_avg": [ 1.75, 0.4330127018922193 ], "wc_summary_avg": [ 83.75, 60.71398109167278 ], "wc_strengths_avg": [ 29.5, 16.101242188104617 ], "wc_weaknesses_avg": [ 161.0, 115.67843359935334 ], "wc_questions_avg": [ 45.5, 69.62219473702334 ], "wc_review_avg": [ 319.75, 85.80319050012068 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.816496580927726, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:mERti5tom8oJ:scholar.google.com/&scioq=Exploring+the+Edge+of+Stability:+Insights+from+a+Fine-Grained+Analysis+of+Gradient+Descent+in+Shallow+ReLU+Networks&hl=en&as_sdt=0,44", 
"gs_version_total": 0, "aff_unique_index": "0;0;1", "aff_unique_norm": "University of Michigan;Michigan State University", "aff_unique_dep": ";", "aff_unique_url": "https://www.umich.edu;https://www.msu.edu", "aff_unique_abbr": "UM;MSU", "aff_campus_unique_index": "0", "aff_campus_unique": "Ann Arbor;", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "7jUQHmz4Tq", "title": "D3AD: DYNAMIC DENOISING DIFFUSION PROBABILISTIC MODEL FOR ANOMALY DETECTION", "track": "main", "status": "Reject", "tldr": "", "abstract": "Diffusion models have found valuable applications in anomaly detection by capturing the nominal data distribution and identifying anomalies via reconstruction. Despite their merits, they struggle to localize anomalies of varying scales, especially larger anomalies like entire missing components. Addressing this, we present a novel framework that enhances the capability of diffusion models, by extending the previous introduced implicit conditioning approach \\cite{DBLP:conf/iclr/MengHSSWZE22} in three significant ways. First, we incorporate a dynamic step size computation that allows for variable noising steps in the forward process guided by an initial anomaly prediction. Second, we demonstrate that denoising an only scaled input, without any added noise, outperforms conventional denoising process. Third, we project images in a latent space to abstract away from fine details that interfere with reconstruction of large missing components. Additionally, we propose a fine-tuning mechanism that facilitates the model to effectively grasp the nuances of the target domain. Our method undergoes rigorous evaluation on two prominent anomaly detection datasets VISA and BTAD, yielding state-of-the-art performance. Importantly, our framework effectively localizes anomalies regardless of their scale, marking a pivotal advancement in diffusion-based anomaly detection. 
All code will be made public upon acceptance.", "keywords": "Anomaly Detection;Diffusion Models;Domain Adaptation;Score Based Models", "primary_area": "generative models", "supplementary_material": "/attachment/8d398527c3c4d820a8e622da38507b989203354b.zip", "author": "Justin Tebbe;Jawad Tayyub", "authorids": "~Justin_Tebbe1;~Jawad_Tayyub1", "gender": ";M", "homepage": ";", "dblp": ";161/2637", "google_scholar": ";BtS3MQsAAAAJ", "orcid": ";", "linkedin": "justin-tebbe-18a056283;jawad-tayyub-b8899a23/", "or_profile": "~Justin_Tebbe1;~Jawad_Tayyub1", "aff": "Otto-von-Guericke Universit\u00e4t Magdeburg;Endress + Hauser", "aff_domain": "ovgu.de;endress.com", "position": "MS student;AI Research Scientist", "bibtex": "@misc{\ntebbe2024dad,\ntitle={D3{AD}: {DYNAMIC} {DENOISING} {DIFFUSION} {PROBABILISTIC} {MODEL} {FOR} {ANOMALY} {DETECTION}},\nauthor={Justin Tebbe and Jawad Tayyub},\nyear={2024},\nurl={https://openreview.net/forum?id=7jUQHmz4Tq}\n}", "github": "", "project": "", "reviewers": "vjSv;Emgj;xkrq", "site": "https://openreview.net/forum?id=7jUQHmz4Tq", "pdf_size": 25497277, "rating": "3;3;3", "confidence": "5;5;5", "soundness": "1;2;2", "contribution": "1;2;2", "presentation": "2;1;2", "wc_summary": "75;72;66", "wc_strengths": "11;47;26", "wc_weaknesses": "490;122;169", "wc_questions": "25;97;49", "wc_review": "601;338;310", "wc_reply_reviewers": "503;0;180", "wc_reply_authors": "1097;381;794", "reply_reviewers": "1;0;1", "reply_authors": "2;1;2", "rating_avg": [ 3.0, 0.0 ], "confidence_avg": [ 5.0, 0.0 ], "soundness_avg": [ 1.6666666666666667, 0.4714045207910317 ], "contribution_avg": [ 1.6666666666666667, 0.4714045207910317 ], "presentation_avg": [ 1.6666666666666667, 0.4714045207910317 ], "wc_summary_avg": [ 71.0, 3.7416573867739413 ], "wc_strengths_avg": [ 28.0, 14.7648230602334 ], "wc_weaknesses_avg": [ 260.3333333333333, 163.5284548803527 ], "wc_questions_avg": [ 57.0, 29.93325909419153 ], "wc_review_avg": [ 416.3333333333333, 131.07843283910424 ], "wc_reply_reviewers_avg": [ 227.66666666666666, 208.0966655720899 ], "wc_reply_authors_avg": [ 757.3333333333334, 293.45338452450824 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 1.6666666666666667, 0.4714045207910317 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5215605692183936052&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 2, "aff_unique_index": "0;1+2", "aff_unique_norm": "Otto-von-Guericke University Magdeburg;Endress;Hauser", "aff_unique_dep": ";;", "aff_unique_url": "https://www.ovgu.de;;", "aff_unique_abbr": "OVGU;;", "aff_campus_unique_index": "0;", "aff_campus_unique": "Magdeburg;", "aff_country_unique_index": "0;", "aff_country_unique": "Germany;" }, { "id": "7jWiBAWG0b", "title": "Learning Guarantees for Non-convex Pairwise SGD with Heavy Tails", "track": "main", "status": "Reject", "tldr": "", "abstract": "In recent years, there have been a growing number of works studying the generalization properties of pairwise stochastic gradient descent (SGD) from the perspective of algorithmic stability. However, few of them devote to simultaneously studying the generalization and optimization for the non-convex setting, especially the ones with heavy-tailed gradient noise. This paper establishes the stability-based learning guarantees for non-convex, heavy-tailed pairwise SGD by investigating its generalization and optimization jointly. 
Firstly, we bound the generalization error of pairwise SGD in the general non-convex setting, after bridging the quantitative relationships between $\\ell_1$ on-average model stability and generalization error. Secondly, a refined generalization bound is established for non-convex pairwise SGD by introducing the heavy-tailed gradient noise to remove the bounded gradient assumption. Finally, the sharper error bounds for generalization and optimization are provided under the gradient dominance condition. In addition, we extend our analysis to the corresponding pairwise minibatch SGD and derive the first stability-based near-optimal generalization and optimization bounds which are consistent with many empirical observations. These theoretical results fill the learning theory gap for non-convex pairwise SGD with heavy tails.", "keywords": "Stability;generalization bound;stochastic gradient descent;pairwise learning;heavy tail", "primary_area": "learning theory", "supplementary_material": "", "author": "Jun Chen;Hong Chen;Bin Gu;Tieliang Gong;Guodong Liu;Yingjie Wang;Weifu Li", "authorids": "~Jun_Chen12;~Hong_Chen1;~Bin_Gu1;~Tieliang_Gong2;~Guodong_Liu2;~Yingjie_Wang1;~Weifu_Li1", "gender": "M;;M;;M;M;M", "homepage": "https://www.researchgate.net/profile/Jun-Chen-256;https://chenhongml.github.io/;https://mbzuai.ac.ae/study/faculty/bin-gu/;;;https://www.researchgate.net/profile/Yingjie-Wang-37;https://www.researchgate.net/profile/Weifu-Li", "dblp": ";https://dblp.uni-trier.de/pers/hd/c/Chen_0004:Hong;29/1758-1;;;33/6297-7;198/9625", "google_scholar": "GkZkdRYAAAAJ;;Vo8OgCgAAAAJ;;Xgwse5AAAAAJ;https://scholar.google.com/citations?hl=en;", "orcid": "0000-0002-9810-5171;;0000-0001-6049-1815;;;;", "linkedin": "%E5%90%9B-%E9%99%88-4a8823276/;;;;guodong-liu-56a671107/;;", "or_profile": "~Jun_Chen12;~Hong_Chen1;~Bin_Gu1;~Tieliang_Gong2;~Guodong_Liu2;~Yingjie_Wang1;~Weifu_Li1", "aff": "Huazhong Agricultural University;Huazhong Agricultural University;Mohamed bin Zayed University of Artificial Intelligence;;University of Maryland, College Park;Nanyang Technological University;Huazhong Agricultural University", "aff_domain": "hzau.edu.cn;hzau.edu.cn;mbzuai.ac.ae;;umd.edu;ntu.edu.sg;hzau.edu.cn", "position": "PhD student;Full Professor;Assistant Professor;;Postdoc;Postdoc;Associate Professor", "bibtex": "@misc{\nchen2024learning,\ntitle={Learning Guarantees for Non-convex Pairwise {SGD} with Heavy Tails},\nauthor={Jun Chen and Hong Chen and Bin Gu and Tieliang Gong and Guodong Liu and Yingjie Wang and Weifu Li},\nyear={2024},\nurl={https://openreview.net/forum?id=7jWiBAWG0b}\n}", "github": "", "project": "", "reviewers": "dGQ5;6TFb;dBNi", "site": "https://openreview.net/forum?id=7jWiBAWG0b", "pdf_size": 589245, "rating": "5;5;6", "confidence": "3;3;3", "soundness": "3;2;3", "contribution": "2;3;2", "presentation": "3;2;3", "wc_summary": "50;93;121", "wc_strengths": "41;39;76", "wc_weaknesses": "464;255;86", "wc_questions": "235;66;55", "wc_review": "790;453;338", "wc_reply_reviewers": "0;116;30", "wc_reply_authors": "1633;1746;641", "reply_reviewers": "0;1;1", "reply_authors": "4;4;3", "rating_avg": [ 5.333333333333333, 0.4714045207910317 ], "confidence_avg": [ 3.0, 0.0 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 88.0, 29.20045661743437 ], "wc_strengths_avg": [ 52.0, 16.990193249832878 ], "wc_weaknesses_avg": [ 268.3333333333333, 
154.60559138947363 ], "wc_questions_avg": [ 118.66666666666667, 82.3825763671475 ], "wc_review_avg": [ 527.0, 191.8037191158364 ], "wc_reply_reviewers_avg": [ 48.666666666666664, 49.16186417223099 ], "wc_reply_authors_avg": [ 1340.0, 496.41582032270753 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 3.6666666666666665, 0.4714045207910317 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:OA79FH0x53cJ:scholar.google.com/&scioq=Learning+Guarantees+for+Non-convex+Pairwise+SGD+with+Heavy+Tails&hl=en&as_sdt=0,14", "gs_version_total": 0, "aff_unique_index": "0;0;1;2;3;0", "aff_unique_norm": "Huazhong Agricultural University;Mohamed bin Zayed University of Artificial Intelligence;University of Maryland;Nanyang Technological University", "aff_unique_dep": ";;;", "aff_unique_url": "http://www.hzau.edu.cn/;https://mbzuai.ac.ae;https://www.umd.edu;https://www.ntu.edu.sg", "aff_unique_abbr": "HAU;MBZUAI;UMD;NTU", "aff_campus_unique_index": "1", "aff_campus_unique": ";College Park", "aff_country_unique_index": "0;0;1;2;3;0", "aff_country_unique": "China;United Arab Emirates;United States;Singapore" }, { "id": "7kKyELnAhn", "title": "Efficient Offline Preference-Based Reinforcement Learning with Transition-Dependent Discounting", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Offline preference-based reinforcement learning (OPBRL) tackles two major limitations of traditional reinforcement learning: the need for online interaction and the requirement for carefully designed reward labels. Despite recent progress, solving complex tasks with a small number of preference labels remains challenging, as the learned reward function is inaccurate when preference labels are scarce. To tackle this challenge, we first demonstrate that the inaccurate reward model predicts low-preference regions much more precisely than high-preference regions, as the former suffers less from generalization errors. By incorporating this insight with offline RL's pessimism property, we propose a novel OPBRL framework, Transition-dEpendent Discounting (TED), that excels in complex OPBRL tasks with only a small number of preference queries. TED assigns low transition-dependent discount factors to the predicted low-preference regions, which discourages the offline agent from visiting these regions and achieves higher performance.
On the challenging Meta-World MT1 tasks, TED significantly outperforms current OPBRL baselines.", "keywords": "preference-based reinforcement learning;offline reinforcement learning;RLHF;transition-dependent discounting", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/d499e23ae564a989731714cd81c6163b70aaf9ad.zip", "author": "Jin Zhang;Hao Hu;Yiqin Yang;Bo Liu;Yang Gao;Chongjie Zhang", "authorids": "~Jin_Zhang6;~Hao_Hu3;~Yiqin_Yang1;~Bo_Liu2;~Yang_Gao1;~Chongjie_Zhang1", "gender": "M;M;M;M;M;", "homepage": "http://group.iiis.tsinghua.edu.cn/~milab/person-zhangjin.html;https://mousehu.github.io;https://www.researchgate.net/profile/Yiqin-Yang-2;https://liubo-cs.github.io/;http://yang-gao.weebly.com;", "dblp": "43/6657-16;67/6924-6;180/7725;58/2670-6.html;89/4402-29;29/6693", "google_scholar": ";https://scholar.google.com/citations?hl=en;aHTi5IEAAAAJ;https://scholar.google.com/citations?hl=en;https://scholar.google.com/citations?hl=en;LjxqXycAAAAJ", "orcid": ";;;0000-0003-2519-6196;;", "linkedin": ";hao-hu-tsinghua;;bo-liu-8b2b8118/;yang-gao-45245348/;", "or_profile": "~Jin_Zhang6;~Hao_Hu3;~Yiqin_Yang1;~Bo_Liu2;~Yang_Gao1;~Chongjie_Zhang1", "aff": "Tsinghua University;Tsinghua University;Tsinghua University;Auburn University;Tsinghua University;Washington University, Saint Louis", "aff_domain": "tsinghua.edu.cn;tsinghua.edu.cn;tsinghua.edu.cn;auburn.edu;tsinghua.edu.cn;wustl.edu", "position": "PhD student;PhD student;PhD student;Assistant Professor;Assistant Professor;Associate Professor", "bibtex": "@misc{\nzhang2024efficient,\ntitle={Efficient Offline Preference-Based Reinforcement Learning with Transition-Dependent Discounting},\nauthor={Jin Zhang and Hao Hu and Yiqin Yang and Bo Liu and Yang Gao and Chongjie Zhang},\nyear={2024},\nurl={https://openreview.net/forum?id=7kKyELnAhn}\n}", "github": "", "project": "", "reviewers": "AQAk;CqDq;KeDu;wPHc", "site": "https://openreview.net/forum?id=7kKyELnAhn", "pdf_size": 744407, "rating": "1;3;3;3", "confidence": "4;4;4;4", "soundness": "2;1;2;2", "contribution": "2;3;2;2", "presentation": "2;2;3;1", "wc_summary": "86;148;59;26", "wc_strengths": "26;72;37;38", "wc_weaknesses": "138;257;104;630", "wc_questions": "27;137;68;2", "wc_review": "277;614;268;696", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 2.5, 0.8660254037844386 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 1.75, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.0, 0.7071067811865476 ], "wc_summary_avg": [ 79.75, 44.76815274277017 ], "wc_strengths_avg": [ 43.25, 17.25362280797862 ], "wc_weaknesses_avg": [ 282.25, 208.65566730860678 ], "wc_questions_avg": [ 58.5, 51.08081831764248 ], "wc_review_avg": [ 463.75, 193.4610748962178 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:YrOpRukvZLEJ:scholar.google.com/&scioq=Efficient+Offline+Preference-Based+Reinforcement+Learning+with+Transition-Dependent+Discounting&hl=en&as_sdt=0,14", "gs_version_total": 0, "aff_unique_index": "0;0;0;1;0;2", "aff_unique_norm": "Tsinghua University;Auburn University;Washington University in St. 
Louis", "aff_unique_dep": ";;", "aff_unique_url": "https://www.tsinghua.edu.cn;https://www.auburn.edu;https://wustl.edu", "aff_unique_abbr": "THU;Auburn;WUSTL", "aff_campus_unique_index": "1", "aff_campus_unique": ";Saint Louis", "aff_country_unique_index": "0;0;0;1;0;1", "aff_country_unique": "China;United States" }, { "id": "7kubdPrlRY", "title": "A PERSPECTIVE OF IMPROPER DYNAMICS ON OFFLINE MODEL-BASED PLANNING", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "By learning the dynamics model, estimating, and planning on the latent state, MuZero and its variants perform well in complex environments. However, the performance of these algorithms require an accurate dynamics model and prediction model, which may be difficult in offline reinforcement learning since the lack of interactions with the environment. Recent works attempt to use one-step rollouts to reduce the cumulative error of rollout caused by an inaccurate dynamics model. We argue that the planning issues of MuZero-type methods are mainly caused by inaccurate models. To address this issue, we propose a robust method, Constrained Offline Model-based Planning (COMP), for training dynamics or prediction models more smoothly. COMP introduces a kind of specifically designed noise to the latent state, aiming to align the value and dynamics of these states with those of states not perturbed. Our method can be combined with MuZero and its derived algorithms to improve planning performance in offline settings. Experiments show that our proposed method achieved notable performance in most Atari game tasks on RL Unplugged benchmark.", "keywords": "Offline RL;model-based RL;deep RL;planning", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Chen Zhao;Yazhe Niu;Kaixin Huang;Yu Liu;Chun Yuan", "authorids": "~Chen_Zhao8;~Yazhe_Niu1;~Kaixin_Huang1;~Yu_Liu2;~Chun_Yuan1", "gender": "M;M;M;M;M", "homepage": "https://github.com/PaParaZz1;;http://liuyu.us;https://www.sigs.tsinghua.edu.cn/fg3/105064.jhtml;", "dblp": "252/5570.html;;97/2274-15;;", "google_scholar": "P3BUrBQAAAAJ;https://scholar.google.com.hk/citations?hl=zh-CN;;https://scholar.google.com.hk/citations?user=fYdxi2sAAAAJ;https://scholar.google.com/citations?view_op=new_profile", "orcid": ";;;;", "linkedin": ";;;;", "or_profile": "~Yazhe_Niu1;~Kaixin_Huang1;~Yu_Liu2;~Chun_Yuan1;~Zhao_Chen7", "aff": "The Chinese University of Hong Kong;Electronic Engineering, Tsinghua University, Tsinghua University;SenseTime;Tsinghua University;Tsinghua University", "aff_domain": "cuhk.edu.hk;mails.tsinghua.edu.cn;sensetime.com;tsinghua.edu.cn;tsinghua.edu.cn", "position": "PhD student;MS student;Principal Researcher;Full Professor;MS student", "bibtex": "@misc{\nzhao2024a,\ntitle={A {PERSPECTIVE} {OF} {IMPROPER} {DYNAMICS} {ON} {OFFLINE} {MODEL}-{BASED} {PLANNING}},\nauthor={Chen Zhao and Yazhe Niu and Kaixin Huang and Yu Liu and Chun Yuan},\nyear={2024},\nurl={https://openreview.net/forum?id=7kubdPrlRY}\n}", "github": "", "project": "", "reviewers": "pj73;LURo;dRm8;NRcG", "site": "https://openreview.net/forum?id=7kubdPrlRY", "pdf_size": 2305251, "rating": "1;3;3;3", "confidence": "4;4;4;4", "soundness": "2;2;2;2", "contribution": "1;2;2;1", "presentation": "1;2;2;2", "wc_summary": "66;38;48;43", "wc_strengths": "30;17;68;11", "wc_weaknesses": "839;266;176;104", "wc_questions": "14;1;60;29", "wc_review": "949;322;352;187", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", 
"rating_avg": [ 2.5, 0.8660254037844386 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 1.5, 0.5 ], "presentation_avg": [ 1.75, 0.4330127018922193 ], "wc_summary_avg": [ 48.75, 10.568230693924125 ], "wc_strengths_avg": [ 31.5, 22.1641602593015 ], "wc_weaknesses_avg": [ 346.25, 290.2209287766821 ], "wc_questions_avg": [ 26.0, 21.988633427296023 ], "wc_review_avg": [ 452.5, 293.31425127327174 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:DQYVGxuANnIJ:scholar.google.com/&scioq=A+PERSPECTIVE+OF+IMPROPER+DYNAMICS+ON+OFFLINE+MODEL-BASED+PLANNING&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;1;2;1;1", "aff_unique_norm": "Chinese University of Hong Kong;Tsinghua University;SenseTime", "aff_unique_dep": ";Electronic Engineering;", "aff_unique_url": "https://www.cuhk.edu.hk;https://www.tsinghua.edu.cn;https://www.sensetime.com", "aff_unique_abbr": "CUHK;THU;SenseTime", "aff_campus_unique_index": "0", "aff_campus_unique": "Hong Kong SAR;", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "China" }, { "id": "7lmvCdD6va", "title": "P4Q: Learning to Prompt for Quantization in Visual-language Models", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Large-scale pre-trained Vision-Language Models (VLMs) have gained prominence in various visual and multimodal tasks, yet the deployment of VLMs on resource-constrained platforms remains challenging due to their prohibitive computational and memory overhead. Quantization of VLMs can substantially reduce the computational and memory costs, which are in urgent need. There are two prevailing paradigms, Quantization-Aware Training (QAT) can effectively quantize large-scale VLMs but incur a huge training cost, while low-bit Post-Training Quantization (PTQ) suffers from a notable performance drop. We propose a `Prompt for Quantization'' (P4Q) method, in which we design a lightweight architecture to leverage contrastive loss supervision to enhance the recognition performance of a PTQ model. Our method can effectively reduce the gap between image features and text features caused by low-bit quantization, based on learnable prompts to reorganize textual representations and a low-bit adapter to realign the distributions of image and text features. We also introduce a distillation loss based on cosine similarity predictions to distill the quantized model using a full-precision teacher. Extensive experimental results demonstrate that our P4Q method outperforms prior arts, even achieving comparable results to its full-precision counterparts. For instance, our 8-bit P4Q can theoretically compress the CLIP-ViT/B-32 by 4 $\\times$ while achieving 79.42\\% Top-1 accuracy, outperforming the learnable prompt fine-tuned full-precision model by 2.91\\% with negligible additional parameters on the CIFAR100 dataset. 
Test code and checkpoints are available at \\url{https://anonymous.4open.science/r/ICLR2024-P4Q-1255}", "keywords": "Quantization;Vision-Language Models (VLMs)", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Huixin Sun;Runqi Wang;Xianbin Cao;Yanjing Li;Xiaolong Jiang;Yao Hu;Baochang Zhang", "authorids": "~Huixin_Sun1;~Runqi_Wang1;~Xianbin_Cao2;~Yanjing_Li2;~Xiaolong_Jiang2;~Yao_Hu4;~Baochang_Zhang1", "gender": "F;M;M;;M;M;M", "homepage": "https://huixinsun.github.io/;;http://www.ee.buaa.edu.cn/info/1205/22851.htm;;https://dblp.org/pid/56/5097;https://dblp.uni-trier.de/pid/80/3887-1.html;", "dblp": "329/3654;266/9915;22/3485;62/201;;https://dblp.uni-trier.de/pid/80/3887-1.html;", "google_scholar": ";https://scholar.google.com.hk/citations?hl=zh-CN;;2rE-GM8AAAAJ;G0Ow8j8AAAAJ;;LIu7k7wAAAAJ", "orcid": ";;;0000-0003-3745-8755;;;0009-0006-1274-7111", "linkedin": "https://www.linkedin.cn/incareer/in/huixin-sun-52a5701a2;;;;;;", "or_profile": "~Huixin_Sun1;~Runqi_Wang1;~Xianbin_Cao2;~Yanjing_Li2;~Xiaolong_Jiang2;~Baochang_Zhang1;~Yao_Hu1", "aff": "Beihang University;Beihang University;Beihang University;Beihang University;Alibaba Group;Beihang University;Zhejiang University of Technology", "aff_domain": "buaa.edu.cn;buaa.edu.cn;buaa.edu.cn;buaa.edu.cn;alibaba-inc.com;buaa.edu.cn;zjut.edu.cn", "position": "PhD student;PhD student;Full Professor;PhD student;Research Engineer;Professor;Researcher", "bibtex": "@misc{\nsun2024pq,\ntitle={P4Q: Learning to Prompt for Quantization in Visual-language Models},\nauthor={Huixin Sun and Runqi Wang and Xianbin Cao and Yanjing Li and Xiaolong Jiang and Yao Hu and Baochang Zhang},\nyear={2024},\nurl={https://openreview.net/forum?id=7lmvCdD6va}\n}", "github": "", "project": "", "reviewers": "xyBt;X2dx;iH7g;5VdB", "site": "https://openreview.net/forum?id=7lmvCdD6va", "pdf_size": 2874160, "rating": "3;3;5;5", "confidence": "4;5;4;4", "soundness": "2;2;3;3", "contribution": "2;1;2;2", "presentation": "2;2;3;3", "wc_summary": "112;54;130;70", "wc_strengths": "53;34;72;62", "wc_weaknesses": "251;184;295;163", "wc_questions": "46;2;265;31", "wc_review": "462;274;762;326", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 91.5, 30.70423423568808 ], "wc_strengths_avg": [ 55.25, 13.988834833537782 ], "wc_weaknesses_avg": [ 223.25, 52.651566928250105 ], "wc_questions_avg": [ 86.0, 104.54903155935975 ], "wc_review_avg": [ 456.0, 189.53627621117812 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14843857089839360972&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "aff_unique_index": "0;0;0;0;1;0;2", "aff_unique_norm": "Beihang University;Alibaba Group;Zhejiang University of Technology", "aff_unique_dep": ";;", "aff_unique_url": "http://www.buaa.edu.cn/;https://www.alibaba.com;https://www.zjut.edu.cn", "aff_unique_abbr": "BUAA;Alibaba;ZJUT", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": 
"0;0;0;0;0;0;0", "aff_country_unique": "China" }, { "id": "7m5jhNXklB", "title": "VTruST : Controllable value function based subset selection for Data-Centric Trustworthy AI", "track": "main", "status": "Reject", "tldr": "", "abstract": "Trustworthy AI is crucial to the widespread adoption of AI in high-stakes applications with explainability, fairness, and robustness being some of the key trustworthiness metrics. Data-Centric AI (DCAI) aims to construct high-quality datasets for efficient training of trustworthy models. In this work, we propose a controllable framework for data-centric trustworthy AI (DCTAI)- VTruST, that allows users to control the trade-offs between the different trustworthiness metrics of the constructed training datasets. A key challenge in implementing an efficient DCTAI framework is to design an online value-function-based training data subset selection algorithm. We pose the training data valuation and subset selection problem as an online sparse approximation formulation, where the $\\textit{features}$ for each training datapoint is obtained in an online manner through an iterative training algorithm. We propose a novel online version of the OMP algorithm for solving this problem. We also derive conditions on the data matrix, that guarantee the exact recovery of the sparse solution. We demonstrate the generality and effectiveness of our approach by designing data-driven value functions for the above trustworthiness metrics. Experimental results show that VTruST outperforms the state-of-the-art baselines for fair learning as well as robust training, on standard fair and robust datasets. We also demonstrate that VTruST can provide effective tradeoffs between different trustworthiness metrics through pareto optimal fronts. Finally, we show that the data valuation generated by VTruST can provide effective data-centric explanations for different trustworthiness metrics.", "keywords": "Data centric trustworthy AI;value function;data valuation;online sparse approximation;fairness;robustness;explainability", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/d8c70fa936124b80998e8c95b94b8ae1cc8e561d.zip", "author": "Soumi Das;Shubhadip Nag;Shreyyash Sharma;Suparna Bhattacharya;Sourangshu Bhattacharya", "authorids": "~Soumi_Das1;~Shubhadip_Nag1;~Shreyyash_Sharma1;~Suparna_Bhattacharya1;~Sourangshu_Bhattacharya1", "gender": "F;M;M;F;M", "homepage": "https://soumidas.github.io/;https://nagshubhadip.github.io/;http://cse.iitkgp.ac.in/~shreyyashs/;https://www.hpe.com/psnow/doc/a00130899enw;http://cse.iitkgp.ac.in/~sourangshu/", "dblp": "252/5452;;;10/2594;http://dblp.uni-trier.de/pers/hd/b/Bhattacharya:Sourangshu", "google_scholar": "1tJnMkoAAAAJ;https://scholar.google.com/citations?hl=en;;https://scholar.google.co.in/citations?user=ubLpnh4AAAAJ;https://scholar.google.co.in/citations?user=IixRsP0AAAAJ", "orcid": ";;;0000-0001-9541-4027;", "linkedin": "soumi-das;shubhadip-nag;;suparna-bhattacharya-5a7798b/;sourangshubhattacharya", "or_profile": "~Soumi_Das1;~Shubhadip_Nag1;~Shreyyash_Sharma1;~Suparna_Bhattacharya1;~Sourangshu_Bhattacharya1", "aff": "MPI-SWS;Indian Institute of Technology, Kharagpur;;Hewlett Packard Enterprise;Indian Institute of Technology Kharagpur", "aff_domain": "mpi-sws.org;iitkgp.ac.in;;hpe.com;iitkgp.ac.in", "position": "Postdoc;MS student;;Researcher;Associate Professor", "bibtex": "@misc{\ndas2024vtrust,\ntitle={{VT}ru{ST} : Controllable value function based subset selection for Data-Centric 
Trustworthy {AI}},\nauthor={Soumi Das and Shubhadip Nag and Shreyyash Sharma and Suparna Bhattacharya and Sourangshu Bhattacharya},\nyear={2024},\nurl={https://openreview.net/forum?id=7m5jhNXklB}\n}", "github": "", "project": "", "reviewers": "FQcd;7pAq;ohGL", "site": "https://openreview.net/forum?id=7m5jhNXklB", "pdf_size": 9471762, "rating": "5;5;6", "confidence": "3;3;3", "soundness": "2;2;3", "contribution": "3;2;3", "presentation": "3;3;2", "wc_summary": "69;78;161", "wc_strengths": "41;62;30", "wc_weaknesses": "183;103;99", "wc_questions": "3;2;87", "wc_review": "296;245;377", "wc_reply_reviewers": "0;0;151", "wc_reply_authors": "383;406;1004", "reply_reviewers": "0;0;1", "reply_authors": "1;1;2", "rating_avg": [ 5.333333333333333, 0.4714045207910317 ], "confidence_avg": [ 3.0, 0.0 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 102.66666666666667, 41.41121694527811 ], "wc_strengths_avg": [ 44.333333333333336, 13.274871834493252 ], "wc_weaknesses_avg": [ 128.33333333333334, 38.689648342791756 ], "wc_questions_avg": [ 30.666666666666668, 39.83577398380617 ], "wc_review_avg": [ 306.0, 54.35071296680477 ], "wc_reply_reviewers_avg": [ 50.333333333333336, 71.18208263944578 ], "wc_reply_authors_avg": [ 597.6666666666666, 287.47444330854097 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 1.3333333333333333, 0.4714045207910317 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:vU38P9fvb6QJ:scholar.google.com/&scioq=VTruST+:+Controllable+value+function+based+subset+selection+for+Data-Centric+Trustworthy+AI&hl=en&as_sdt=0,5", "gs_version_total": 4, "aff_unique_index": "0;1;2;3", "aff_unique_norm": "Max Planck Institute for Software Systems;Indian Institute of Technology;Hewlett Packard Enterprise;Indian Institute of Technology Kharagpur", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.mpi-sws.org;https://www.iitkgp.ac.in;https://www.hpe.com;https://www.iitkgp.ac.in", "aff_unique_abbr": "MPI-SWS;IIT Kharagpur;HPE;IIT Kharagpur", "aff_campus_unique_index": "1;1", "aff_campus_unique": ";Kharagpur", "aff_country_unique_index": "0;1;2;1", "aff_country_unique": "Germany;India;United States" }, { "id": "7mR83Q12cJ", "title": "Counterfactual Data Augmentation with Contrastive Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "Statistical disparity between distinct treatment groups is one of the most significant challenges for estimating Conditional Average Treatment Effects (CATE). To address this, we introduce a model-agnostic data augmentation method that imputes the counterfactual outcomes for a selected subset of individuals. Specifically, we utilize contrastive learning to learn a representation space and a similarity measure such that in the learned representation space \\textit{close} individuals identified by the learned similarity measure have \\textit{similar} potential outcomes. This property ensures reliable imputation of counterfactual outcomes for the individuals with close neighbors from the alternative treatment group. By augmenting the original dataset with these reliable imputations, we can effectively reduce the discrepancy between different treatment groups, while inducing minimal imputation error. 
The augmented dataset is subsequently employed to train CATE estimation models. Theoretical analysis and experimental studies on synthetic and semi-synthetic benchmarks demonstrate that our method achieves significant improvements in both performance and robustness to overfitting across state-of-the-art models.", "keywords": "Data Augmentation;Contrastive Learning;Treatment Effect;Causal Inference", "primary_area": "causal reasoning", "supplementary_material": "/attachment/fd5e7459888b42e76d8e91a42b239b8b056762cb.zip", "author": "Ahmed Aloui;Juncheng Dong;Cat Phuoc Le;Vahid Tarokh", "authorids": "~Ahmed_Aloui1;~Juncheng_Dong1;~Cat_Phuoc_Le1;~Vahid_Tarokh1", "gender": "M;;M;", "homepage": ";;https://scholars.duke.edu/person/cat.le;", "dblp": "116/6738;;251/5583;", "google_scholar": ";;gSzKGdQAAAAJ;", "orcid": ";;0000-0002-9121-9395;", "linkedin": "ahmed-aloui-b06547153/;;catphuocle/;", "or_profile": "~Ahmed_Aloui1;~Juncheng_Dong1;~Cat_Phuoc_Le1;~Vahid_Tarokh1", "aff": "Duke University, Duke University;;Duke University;", "aff_domain": "ece.duke.edu;;duke.edu;", "position": "PhD student;;Postdoc;", "bibtex": "@misc{\naloui2024counterfactual,\ntitle={Counterfactual Data Augmentation with Contrastive Learning},\nauthor={Ahmed Aloui and Juncheng Dong and Cat Phuoc Le and Vahid Tarokh},\nyear={2024},\nurl={https://openreview.net/forum?id=7mR83Q12cJ}\n}", "github": "", "project": "", "reviewers": "AQb9;NLwi;Lde6;FUqM", "site": "https://openreview.net/forum?id=7mR83Q12cJ", "pdf_size": 2896223, "rating": "3;5;5;6", "confidence": "5;3;5;3", "soundness": "2;2;3;3", "contribution": "2;2;3;3", "presentation": "2;2;3;3", "wc_summary": "52;50;35;75", "wc_strengths": "6;13;29;126", "wc_weaknesses": "21;145;287;142", "wc_questions": "1024;37;31;42", "wc_review": "1103;245;382;385", "wc_reply_reviewers": "0;156;0;0", "wc_reply_authors": "1555;676;463;241", "reply_reviewers": "0;1;0;0", "reply_authors": "2;2;1;1", "rating_avg": [ 4.75, 1.0897247358851685 ], "confidence_avg": [ 4.0, 1.0 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 53.0, 14.300349646075091 ], "wc_strengths_avg": [ 43.5, 48.355454707819675 ], "wc_weaknesses_avg": [ 148.75, 94.19759816470906 ], "wc_questions_avg": [ 283.5, 427.54561160185006 ], "wc_review_avg": [ 528.75, 336.33196027139616 ], "wc_reply_reviewers_avg": [ 39.0, 67.54998149518622 ], "wc_reply_authors_avg": [ 733.75, 498.4713507314136 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.6882472016116854, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10401963946042605033&as_sdt=80000005&sciodt=0,23&hl=en", "gs_version_total": 4, "aff_unique_index": "0;0", "aff_unique_norm": "Duke University", "aff_unique_dep": "", "aff_unique_url": "https://www.duke.edu", "aff_unique_abbr": "Duke", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "id": "7n360rsYAq", "title": "Towards Dynamic Trend Filtering through Trend Points Detection with Reinforcement Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "Trend filtering simplifies complex time series data by prioritizing proximity to the original data while applying smoothness to filter out noise. 
However, the inherent smoothness of trend filtering filters out the tail distribution of time series data, characterized as extreme values, thereby failing to reflect abrupt changes in the trend. In this paper, we introduce Trend Point Detection, a novel approach to trend filtering that directly identifies essential points that should be reflected in the trend including abrupt changes. We refer to these essential points as Dynamic Trend Points (DTPs) and extract trends from connecting these points. To identify DTPs, we formalize the Trend Point Detection problem as a Markov Decision Process (MDP). We solve the Trend Point Detection problem using Reinforcement Learning (RL) algorithms operating within a discrete action space, referred to as the Dynamic Trend Filtering network (DTF-net). DTF-net incorporates flexible noise filtering, preserving important original sub-sequences while removing noise as needed for other sub-sequences. We demonstrate that DTF-net excels at capturing abrupt changes compared to other trend filtering algorithms, using synthetic data and the Nasdaq intraday dataset. Furthermore, when we utilize DTF-net's trend as an additional feature for Time Series Forecasting (TSF) in non-stationary data, we demonstrate performance improvements, as abrupt changes are captured rather than smoothed out.", "keywords": "time series analysis;trend filtering;reinforcement learning;time series forecasting", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/d1a85b8573e87c6b89a8e6a5586dd8464abdcfb9.zip", "author": "Jihyeon Seong;Sekwang Oh;Jaesik Choi", "authorids": "~Jihyeon_Seong1;~Sekwang_Oh1;~Jaesik_Choi1", "gender": "F;M;M", "homepage": "http://sailab.kaist.ac.kr/members/#GraduateStudents;;https://sailab.kaist.ac.kr/jaesik", "dblp": ";;13/1402", "google_scholar": "DdSo9q4AAAAJ;;RqMLVzUAAAAJ", "orcid": "0000-0002-3591-131X;;", "linkedin": "jihyeon-seong-302571267/;oskoskosk;", "or_profile": "~Jihyeon_Seong1;~Sekwang_Oh1;~Jaesik_Choi1", "aff": "Korea Advanced Institute of Science & Technology;Korea Advanced Institute of Science & Technology;Korea Advanced Institute of Science & Technology", "aff_domain": "kaist.ac.kr;kaist.ac.kr;kaist.ac.kr", "position": "PhD student;MS student;Associate Professor", "bibtex": "@misc{\nseong2024towards,\ntitle={Towards Dynamic Trend Filtering through Trend Points Detection with Reinforcement Learning},\nauthor={Jihyeon Seong and Sekwang Oh and Jaesik Choi},\nyear={2024},\nurl={https://openreview.net/forum?id=7n360rsYAq}\n}", "github": "", "project": "", "reviewers": "ALFQ;Fg2U;Q1zH;NMhu", "site": "https://openreview.net/forum?id=7n360rsYAq", "pdf_size": 1115341, "rating": "5;5;6;8", "confidence": "3;3;3;3", "soundness": "2;2;2;3", "contribution": "2;2;2;3", "presentation": "2;3;3;3", "wc_summary": "57;84;100;119", "wc_strengths": "49;67;118;102", "wc_weaknesses": "173;212;40;89", "wc_questions": "4;77;53;16", "wc_review": "283;440;311;326", "wc_reply_reviewers": "76;28;0;0", "wc_reply_authors": "918;1133;486;394", "reply_reviewers": "1;1;0;0", "reply_authors": "3;4;2;1", "rating_avg": [ 6.0, 1.224744871391589 ], "confidence_avg": [ 3.0, 0.0 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 90.0, 22.726636354727024 ], "wc_strengths_avg": [ 84.0, 27.358728040608906 ], "wc_weaknesses_avg": [ 128.5, 67.72185762366534 ], "wc_questions_avg": [ 37.5, 29.090376415577712 ], 
"wc_review_avg": [ 340.0, 59.76202807803631 ], "wc_reply_reviewers_avg": [ 26.0, 31.04834939252005 ], "wc_reply_authors_avg": [ 732.75, 304.2017217242532 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 2.5, 1.118033988749895 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:nl0k2DsgulMJ:scholar.google.com/&scioq=Towards+Dynamic+Trend+Filtering+through+Trend+Points+Detection+with+Reinforcement+Learning&hl=en&as_sdt=0,5", "gs_version_total": 6, "aff_unique_index": "0;0;0", "aff_unique_norm": "Korea Advanced Institute of Science and Technology", "aff_unique_dep": "", "aff_unique_url": "https://www.kaist.ac.kr", "aff_unique_abbr": "KAIST", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "South Korea" }, { "id": "7n8RzGQKnR", "title": "A Symbolic Framework for Evaluating Mathematical Reasoning with Transformers", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "This paper proposes a methodology for generating synthetic mathematical derivations via a computer algebra system to evaluate the generalisability of Transformers in symbolic and quantitative reasoning problems, and provides a general framework for building large-scale and high-quality benchmarks in the mathematical domain. In the context of classification tasks involving multi-step annotated derivations (spanning 18 mathematical operators), we leverage the framework to compare the mathematical capabilities of GPT-4, GPT-3.5, and a canon of fine-tuned BERT models, exploring the relationship between specific operators and generalisation failure. Surprisingly, the average in-distribution performance of BERT models surpasses GPT-3.5, and rivals GPT-4, yet simple data perturbations reduce BERT scores by up to 80 F1 points. The results suggest that the in-distribution performance and generalisability of smaller open-source models may potentially rival GPT in narrow mathematical domains by incorporating appropriately structured discourse-level relations during training, and highlight a shared weakness between BERT and GPT involving a relative inability to decode dependency relations involving indirect references to mathematical entities. 
We release the data generation framework along with all the resulting datasets and fine-tuned models\\footnote{\\url{https://github.com/anonymous/TBA}}.", "keywords": "mathematical reasoning;generalisation;gpt;bert;sequence classification;synthetic data;fine-tuning;few-shot learning", "primary_area": "datasets and benchmarks", "supplementary_material": "", "author": "Jordan Meadows;Marco Valentino;Damien Teney;Andre Freitas", "authorids": "~Jordan_Meadows1;~Marco_Valentino1;~Damien_Teney1;~Andre_Freitas1", "gender": "M;M;M;", "homepage": ";https://www.marcovalentino.net/;https://www.damienteney.info;http://andrefreitas.org", "dblp": ";212/3533;62/10068;47/9409.html", "google_scholar": "https://scholar.google.com/citations?hl=en;nnaBYcIAAAAJ;https://scholar.google.com.au/citations?user=iS_jP_3dpD8J;ExmHmMoAAAAJ", "orcid": ";;;", "linkedin": ";marco-valentino-844a5ab1/;;andrefreitas/", "or_profile": "~Jordan_Meadows1;~Marco_Valentino1;~Damien_Teney1;~Andre_Freitas1", "aff": "University of Manchester;Idiap Research Institute;Idiap Research Institute;University of Manchester", "aff_domain": "cs.manchester.ac.uk;idiap.ch;idiap.ch;manchester.ac.uk", "position": "PhD student;Postdoc;Researcher;Associate Professor", "bibtex": "@misc{\nmeadows2024a,\ntitle={A Symbolic Framework for Evaluating Mathematical Reasoning with Transformers},\nauthor={Jordan Meadows and Marco Valentino and Damien Teney and Andre Freitas},\nyear={2024},\nurl={https://openreview.net/forum?id=7n8RzGQKnR}\n}", "github": "", "project": "", "reviewers": "o3bz;Y9EH;RYtb;5bKm", "site": "https://openreview.net/forum?id=7n8RzGQKnR", "pdf_size": 948481, "rating": "3;3;6;6", "confidence": "3;3;3;4", "soundness": "3;2;4;3", "contribution": "2;1;3;3", "presentation": "2;1;3;4", "wc_summary": "42;75;77;164", "wc_strengths": "31;131;69;45", "wc_weaknesses": "92;482;6;51", "wc_questions": "166;102;23;1", "wc_review": "331;790;175;261", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "11;17;18;14", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 4.5, 1.5 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 2.25, 0.82915619758885 ], "presentation_avg": [ 2.5, 1.118033988749895 ], "wc_summary_avg": [ 89.5, 45.202322949158265 ], "wc_strengths_avg": [ 69.0, 38.28837943815329 ], "wc_weaknesses_avg": [ 157.75, 189.66071680767212 ], "wc_questions_avg": [ 73.0, 65.52480446365331 ], "wc_review_avg": [ 389.25, 237.8785141621664 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 15.0, 2.7386127875258306 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 8, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.5773502691896258, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:Frt3JHs3X-0J:scholar.google.com/&scioq=A+Symbolic+Framework+for+Evaluating+Mathematical+Reasoning+with+Transformers&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;1;1;0", "aff_unique_norm": "University of Manchester;Idiap Research Institute", "aff_unique_dep": ";", "aff_unique_url": "https://www.manchester.ac.uk;https://www.idiap.ch", "aff_unique_abbr": "UoM;Idiap", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;1;0", "aff_country_unique": "United Kingdom;Switzerland" }, { "title": "TimeMixer: Decomposable Multiscale Mixing for Time Series Forecasting", "status": "Poster", "track": "main", "site": 
"https://iclr.cc/virtual/2024/poster/19347", "id": "7oLshfEIC2", "author_site": "Shiyu Wang, Haixu Wu, Xiaoming Shi, Tengge Hu, Huakun Luo, Lintao Ma, James Zhang, JUN ZHOU", "tldr": "", "abstract": "Time series forecasting is widely used in extensive applications, such as traffic planning and weather forecasting. However, real-world time series usually present intricate temporal variations, making forecasting extremely challenging. Going beyond the mainstream paradigms of plain decomposition and multiperiodicity analysis, we analyze temporal variations in a novel view of multiscale-mixing, where time series present distinct patterns in different sampling scales. Specifically, the microscopic and the macroscopic information are reflected in fine and coarse scales, respectively, and thereby complex variations are inherently disentangled. Based on this observation, we propose TimeMixer as a fully MLP-based architecture with Past-Decomposable-Mixing (PDM) and Future-Multipredictor-Mixing (FMM) blocks to take full advantage of disentangled multiscale series in both past extraction and future prediction phases. Concretely, PDM applies the decomposition to multiscale series and further mixes the decomposed seasonal and trend components in fine-to-coarse and coarse-to-fine directions separately, which successively aggregates the microscopic seasonal and macroscopic trend information. FMM further ensembles multiple predictors to utilize complementary forecasting capabilities in multiscale observations. Consequently, our proposed TimeMixer is able to achieve consistent state-of-the-art performances in both long-term and short-term forecasting tasks with favorable run-time efficiency.", "keywords": "Time Series Forecasting;Mixing Networks", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/92b4b480bed2da6400329929685bd647f09c0bf8.zip", "author": "Shiyu Wang;Haixu Wu;Xiaoming Shi;Tengge Hu;Huakun Luo;Lintao Ma;James Y. Zhang;JUN ZHOU", "authorids": "~Shiyu_Wang3;~Haixu_Wu1;~Xiaoming_Shi2;~Tengge_Hu1;~Huakun_Luo1;~Lintao_Ma1;~James_Y._Zhang1;~JUN_ZHOU6", "gender": ";M;M;;;;M;M", "homepage": ";;;http://ise.thss.tsinghua.edu.cn/~mlong/;;;https://scholar.google.com/citations?user=Ywakh_sAAAAJ;https://scholar.google.com/citations?user=mCVvloEAAAAJ&hl=en", "dblp": ";286/8115;;330/4778;;;151/3086;99/3847-11", "google_scholar": ";oLL_x0wAAAAJ;0WMTWacAAAAJ;;;;Ywakh_sAAAAJ;mCVvloEAAAAJ", "orcid": ";;0000-0003-0764-8961;;;;0000-0001-6519-676X;0000-0001-6033-6102", "linkedin": ";;;;;;jamesymzhang/;", "or_profile": "~Shiyu_Wang3;~Haixu_Wu1;~Xiaoming_Shi2;~Tengge_Hu1;~Huakun_Luo1;~Lintao_Ma1;~James_Y._Zhang1;~JUN_ZHOU6", "aff": ";Tsinghua University;Ant Group;Tsinghua University;;;Ant Group;Ant Group", "aff_domain": ";tsinghua.edu.cn;antgroup.com;tsinghua.edu.cn;;;alipay.com;antgroup.com", "position": ";PhD student;Researcher;MS student;;;managing director;Researcher", "bibtex": "@inproceedings{\nwang2024timemixer,\ntitle={TimeMixer: Decomposable Multiscale Mixing for Time Series Forecasting},\nauthor={Shiyu Wang and Haixu Wu and Xiaoming Shi and Tengge Hu and Huakun Luo and Lintao Ma and James Y. 
Zhang and JUN ZHOU},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=7oLshfEIC2}\n}", "github": "", "project": "", "reviewers": "ixvB;P2SD;ansv", "pdf_size": 5651407, "rating": "3;6;8", "confidence": "3;4;3", "soundness": "3;2;3", "contribution": "3;2;3", "presentation": "4;3;4", "wc_summary": "99;46;94", "wc_strengths": "161;50;205", "wc_weaknesses": "265;181;193", "wc_questions": "117;5;74", "wc_review": "642;282;566", "wc_reply_reviewers": "569;60;44", "wc_reply_authors": "3469;1390;714", "reply_reviewers": "2;1;1", "reply_authors": "11;5;2", "rating_avg": [ 5.666666666666667, 2.0548046676563256 ], "confidence_avg": [ 3.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 3.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 79.66666666666667, 23.893281249943232 ], "wc_strengths_avg": [ 138.66666666666666, 65.21928821717971 ], "wc_weaknesses_avg": [ 213.0, 37.094473981982816 ], "wc_questions_avg": [ 65.33333333333333, 46.13265895460852 ], "wc_review_avg": [ 496.6666666666667, 154.9308089295204 ], "wc_reply_reviewers_avg": [ 224.33333333333334, 243.8036550632952 ], "wc_reply_authors_avg": [ 1857.6666666666667, 1172.3311060541823 ], "reply_reviewers_avg": [ 1.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 6.0, 3.7416573867739413 ], "replies_avg": [ 28, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": 0.1147078669352809, "gs_citation": 210, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=7179608277779096511&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=7oLshfEIC2", "pdf": "https://openreview.net/pdf?id=7oLshfEIC2", "email": ";tsinghua.edu.cn;antgroup.com;tsinghua.edu.cn;;;alipay.com;antgroup.com", "author_num": 8, "aff_unique_index": "0;1;0;1;1", "aff_unique_norm": "Tsinghua University;Ant Group", "aff_unique_dep": ";", "aff_unique_url": "https://www.tsinghua.edu.cn;https://www.antgroup.com", "aff_unique_abbr": "THU;Ant Group", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "China" }, { "id": "7oYpj8BOLW", "title": "BackBench: Are Vision Language Models Resilient to Object-to-Background Context?", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "In this paper, we evaluate the resilience of modern vision and multimodal foundational models against object-to-background context variations. The majority of robustness evaluation methods have introduced synthetic datasets to induce changes to object characteristics (viewpoints, scale, color) or utilized image transformation techniques (adversarial changes, common corruptions) on real images to simulate shifts in distributions. Our approach, on the other hand, can change the background of real images using text prompts thus allowing diverse changes to the background. We achieve this while preserving the original appearance and semantics of the object of interest. This allows us to quantify the role of background context in understanding the robustness and generalization of deep neural networks. To achieve this goal, we harness the generative capabilities of text-to-image, image-to-text, and image-to-segment models to automatically generate a broad spectrum of object-to-background changes. 
By using textual guidance for control, we produce various versions of standard vision datasets (ImageNet, COCO), incorporating either diverse and realistic backgrounds into the images or introducing variations in the color and texture of the background. Additionally, we craft adversarial backgrounds by optimizing the latent variables and text embeddings within text-to-image models. We conduct thorough experimentation and provide an in-depth analysis of the robustness of vision and language models against object-to-background context variations across different tasks. Our code and evaluation benchmark along with the datasets will be publicly released.", "keywords": "Robustness;Real Image Editing;Foundational models;Adversarial Examples;Counterfactual images", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/621bb75b2ca1bab96f2b2602621aee16ab2bcfbe.pdf", "author": "Muhammad Huzaifa;Hashmat Shadab Malik;Muzammal Naseer;Salman Khan;Fahad Khan", "authorids": "~Muhammad_Huzaifa1;~Hashmat_Shadab_Malik1;~Muzammal_Naseer1;~Salman_Khan4;~Fahad_Khan1", "gender": "M;M;M;M;M", "homepage": "https://muhammad-huzaifaa.github.io/;;https://muzammal-naseer.com/;https://salman-h-khan.github.io/;https://sites.google.com/view/fahadkhans/home", "dblp": ";312/4561;;32/11535-1;05/8618", "google_scholar": "V7hTDxQAAAAJ;2Ft7r4AAAAAJ;https://scholar.google.ch/citations?user=tM9xKA8AAAAJ;https://scholar.google.es/citations?user=M59O9lkAAAAJ;zvaeYnUAAAAJ", "orcid": ";;0000-0001-7663-7161;0000-0002-9502-1749;", "linkedin": "muhammad-huzaifa--/;hashmat-shadab-malik-7a578b17b?originalSubdomain=ae;muzammalnaseer/;;", "or_profile": "~Muhammad_Huzaifa1;~Hashmat_Shadab_Malik1;~Muzammal_Naseer1;~Salman_Khan4;~Fahad_Khan1", "aff": "Mohamed bin Zayed University of Artificial Intelligence;Mohamed bin Zayed University of Artificial Intelligence;Mohamed bin Zayed University of Artificial Intelligence;Australian National University;Link\u00f6ping University", "aff_domain": "mbzuai.ac.ae;mbzuai.ac.ae;mbzuai.ac.ae;anu.edu.au;liu.se", "position": "MS student;PhD student;Researcher;Lecturer;Associate Professor", "bibtex": "@misc{\nanonymous2024backbench,\ntitle={BackBench: Are Vision Language Models Resilient to Object-to-Background Context?},\nauthor={Anonymous},\nyear={2024},\nurl={https://openreview.net/forum?id=7oYpj8BOLW}\n}", "github": "", "project": "", "reviewers": "SPdM;ATH5;B18W;RPSV", "site": "https://openreview.net/forum?id=7oYpj8BOLW", "pdf_size": 10114163, "rating": "5;5;6;8", "confidence": "4;3;3;4", "soundness": "2;2;2;4", "contribution": "2;3;2;3", "presentation": "2;3;2;4", "wc_summary": "52;58;149;72", "wc_strengths": "57;8;81;84", "wc_weaknesses": "202;55;96;42", "wc_questions": "34;2;90;56", "wc_review": "345;123;416;254", "wc_reply_reviewers": "55;0;0;0", "wc_reply_authors": "1904;1168;768;1489", "reply_reviewers": "1;0;0;0", "reply_authors": "3;2;2;3", "rating_avg": [ 6.0, 1.224744871391589 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.5, 0.8660254037844386 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.75, 0.82915619758885 ], "wc_summary_avg": [ 82.75, 38.931831449342326 ], "wc_strengths_avg": [ 57.5, 30.434355587066403 ], "wc_weaknesses_avg": [ 98.75, 62.85449466824151 ], "wc_questions_avg": [ 45.5, 32.07413287993925 ], "wc_review_avg": [ 284.5, 109.5045661148429 ], "wc_reply_reviewers_avg": [ 13.75, 23.81569860407206 ], "wc_reply_authors_avg": [ 1332.25, 417.3801474675095 ], "reply_reviewers_avg": 
[ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 2.5, 0.5 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.40824829046386296, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:PBSU1a9SdPIJ:scholar.google.com/&scioq=BackBench:+Are+Vision+Language+Models+Resilient+to+Object-to-Background+Context%3F&hl=en&as_sdt=0,44", "gs_version_total": 0, "aff_unique_index": "0;0;0;1;2", "aff_unique_norm": "Mohamed bin Zayed University of Artificial Intelligence;Australian National University;Link\u00f6ping University", "aff_unique_dep": ";;", "aff_unique_url": "https://mbzuai.ac.ae;https://www.anu.edu.au;https://www.liu.se", "aff_unique_abbr": "MBZUAI;ANU;LiU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;1;2", "aff_country_unique": "United Arab Emirates;Australia;Sweden" }, { "id": "7pVIFJW2Hp", "title": "FigCaps-HF: A Figure-to-Caption Generative Framework and Benchmark with Human Feedback", "track": "main", "status": "Reject", "tldr": "", "abstract": "Captions are crucial for understanding scientific visualizations and documents. Existing captioning methods for scientific figures rely on figure-caption pairs extracted from documents for training, many of which fall short with respect to metrics like helpfulness, explainability, and visual-descriptiveness leading to generated captions being misaligned with reader preferences. To enable the generation of high-quality figure captions, we introduce FigCaps-HF a new framework for figure-caption generation that can incorporate domain expert feedback in generating captions optimized for reader preferences. Our framework comprises of 1) an automatic method for evaluating quality of figure-caption pairs, 2) a novel reinforcement learning with human feedback (RLHF) method to optimize a generative figure-to-caption model for reader preferences. We demonstrate the effectiveness of our simple learning framework by improving performance over standard fine-tuning across different types of models. In particular, when using BLIP as the base model, our RLHF framework achieves a mean gain of 35.7%, 16.9%, and 9% in ROUGE, BLEU, and Meteor, respectively. Finally, we release a large-scale benchmark dataset with human feedback on figure-caption pairs to enable further evaluation and development of RLHF techniques for this problem", "keywords": "Figure Caption Generation;Image-to-Text Generation;Reinforcement Learning using Human Feedback;Figure-Caption Benchmark;Human Feedback", "primary_area": "datasets and benchmarks", "supplementary_material": "", "author": "Ashish Singh;Prateek Agarwal;Zixuan Huang;Arpita Singh;Tong Yu;Sungchul Kim;Victor Bursztyn;Nikos Vlassis;Ryan A. 
Rossi", "authorids": "~Ashish_Singh2;~Prateek_Agarwal1;~Zixuan_Huang5;~Arpita_Singh1;~Tong_Yu3;~Sungchul_Kim1;~Victor_Bursztyn1;~Nikos_Vlassis1;~Ryan_A._Rossi2", "gender": "M;M;M;F;;M;M;;M", "homepage": "https://people.cs.umass.edu/~ashishsingh/;;https://github.com/rayt98;;https://www.linkedin.com/in/tong-yu-42790744;https://sites.google.com/site/subright;https://vbursztyn.github.io/;;http://ryanrossi.com", "dblp": ";;;;32/1593-1;61/1573;154/7800.html;v/NikosAVlassis;17/5085", "google_scholar": "5lJCCzMAAAAJ;;;;https://scholar.google.com/citations?hl=en;v8ISLgIAAAAJ;HRx3epUAAAAJ;JJWWPjsAAAAJ;_Dc6lbQAAAAJ", "orcid": ";;;;0000-0002-5991-2050;0000-0003-3580-5290;;;0000-0001-9758-0635", "linkedin": "ashish-singh-a750b7b6/;prateekagarw/;;arpita505/;tong-yu-42790744;;;;", "or_profile": "~Ashish_Singh2;~Prateek_Agarwal1;~Zixuan_Huang5;~Arpita_Singh1;~Tong_Yu3;~Sungchul_Kim1;~Victor_Bursztyn1;~Nikos_Vlassis1;~Ryan_Rossi1", "aff": "Department of Computer Science, University of Massachusetts, Amherst;;University of Massachusetts at Amherst;LinkedIn;Adobe Research;Adobe Systems;Adobe Systems;Adobe Systems;Adobe Research", "aff_domain": "cs.umass.edu;;umass.edu;linkedin.com;adobe.com;adobe.com;adobe.com;adobe.com;adobe.com", "position": "PhD student;;MS student;Software Engineer;Senior Research Scientist;Researcher;Researcher;Principal Researcher;Senior Research Scientist", "bibtex": "@misc{\nsingh2024figcapshf,\ntitle={FigCaps-{HF}: A Figure-to-Caption Generative Framework and Benchmark with Human Feedback},\nauthor={Ashish Singh and Prateek Agarwal and Zixuan Huang and Arpita Singh and Tong Yu and Sungchul Kim and Victor Bursztyn and Nikos Vlassis and Ryan A. Rossi},\nyear={2024},\nurl={https://openreview.net/forum?id=7pVIFJW2Hp}\n}", "github": "", "project": "", "reviewers": "oWEK;LPWT;3Ti9;MqnR", "site": "https://openreview.net/forum?id=7pVIFJW2Hp", "pdf_size": 3346984, "rating": "5;5;6;6", "confidence": "3;3;3;3", "soundness": "3;2;3;3", "contribution": "3;2;3;3", "presentation": "2;2;3;3", "wc_summary": "45;62;101;57", "wc_strengths": "71;53;124;40", "wc_weaknesses": "70;98;22;52", "wc_questions": "53;4;201;24", "wc_review": "239;217;448;173", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "711;685;0;727", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;0;1", "rating_avg": [ 5.5, 0.5 ], "confidence_avg": [ 3.0, 0.0 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 66.25, 20.99255820523073 ], "wc_strengths_avg": [ 72.0, 31.976553910638962 ], "wc_weaknesses_avg": [ 60.5, 27.617928959282953 ], "wc_questions_avg": [ 70.5, 77.3320761392063 ], "wc_review_avg": [ 269.25, 105.90178232683338 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 530.75, 306.79502522042304 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0.75, 0.4330127018922193 ], "replies_avg": [ 9, 0 ], "authors#_avg": [ 9, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 8, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=15640674917187120192&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 4, "aff_unique_index": "0;0;1;2;2;2;2;2", "aff_unique_norm": "University of Massachusetts Amherst;LinkedIn Corporation;Adobe", "aff_unique_dep": "Department of Computer Science;;Adobe Research", "aff_unique_url": "https://www.umass.edu;https://www.linkedin.com;https://research.adobe.com", "aff_unique_abbr": "UMass Amherst;LinkedIn;Adobe", "aff_campus_unique_index": "0;0", "aff_campus_unique": 
"Amherst;", "aff_country_unique_index": "0;0;0;0;0;0;0;0", "aff_country_unique": "United States" }, { "title": "Heterogeneous Personalized Federated Learning by Local-Global Updates Mixing via Convergence Rate", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19346", "id": "7pWRLDBAtc", "author_site": "Meirui Jiang, Anjie Le, Xiaoxiao Li, Qi Dou", "tldr": "", "abstract": "Personalized federated learning (PFL) has emerged as a promising technique for addressing the challenge of data heterogeneity. While recent studies have made notable progress in mitigating heterogeneity associated with label distributions, the issue of effectively handling feature heterogeneity remains an open question. In this paper, we propose a personalization approach by Local-global updates Mixing (LG-Mix) via Neural Tangent Kernel (NTK)-based convergence. The core idea is to leverage the convergence rate induced by NTK to quantify the importance of local and global updates, and subsequently mix these updates based on their importance. Specifically, we find the trace of the NTK matrix can manifest the convergence rate, and propose an efficient and effective approximation to calculate the trace of a feature matrix instead of the NTK matrix. Such approximation significantly reduces the cost of computing NTK, and the feature matrix explicitly considers the heterogeneous features among samples. We have theoretically analyzed the convergence of our method in the over-parameterize regime, and experimentally evaluated our method on five datasets. These datasets present heterogeneous data features in natural and medical images. With comprehensive comparison to existing state-of-the-art approaches, our LG-Mix has consistently outperformed them across all datasets (largest accuracy improvement of 5.01\\%), demonstrating the outstanding efficacy of our method for model personalization. 
Code is available at \\url{https://github.com/med-air/HeteroPFL}.", "keywords": "Personalized Federated Learning;Heterogeneous Data;Feature Distribution Shift", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/5b33797c929db3d387af16617136bea9a85e4fd2.zip", "author": "Meirui Jiang;Anjie Le;Xiaoxiao Li;Qi Dou", "authorids": "~Meirui_Jiang2;~Anjie_Le1;~Xiaoxiao_Li1;~Qi_Dou2", "gender": "F;Unspecified;F;M", "homepage": ";https://xxlya.github.io/;https://www.cse.cuhk.edu.hk/~qdou;https://meiruijiang.github.io/MeiruiJiang/", "dblp": "353/1044;71/8042;165/7846;285/5480", "google_scholar": "XvQ4B1sAAAAJ;sdENOQ4AAAAJ;https://scholar.google.com.hk/citations?user=iHh7IJQAAAAJ;https://scholar.google.com/citations?hl=en", "orcid": ";;0000-0002-3416-9950;0000-0003-4228-8420", "linkedin": ";;;", "or_profile": "~Anjie_Le1;~Xiaoxiao_Li1;~Qi_Dou2;~Meirui_JIANG1", "aff": "University of Cambridge;University of British Columbia;The Chinese University of Hong Kong;Department of Computer Science and Engineering, The Chinese University of Hong Kong", "aff_domain": "cam.ac.uk;ece.ubc.ca;cuhk.edu.hk;cse.cuhk.edu.hk", "position": "MS student;Assistant Professor;Assistant Professor;PhD student", "bibtex": "@inproceedings{\njiang2024heterogeneous,\ntitle={Heterogeneous Personalized Federated Learning by Local-Global Updates Mixing via Convergence Rate},\nauthor={Meirui Jiang and Anjie Le and Xiaoxiao Li and Qi Dou},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=7pWRLDBAtc}\n}", "github": "", "project": "", "reviewers": "Ho8d;efqn;i8zc", "pdf_size": 1368900, "rating": "5;6;8", "confidence": "2;3;2", "soundness": "2;3;3", "contribution": "2;2;3", "presentation": "2;3;3", "wc_summary": "65;47;102", "wc_strengths": "44;50;71", "wc_weaknesses": "322;154;48", "wc_questions": "391;28;71", "wc_review": "822;279;292", "wc_reply_reviewers": "0;152;0", "wc_reply_authors": "1819;942;1510", "reply_reviewers": "0;2;0", "reply_authors": "3;3;3", "rating_avg": [ 6.333333333333333, 1.247219128924647 ], "confidence_avg": [ 2.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 71.33333333333333, 22.895899681432528 ], "wc_strengths_avg": [ 55.0, 11.575836902790225 ], "wc_weaknesses_avg": [ 174.66666666666666, 112.81055900146147 ], "wc_questions_avg": [ 163.33333333333334, 161.93894597107337 ], "wc_review_avg": [ 464.3333333333333, 252.9642047580821 ], "wc_reply_reviewers_avg": [ 50.666666666666664, 71.65348716023682 ], "wc_reply_authors_avg": [ 1423.6666666666667, 363.2008932930767 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.9428090415820634 ], "reply_authors_avg": [ 3.0, 0.0 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.18898223650461363, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:vK5WzmeAoIgJ:scholar.google.com/&scioq=Heterogeneous+Personalized+Federated+Learning+by+Local-Global+Updates+Mixing+via+Convergence+Rate&hl=en&as_sdt=0,33", "gs_version_total": 2, "openreview": "https://openreview.net/forum?id=7pWRLDBAtc", "pdf": "https://openreview.net/pdf?id=7pWRLDBAtc", "email": "cam.ac.uk;ece.ubc.ca;cuhk.edu.hk;cse.cuhk.edu.hk", "author_num": 4, "aff_unique_index": "0;1;2;2", "aff_unique_norm": "University of 
Cambridge;University of British Columbia;Chinese University of Hong Kong", "aff_unique_dep": ";;", "aff_unique_url": "https://www.cam.ac.uk;https://www.ubc.ca;https://www.cuhk.edu.hk", "aff_unique_abbr": "Cambridge;UBC;CUHK", "aff_campus_unique_index": "0;2;2", "aff_campus_unique": "Cambridge;;Hong Kong SAR", "aff_country_unique_index": "0;1;2;2", "aff_country_unique": "United Kingdom;Canada;China" }, { "id": "7q7s5fXEpP", "title": "Stealthy Imitation: Reward-guided Environment-free Policy Stealing", "track": "main", "status": "Reject", "tldr": "", "abstract": "Deep reinforcement learning policies, which are integral to modern control systems, represent valuable intellectual property. The development of these policies demands considerable resources, such as domain expertise, simulation fidelity, and real-world validation. These policies are potentially vulnerable to model stealing attacks, which aim to replicate their functionality using only black-box access. In this paper, we propose Stealthy Imitation, the first attack designed to steal policies without access to the environment or knowledge of the input range. This setup has not been considered by previous model stealing methods. Lacking access to the victim's input states distribution, Stealthy Imitation fits a reward model that allows to approximate it. We show that the victim policy is harder to imitate when the distribution of the attack queries matches that of the victim. We evaluate our approach across diverse, high-dimensional control tasks and consistently outperform prior data-free approaches adapted for policy stealing. Lastly, we propose a countermeasure that significantly diminishes the effectiveness of the attack. The implementation of Stealthy Imitation will be publicly available and open-source.", "keywords": "model stealing;security;deep reinforcement learning;control system", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "Zhixiong Zhuang;Maria-Irina Nicolae;Mario Fritz", "authorids": "~Zhixiong_Zhuang1;~Maria-Irina_Nicolae1;~Mario_Fritz1", "gender": "M;F;M", "homepage": "https://de.linkedin.com/in/zhixiong-zhuang-7b18121b0;https://ririnicolae.github.io/;https://cispa.saarland/group/fritz/", "dblp": ";156/0167.html;", "google_scholar": ";kNOsX30AAAAJ;https://scholar.google.de/citations?user=4V1nNm4AAAAJ", "orcid": ";0009-0002-2758-7481;", "linkedin": ";irina-nicolae-a2251638;", "or_profile": "~Zhixiong_Zhuang1;~Maria-Irina_Nicolae1;~Mario_Fritz1", "aff": "Robert Bosch GmbH;Robert Bosch GmbH;Saarland University", "aff_domain": "bosch.com;bosch.com;uni-saarland.de", "position": "PhD student;Research scientist;Full Professor", "bibtex": "@misc{\nzhuang2024stealthy,\ntitle={Stealthy Imitation: Reward-guided Environment-free Policy Stealing},\nauthor={Zhixiong Zhuang and Maria-Irina Nicolae and Mario Fritz},\nyear={2024},\nurl={https://openreview.net/forum?id=7q7s5fXEpP}\n}", "github": "", "project": "", "reviewers": "3FCu;LEDd;Maon;AqHM", "site": "https://openreview.net/forum?id=7q7s5fXEpP", "pdf_size": 2088392, "rating": "5;5;6;6", "confidence": "4;3;3;3", "soundness": "2;3;3;2", "contribution": "3;2;2;2", "presentation": "4;3;3;2", "wc_summary": "140;78;72;131", "wc_strengths": "40;56;24;74", "wc_weaknesses": "493;74;150;320", "wc_questions": "73;201;45;200", "wc_review": "746;409;291;725", "wc_reply_reviewers": "260;0;20;63", "wc_reply_authors": "673;602;498;666", "reply_reviewers": "1;0;1;1", "reply_authors": "1;1;1;1", "rating_avg": [ 5.5, 0.5 ], 
"confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 105.25, 30.49077729412617 ], "wc_strengths_avg": [ 48.5, 18.567444627627143 ], "wc_weaknesses_avg": [ 259.25, 161.69628165174362 ], "wc_questions_avg": [ 129.75, 71.44009728436825 ], "wc_review_avg": [ 542.75, 197.3529515867447 ], "wc_reply_reviewers_avg": [ 85.75, 103.14643716580811 ], "wc_reply_authors_avg": [ 609.75, 70.2010505619396 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12495121733455247305&as_sdt=5,48&sciodt=0,48&hl=en", "gs_version_total": 6, "aff_unique_index": "0;0;1", "aff_unique_norm": "Robert Bosch GmbH;Saarland University", "aff_unique_dep": ";", "aff_unique_url": "https://www.bosch.com;https://www.uni-saarland.de", "aff_unique_abbr": "Bosch;UdS", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "Germany" }, { "id": "7rex8lEZH2", "title": "Prompt Tuning with Diffusion for Few-Shot Pre-trained Policy Generalization", "track": "main", "status": "Reject", "tldr": "", "abstract": "Offline Reinforcement Learning (RL) methods harness previous experiences to derive an optimal policy, forming the foundation for pre-trained large-scale models (PLMs). When encountering tasks not seen before, PLMs often utilize several expert trajectories as prompts to expedite their adaptation to new requirements. Though a range of prompt-tuning methods has been proposed to enhance the quality of prompts, these methods frequently face restrictions due to prompt initialization, which can significantly constrain the exploration domain and potentially lead to suboptimal solutions. To eliminate the reliance on the initial prompt, we shift our perspective towards the generative model, framing the prompt-tuning process as a form of conditional generative modeling, where prompts are generated from random noise. Our innovation, the Prompt Diffuser, leverages a conditional diffusion model to produce prompts of exceptional quality. Central to our framework is the approach to trajectory reconstruction and the meticulous integration of downstream task guidance during the training phase. 
Further experimental results underscore the potency of the Prompt Diffuser as a robust and effective tool for the prompt-tuning process, demonstrating strong performance in the meta-RL tasks.", "keywords": "prompt tuning;diffusion model", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "/attachment/19a1db969304f3603761c62f87bfbfb406968244.pdf", "author": "Shengchao Hu;Li Shen;Ya Zhang;Dacheng Tao", "authorids": "~Shengchao_Hu1;~Li_Shen1;~Ya_Zhang1;~Dacheng_Tao1", "gender": ";M;F;", "homepage": ";https://sites.google.com/site/mathshenli/home;https://annzhanglion.github.io/;", "dblp": ";91/3680-8;85/3714-2;", "google_scholar": ";yVhgENIAAAAJ;pbjw9sMAAAAJ;", "orcid": ";;0000-0002-5390-9053;", "linkedin": ";;;", "or_profile": "~Shengchao_Hu1;~Li_Shen1;~Ya_Zhang1;~Dacheng_Tao1", "aff": ";JD Explore Academy;Shanghai Jiaotong University;", "aff_domain": ";jd.com;sjtu.edu.cn;", "position": ";Researcher;Professor;", "bibtex": "@misc{\nhu2024prompt,\ntitle={Prompt Tuning with Diffusion for Few-Shot Pre-trained Policy Generalization},\nauthor={Shengchao Hu and Li Shen and Ya Zhang and Dacheng Tao},\nyear={2024},\nurl={https://openreview.net/forum?id=7rex8lEZH2}\n}", "github": "", "project": "", "reviewers": "GaVK;4ueS;V1Dp;zrXj", "site": "https://openreview.net/forum?id=7rex8lEZH2", "pdf_size": 900417, "rating": "5;5;6;8", "confidence": "4;3;4;3", "soundness": "3;2;3;3", "contribution": "2;2;3;3", "presentation": "3;3;2;3", "wc_summary": "74;47;52;52", "wc_strengths": "39;45;48;67", "wc_weaknesses": "103;138;97;52", "wc_questions": "75;40;109;2", "wc_review": "291;270;306;173", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "1862;1918;2556;1175", "reply_reviewers": "0;0;0;0", "reply_authors": "5;4;5;2", "rating_avg": [ 6.0, 1.224744871391589 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 56.25, 10.449282272003183 ], "wc_strengths_avg": [ 49.75, 10.473180032826706 ], "wc_weaknesses_avg": [ 97.5, 30.581857366746057 ], "wc_questions_avg": [ 56.5, 39.81519810323691 ], "wc_review_avg": [ 260.0, 51.83145762951299 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 1877.75, 488.8120165257806 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 4.0, 1.224744871391589 ], "replies_avg": [ 23, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.40824829046386296, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=1566295000175567071&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 3, "aff_unique_index": "0;1", "aff_unique_norm": "JD;Shanghai Jiao Tong University", "aff_unique_dep": "JD Explore Academy;", "aff_unique_url": ";https://www.sjtu.edu.cn", "aff_unique_abbr": ";SJTU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "1", "aff_country_unique": ";China" }, { "id": "7sASqAmGaO", "title": "Augmenting Negative Representation for Continual Self-Supervised Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "We introduce a novel and general loss function, called Augmented Negatives (AugNeg), for effective continual self-supervised learning (CSSL). We first argue that the conventional loss form of continual learning which consists of single task-specific loss (for plasticity) and a regularizer (for stability) may not be ideal for contrastive loss based CSSL that focus on representation learning. 
Our reasoning is that, in contrastive learning based methods, the task-specific loss would suffer from decreasing diversity of negative samples and the regularizer may hinder learning new distinctive representations. To that end, we propose AugNeg that consists of two losses with symmetric dependence on current and past models' negative representations. We argue our model can naturally find good trade-off between the plasticity and stability without any explicit hyperparameter tuning. \nFurthermore, we present that the idea of utilizing augmented negative representations can be applied to CSSL with non-contrastive learning by adding a regularization term.\nWe validate the effectiveness of our approach through extensive experiments, demonstrating that applying the AugNeg loss achieves superior performance compared to other state-of-the-art CSSL methods, in both contrastive and non-contrastive learning algorithms.", "keywords": "Continual Learning;Representation Learning;Self-supervised Learning;Continual Self-Supervised Learning;Continual Representation Learning", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "/attachment/ac9c8b73f89c33a533cf3ae8b11732619bcecc3d.zip", "author": "Sungmin Cha;Kyunghyun Cho;Taesup Moon", "authorids": "~Sungmin_Cha1;~Kyunghyun_Cho1;~Taesup_Moon1", "gender": "M;M;", "homepage": "https://sites.google.com/view/sungmin-cha/;http://kyunghyuncho.me;https://mindlab-snu.github.io/people/pi/", "dblp": "206/6287;41/9736;05/4084", "google_scholar": "i0PPhfAAAAAJ;https://scholar.google.fi/citations?user=0RAmmIAAAAAJ;lQlioBoAAAAJ", "orcid": ";;0000-0002-9257-6503", "linkedin": ";;", "or_profile": "~Sungmin_Cha1;~Kyunghyun_Cho1;~Taesup_Moon1", "aff": "New York University;Genentech;Seoul National University", "aff_domain": "nyu.edu;gene.com;snu.ac.kr", "position": "Faculty Fellow;Senior Director of Frontier Research;Associate Professor", "bibtex": "@misc{\ncha2024augmenting,\ntitle={Augmenting Negative Representation for Continual Self-Supervised Learning},\nauthor={Sungmin Cha and Kyunghyun Cho and Taesup Moon},\nyear={2024},\nurl={https://openreview.net/forum?id=7sASqAmGaO}\n}", "github": "", "project": "", "reviewers": "Tkp5;E4AJ;GiPi", "site": "https://openreview.net/forum?id=7sASqAmGaO", "pdf_size": 1335969, "rating": "5;5;6", "confidence": "3;4;3", "soundness": "2;3;3", "contribution": "2;2;3", "presentation": "2;2;3", "wc_summary": "75;55;59", "wc_strengths": "18;17;75", "wc_weaknesses": "259;135;173", "wc_questions": "49;127;44", "wc_review": "401;334;351", "wc_reply_reviewers": "0;51;16", "wc_reply_authors": "1036;1144;669", "reply_reviewers": "0;1;1", "reply_authors": "4;4;3", "rating_avg": [ 5.333333333333333, 0.4714045207910317 ], "confidence_avg": [ 3.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 63.0, 8.640987597877148 ], "wc_strengths_avg": [ 36.666666666666664, 27.10883414846328 ], "wc_weaknesses_avg": [ 189.0, 51.87163643713842 ], "wc_questions_avg": [ 73.33333333333333, 38.00292386412159 ], "wc_review_avg": [ 362.0, 28.437065014988214 ], "wc_reply_reviewers_avg": [ 22.333333333333332, 21.296843793284385 ], "wc_reply_authors_avg": [ 949.6666666666666, 203.29999726731154 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 3.6666666666666665, 0.4714045207910317 ], 
"replies_avg": [ 23, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.4999999999999999, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14189818090051337427&as_sdt=40005&sciodt=0,10&hl=en", "gs_version_total": 0, "aff_unique_index": "0;1;2", "aff_unique_norm": "New York University;Genentech;Seoul National University", "aff_unique_dep": ";;", "aff_unique_url": "https://www.nyu.edu;https://www.genentech.com;https://www.snu.ac.kr", "aff_unique_abbr": "NYU;Genentech;SNU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;1", "aff_country_unique": "United States;South Korea" }, { "id": "7sMR09VNKU", "title": "Learning System Dynamics from Sensory Input under Optimal Control Principles", "track": "main", "status": "Reject", "tldr": "", "abstract": "Identifying the underlying dynamics of actuated physical systems from sensory input is of high interest in control, robotics, and engineering in general. In the context of control problems, existing approaches decouple the construction of the feature space where the dynamics identification process occurs from the target control tasks, potentially leading to a mismatch between feature and state spaces: the systems may not be controllable in feature space, and synthesized controls may not be applicable in state space.\nBorrowing from the Koopman formalism, we propose instead to learn an embedding of both the states and controls into a feature space where the dynamics are linear, and include the target control task in the learning objective in the form of a differentiable and robust optimal control problem. We validate the proposed approach with simulation experiments using systems with non-linear dynamics, demonstrating that the controls obtained in feature space can be used to drive the corresponding physical systems and that the learned model can serve for future state prediction.", "keywords": "representation learning;optimal control", "primary_area": "applications to robotics, autonomy, planning", "supplementary_material": "/attachment/d9f53cb0d0718befb58b84bc55561e74bc656ee3.pdf", "author": "Oumayma Bounou;Jean Ponce;Justin Carpentier", "authorids": "~Oumayma_Bounou1;~Jean_Ponce1;~Justin_Carpentier1", "gender": "F;M;M", "homepage": ";http://www.di.ens.fr/~ponce/;https://jcarpent.github.io", "dblp": ";p/JeanPonce;173/7498", "google_scholar": "B2RS1M4AAAAJ;https://scholar.google.com.tw/citations?user=vC2vywcAAAAJ;https://scholar.google.fr/citations?user=CyhIdmMAAAAJ", "orcid": ";;", "linkedin": ";;", "or_profile": "~Oumayma_Bounou1;~Jean_Ponce1;~Justin_Carpentier1", "aff": ";Ecole Normale Sup\u00e9rieure de Paris;INRIA", "aff_domain": ";ens.fr;inria.fr", "position": ";Full Professor;Researcher", "bibtex": "@misc{\nbounou2024learning,\ntitle={Learning System Dynamics from Sensory Input under Optimal Control Principles},\nauthor={Oumayma Bounou and Jean Ponce and Justin Carpentier},\nyear={2024},\nurl={https://openreview.net/forum?id=7sMR09VNKU}\n}", "github": "", "project": "", "reviewers": "6hvE;fvtc;ianP;wihP", "site": "https://openreview.net/forum?id=7sMR09VNKU", "pdf_size": 933768, "rating": "1;3;5;5", "confidence": "5;4;4;3", "soundness": "2;2;3;2", "contribution": "1;2;2;2", "presentation": "2;3;3;2", "wc_summary": "46;85;104;80", "wc_strengths": "30;66;109;30", "wc_weaknesses": "611;273;178;29", "wc_questions": "61;56;125;8", "wc_review": "748;480;516;147", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", 
"reply_authors": "0;0;0;0", "rating_avg": [ 3.5, 1.6583123951777 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 78.75, 20.92098229051399 ], "wc_strengths_avg": [ 58.75, 32.52210786526605 ], "wc_weaknesses_avg": [ 272.75, 213.77836069162848 ], "wc_questions_avg": [ 62.5, 41.59627387158614 ], "wc_review_avg": [ 472.75, 214.3587821853819 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 6, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.8528028654224417, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=17943297840464535428&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 12, "aff_unique_index": "0;1", "aff_unique_norm": "Ecole Normale Sup\u00e9rieure de Paris;INRIA", "aff_unique_dep": ";", "aff_unique_url": "https://www.ens.fr;https://www.inria.fr", "aff_unique_abbr": "ENS Paris;INRIA", "aff_campus_unique_index": "0", "aff_campus_unique": "Paris;", "aff_country_unique_index": "0;0", "aff_country_unique": "France" }, { "id": "7suavRDxe8", "title": "Plausibly Deniable Encryption with Large Language Models", "track": "main", "status": "Reject", "tldr": "", "abstract": "We present a novel approach for achieving plausible deniability in cryptography by harnessing the power of large language models (LLMs) in conjunction with conventional encryption algorithms. Leveraging the inherent statistical properties of LLMs, we design an encryption scheme that allows the same ciphertext to be decrypted with any key, while still yielding a plausible message. Unlike established methods, our approach neither relies on a fixed set of decoy keys or messages nor introduces redundancy. Our method is founded on the observation that language models can be used as encoders to compress a low-entropy signal (such as natural language) into a stream indistinguishable from noise, and similarly, that sampling from the model is equivalent to decoding a stream of noise. When such a stream is encrypted and subsequently decrypted with an incorrect key, it will lead to a sampling behavior and will thus generate a plausible message. Through a series of experiments, we substantiate the resilience of our approach against various statistical detection techniques. 
Finally, although we mainly focus on language models, we establish the applicability of our approach to a broader set of generative models and domains, including images and audio.", "keywords": "large language models;LLM;deniable encryption;compression", "primary_area": "probabilistic methods (Bayesian methods, variational inference, sampling, UQ, etc.)", "supplementary_material": "/attachment/764c29d631d2939d474d5a77f1f77f61272b4496.zip", "author": "Dario Pavllo;Sotiris Anagnostidis", "authorids": "~Dario_Pavllo2;~Sotiris_Anagnostidis1", "gender": ";M", "homepage": ";", "dblp": "218/5320;286/1763", "google_scholar": "5A_sjVQAAAAJ;qjzTKWUAAAAJ", "orcid": ";", "linkedin": "dario-pavllo/;sotiris-anagnostidis-b064a5129/", "or_profile": "~Dario_Pavllo2;~Sotiris_Anagnostidis1", "aff": ";ETH Zurich", "aff_domain": ";inf.ethz.ch", "position": ";PhD student", "bibtex": "@misc{\npavllo2024plausibly,\ntitle={Plausibly Deniable Encryption with Large Language Models},\nauthor={Dario Pavllo and Sotiris Anagnostidis},\nyear={2024},\nurl={https://openreview.net/forum?id=7suavRDxe8}\n}", "github": "", "project": "", "reviewers": "xago;dPno;ydp2;jZiK;n1KU", "site": "https://openreview.net/forum?id=7suavRDxe8", "pdf_size": 1213338, "rating": "3;3;5;5;8", "confidence": "4;4;3;5;4", "soundness": "1;1;2;3;3", "contribution": "1;2;2;2;4", "presentation": "3;3;2;3;4", "wc_summary": "74;70;55;219;176", "wc_strengths": "130;92;19;19;127", "wc_weaknesses": "508;323;101;76;113", "wc_questions": "74;21;69;51;37", "wc_review": "786;506;244;365;453", "wc_reply_reviewers": "0;0;0;342;32", "wc_reply_authors": "228;817;458;630;293", "reply_reviewers": "0;0;0;2;1", "reply_authors": "1;1;2;2;1", "rating_avg": [ 4.8, 1.8330302779823362 ], "confidence_avg": [ 4.0, 0.6324555320336759 ], "soundness_avg": [ 2.0, 0.8944271909999159 ], "contribution_avg": [ 2.2, 0.9797958971132712 ], "presentation_avg": [ 3.0, 0.6324555320336759 ], "wc_summary_avg": [ 118.8, 65.98605913372914 ], "wc_strengths_avg": [ 77.4, 49.52009693043826 ], "wc_weaknesses_avg": [ 224.2, 167.21889845349418 ], "wc_questions_avg": [ 50.4, 19.734234213670415 ], "wc_review_avg": [ 470.8, 180.8528683764789 ], "wc_reply_reviewers_avg": [ 74.8, 134.1736188674957 ], "wc_reply_authors_avg": [ 485.2, 216.74445782995238 ], "reply_reviewers_avg": [ 0.6, 0.8 ], "reply_authors_avg": [ 1.4, 0.4898979485566356 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:S3CLm32LP88J:scholar.google.com/&scioq=Plausibly+Deniable+Encryption+with+Large+Language+Models&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0", "aff_unique_norm": "ETH Zurich", "aff_unique_dep": "", "aff_unique_url": "https://www.ethz.ch", "aff_unique_abbr": "ETHZ", "aff_country_unique_index": "0", "aff_country_unique": "Switzerland" }, { "id": "7tUDUFQkh2", "title": "Ref-Diff: Zero-shot Referring Image Segmentation with Generative Models", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Zero-shot referring image segmentation (RIS) presents a significant challenge. It requires identifying an instance segmentation mask using referring descriptions, without having been trained on such paired data. 
While existing zero-shot RIS methods mainly utilize pre-trained discriminative models (e.g., CLIP), this study observes that generative models (e.g., Stable Diffusion) can discern relationships between various visual elements and text descriptions, an area yet to be explored in this task. In this work, we introduce the Referring Diffusional Segmentor (Ref-Diff), a model that leverages the fine-grained multi-modal information derived from generative models. Our findings show that even without an external proposal generator, our Ref-Diff with a sole generative model outperforms SOTA weakly-supervised models on RefCOCO+ and RefCOCOg. Notably, when combining both generative and discriminative models, our Ref-Diff+ surpasses competing methods by a substantial margin. This highlights the constructive role of generative models in this domain, providing complementary advantages alongside discriminative models to enhance referring segmentation. Our source code will be publicly available.", "keywords": "Zero-shot Referring Image Segmentation;Generative Model", "primary_area": "generative models", "supplementary_material": "", "author": "Minheng Ni;Yabo Zhang;Kailai Feng;Xiaoming Li;Yiwen Guo;Wangmeng Zuo", "authorids": "~Minheng_Ni1;~Yabo_Zhang1;~Kailai_Feng1;~Xiaoming_Li3;~Yiwen_Guo1;~Wangmeng_Zuo3", "gender": "M;M;M;M;;M", "homepage": "https://kodenii.github.io;https://ybybzhang.github.io/;https://github.com/carlofkl;;;", "dblp": "263/9969;231/0624;331/2340;36/3071-2;;93/2671", "google_scholar": "-ybr4_cAAAAJ;LnYDPdAAAAAJ;;https://scholar.google.com/citations?hl=zh-CN;;rUOpCEYAAAAJ", "orcid": ";;;;;0000-0002-3330-783X", "linkedin": "https://linkedin.com/in/minheng-ni-7b8a99146;;;;;", "or_profile": "~Minheng_Ni1;~Yabo_Zhang1;~Kailai_Feng1;~Xiaoming_Li3;~Yiwen_Guo1;~Wangmeng_Zuo3", "aff": "Microsoft;Harbin Institute of Technology;Harbin Institute of Technology;Nanyang Technological University;;Harbin Institute of Technology", "aff_domain": "microsoft.com;hit.edu.cn;stu.hit.edu.cn;ntu.edu.sg;;hit.edu.cn", "position": "Research Intern;PhD student;MS student;Postdoc;;Full Professor", "bibtex": "@misc{\nni2024refdiff,\ntitle={Ref-Diff: Zero-shot Referring Image Segmentation with Generative Models},\nauthor={Minheng Ni and Yabo Zhang and Kailai Feng and Xiaoming Li and Yiwen Guo and Wangmeng Zuo},\nyear={2024},\nurl={https://openreview.net/forum?id=7tUDUFQkh2}\n}", "github": "", "project": "", "reviewers": "YFJv;83NR;rW9R;2K1U", "site": "https://openreview.net/forum?id=7tUDUFQkh2", "pdf_size": 6617820, "rating": "3;3;3;6", "confidence": "4;5;4;4", "soundness": "3;1;2;3", "contribution": "2;1;1;2", "presentation": "3;2;2;3", "wc_summary": "55;44;38;149", "wc_strengths": "24;15;23;43", "wc_weaknesses": "261;247;397;134", "wc_questions": "2;11;24;2", "wc_review": "342;317;482;328", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 3.75, 1.299038105676658 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 2.25, 0.82915619758885 ], "contribution_avg": [ 1.5, 0.5 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 71.5, 45.15805575974236 ], "wc_strengths_avg": [ 26.25, 10.280442597476044 ], "wc_weaknesses_avg": [ 259.75, 93.29355551162149 ], "wc_questions_avg": [ 9.75, 9.01041064547005 ], "wc_review_avg": [ 367.25, 66.84076226375639 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], 
"authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.3333333333333333, "gs_citation": 22, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=13803166602830577984&as_sdt=400005&sciodt=0,14&hl=en", "gs_version_total": 4, "aff_unique_index": "0;1;1;2;1", "aff_unique_norm": "Microsoft;Harbin Institute of Technology;Nanyang Technological University", "aff_unique_dep": "Microsoft Corporation;;", "aff_unique_url": "https://www.microsoft.com;http://www.hit.edu.cn/;https://www.ntu.edu.sg", "aff_unique_abbr": "Microsoft;HIT;NTU", "aff_campus_unique_index": "1;1;1", "aff_campus_unique": ";Harbin", "aff_country_unique_index": "0;1;1;2;1", "aff_country_unique": "United States;China;Singapore" }, { "id": "7v3tkQmtpE", "title": "Rethinking Decision Transformer via Hierarchical Reinforcement Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "Decision Transformer (DT) is an innovative algorithm leveraging recent advances of the Transformer architecture in sequential decision making. However, a notable limitation of DT is its reliance on {recalling} trajectories from datasets, without the capability to seamlessly stitch them together. In this work, we introduce a general sequence modeling framework for studying sequential decision making through the lens of \\emph{Hierarchical Reinforcement Learning}. At the time of making decisions, a \\emph{high-level} policy first proposes an ideal \\emph{prompt} for the current state, a \\emph{low-level} policy subsequently generates an action conditioned on the given prompt. We show how DT emerges as a special case with specific choices of high-level and low-level policies and discuss why these choices might fail in practice. Inspired by these observations, we investigate how to jointly optimize the high-level and low-level policies to enable the stitching capability. This further leads to the development of new algorithms for offline reinforcement learning. Finally, our empirical studies clearly demonstrate the proposed algorithms significantly surpass DT on several control and navigation benchmarks. 
We hope that our contributions can inspire the integration of Transformer architectures within the field of RL.", "keywords": "offline reinforcement learning;decision transformer", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Yi Ma;Chenjun Xiao;Hebin Liang;Jianye HAO", "authorids": "~Yi_Ma5;~Chenjun_Xiao1;~Hebin_Liang2;~Jianye_HAO1", "gender": ";;M;M", "homepage": "https://mayi1996.top/;https://chenjun-x.github.io/;http://www.icdai.org/jianye.html;https://github.com/superCat-star", "dblp": "69/1112-5.html;178/8641;21/7664.html;352/9378.html", "google_scholar": "TdVWzqgAAAAJ;;;", "orcid": "0000-0001-9375-6605;0000-0002-5493-1500;0000-0002-0422-8235;0009-0000-8371-2297", "linkedin": ";;;", "or_profile": "~Yi_Ma5;~Chenjun_Xiao1;~Jianye_HAO1;~hebin_liang1", "aff": "Tianjin University;Huawei Technologies Ltd.;Tianjin University;Tianjin University", "aff_domain": "tju.edu.cn;huawei.com;tju.edu.cn;tju.edu.cn", "position": "PhD student;Researcher;Associate Professor;MS student", "bibtex": "@misc{\nma2024rethinking,\ntitle={Rethinking Decision Transformer via Hierarchical Reinforcement Learning},\nauthor={Yi Ma and Chenjun Xiao and Hebin Liang and Jianye HAO},\nyear={2024},\nurl={https://openreview.net/forum?id=7v3tkQmtpE}\n}", "github": "", "project": "", "reviewers": "UBLF;xoB5;RLH1;XUDW", "site": "https://openreview.net/forum?id=7v3tkQmtpE", "pdf_size": 2059234, "rating": "5;5;5;6", "confidence": "4;3;5;4", "soundness": "3;2;2;3", "contribution": "2;2;2;2", "presentation": "3;2;2;3", "wc_summary": "81;51;72;212", "wc_strengths": "253;45;31;118", "wc_weaknesses": "237;204;161;129", "wc_questions": "34;8;58;21", "wc_review": "605;308;322;480", "wc_reply_reviewers": "159;182;0;39", "wc_reply_authors": "945;1269;783;275", "reply_reviewers": "1;1;0;1", "reply_authors": "3;4;3;1", "rating_avg": [ 5.25, 0.4330127018922193 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 104.0, 63.29691935631623 ], "wc_strengths_avg": [ 111.75, 87.98685981440637 ], "wc_weaknesses_avg": [ 182.75, 41.09972627646077 ], "wc_questions_avg": [ 30.25, 18.471261462065875 ], "wc_review_avg": [ 428.75, 122.13389169268291 ], "wc_reply_reviewers_avg": [ 95.0, 77.17836484404162 ], "wc_reply_authors_avg": [ 818.0, 359.0278540726332 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 2.75, 1.0897247358851685 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 16, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=871146290267306675&as_sdt=400005&sciodt=0,14&hl=en", "gs_version_total": 7, "aff_unique_index": "0;1;0;0", "aff_unique_norm": "Tianjin University;Huawei", "aff_unique_dep": ";Huawei Technologies", "aff_unique_url": "http://www.tju.edu.cn;https://www.huawei.com", "aff_unique_abbr": "TJU;Huawei", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "China" }, { "id": "7vKWg2Vdrs", "title": "LeBD: A Run-time Defense Against Backdoor Attack in YOLO", "track": "main", "status": "Reject", "tldr": "", "abstract": "Backdoor attack poses a serious threat to deep neural networks (DNNs). An adversary can manipulate the prediction of a backdoored model by attaching a specific backdoor trigger to the input. 
However, existing defenses are mainly aimed at detecting backdoors in the digital world, which cannot meet the real-time requirement of application scenarios in the physical world. We propose a LayerCAM-enabled backdoor detector (LeBD) for monitoring backdoor attacks in the object detection (OD) network, YOLOv5. LeBD utilizes LayerCAM to locate the trigger and give a risk warning at run-time. In order to further improve the precision of trigger localization, we propose a backdoor detector based on counterfactual attribution LayerCAM (CA-LeBD). We evaluated the performance of the backdoor detector on images in the digital world and video streams in the physical world. Extensive experiments demonstrate that LeBD and CA-LeBD can efficiently locate the trigger and mitigate the effect of the backdoor in real time. In the physical-world scenario, the backdoor detection rate can reach over 90\\%.", "keywords": "backdoor detector;physical world;YOLO;LayerCAM;counterfactual attribution", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/23a737e05bc27b5ac5cb5fdb77cb4e4c62c36a6d.zip", "author": "Kai Chen;Weijun Shan;Xin Li;XUE YANG;Qing Li;Jun Yu", "authorids": "~Kai_Chen26;~Weijun_Shan1;~Xin_Li63;~XUE_YANG6;~Qing_Li21;~Jun_Yu9", "gender": "M;M;M;F;F;M", "homepage": "https://1208320416.github.io/kaichen.github.io/;https://shanweijun.github.io/;https://903861078.github.io/lixin.github.io/;https://shirley0302.github.io/XueYang.github.io/;https://qingli66.github.io/qingli.github.io/;https://sme.fudan.edu.cn/60/5e/c31157a352350/page.htm", "dblp": ";;;;;", "google_scholar": ";;;;;", "orcid": ";;;;;", "linkedin": ";;;;;", "or_profile": "~Kai_Chen26;~Weijun_Shan1;~Xin_Li63;~XUE_YANG6;~Qing_Li21;~Jun_Yu9", "aff": ";;;;Fudan University;Fudan University", "aff_domain": ";;;;fudan.edu.cn;fudan.edu.cn", "position": ";;;;Principal Researcher;Principal Researcher", "bibtex": "@misc{\nchen2024lebd,\ntitle={Le{BD}: A Run-time Defense Against Backdoor Attack in {YOLO}},\nauthor={Kai Chen and Weijun Shan and Xin Li and XUE YANG and Qing Li and Jun Yu},\nyear={2024},\nurl={https://openreview.net/forum?id=7vKWg2Vdrs}\n}", "github": "", "project": "", "reviewers": "dW4R;JMJB;4B6q;9mm5", "site": "https://openreview.net/forum?id=7vKWg2Vdrs", "pdf_size": 43049579, "rating": "1;3;3;6", "confidence": "5;5;4;3", "soundness": "1;3;3;3", "contribution": "1;2;1;3", "presentation": "2;2;3;3", "wc_summary": "78;53;72;40", "wc_strengths": "17;56;26;41", "wc_weaknesses": "57;149;172;344", "wc_questions": "87;9;6;64", "wc_review": "239;267;276;489", "wc_reply_reviewers": "0;123;85;0", "wc_reply_authors": "388;619;505;811", "reply_reviewers": "0;1;1;0", "reply_authors": "1;1;1;1", "rating_avg": [ 3.25, 1.7853571071357126 ], "confidence_avg": [ 4.25, 0.82915619758885 ], "soundness_avg": [ 2.5, 0.8660254037844386 ], "contribution_avg": [ 1.75, 0.82915619758885 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 60.75, 15.122417134836613 ], "wc_strengths_avg": [ 35.0, 14.849242404917497 ], "wc_weaknesses_avg": [ 180.5, 103.74126469250315 ], "wc_questions_avg": [ 41.5, 34.97499106504532 ], "wc_review_avg": [ 317.75, 99.80825366671837 ], "wc_reply_reviewers_avg": [ 52.0, 53.70754136990447 ], "wc_reply_authors_avg": [ 580.75, 156.0198304703604 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.8866206949335731, "gs_citation": 0, "gs_cited_by_link": 
"https://scholar.google.com/scholar?q=related:9dgrYx05OTEJ:scholar.google.com/&scioq=LeBD:+A+Run-time+Defense+Against+Backdoor+Attack+in+YOLO&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "Fudan University", "aff_unique_dep": "", "aff_unique_url": "https://www.fudan.edu.cn", "aff_unique_abbr": "Fudan", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "China" }, { "title": "Rethinking and Extending the Probabilistic Inference Capacity of GNNs", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19345", "id": "7vVWiCrFnd", "author_site": "Tuo Xu, Lei Zou", "tldr": "", "abstract": "Designing expressive Graph Neural Networks (GNNs) is an important topic in graph machine learning fields. Despite the existence of numerous approaches proposed to enhance GNNs based on Weisfeiler-Lehman (WL) tests, what GNNs can and cannot learn still lacks a deeper understanding. This paper adopts a fundamentally different approach to examine the expressive power of GNNs from a probabilistic perspective. By establishing connections between GNNs' predictions and the central inference problems of probabilistic graphical models (PGMs), we can analyze previous GNN variants with a novel hierarchical framework and gain new insights into their node-level and link-level behaviors. Additionally, we introduce novel methods that can provably enhance GNNs' ability to capture complex dependencies and make complex predictions. Experiments on both synthetic and real-world datasets demonstrate the effectiveness of our approaches.", "keywords": "graph neural networks;expressiveness;approximate inference", "primary_area": "learning on graphs and other geometries & topologies", "supplementary_material": "/attachment/54841c69346bbc60258f7a6556c00bfbb49e79f7.zip", "author": "Tuo Xu;Lei Zou", "authorids": "~Tuo_Xu1;~Lei_Zou2", "gender": "M;M", "homepage": "https://github.com/doujzc;https://www.wict.pku.edu.cn/zoulei/", "dblp": ";81/3390-1.html", "google_scholar": ";", "orcid": ";0000-0002-8586-4400", "linkedin": ";", "or_profile": "~Tuo_Xu1;~Lei_Zou2", "aff": "Peking University;Peking University", "aff_domain": "pku.edu.cn;pku.edu.cn", "position": "MS student;Full Professor", "bibtex": "@inproceedings{\nxu2024rethinking,\ntitle={Rethinking and Extending the Probabilistic Inference Capacity of {GNN}s},\nauthor={Tuo Xu and Lei Zou},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=7vVWiCrFnd}\n}", "github": "", "project": "", "reviewers": "G6RK;G9eq;rfPW;jjG1;ubyE", "pdf_size": 875277, "rating": "5;6;6;8;8", "confidence": "3;3;2;3;2", "soundness": "3;3;3;3;3", "contribution": "2;2;3;3;3", "presentation": "3;3;3;3;2", "wc_summary": "95;150;65;80;135", "wc_strengths": "86;60;56;92;68", "wc_weaknesses": "254;61;40;263;82", "wc_questions": "140;108;5;4;60", "wc_review": "575;379;166;439;345", "wc_reply_reviewers": "0;16;0;0;0", "wc_reply_authors": "1673;818;434;462;332", "reply_reviewers": "0;1;0;0;0", "reply_authors": "3;2;1;1;1", "rating_avg": [ 6.6, 1.2 ], "confidence_avg": [ 2.6, 0.4898979485566356 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.6, 0.4898979485566356 ], "presentation_avg": [ 2.8, 0.39999999999999997 ], "wc_summary_avg": [ 105.0, 32.4037034920393 ], "wc_strengths_avg": [ 72.4, 14.22111106770494 ], "wc_weaknesses_avg": [ 140.0, 97.70363350459388 ], "wc_questions_avg": [ 63.4, 54.41911428900694 ], 
"wc_review_avg": [ 380.8, 133.05998647226747 ], "wc_reply_reviewers_avg": [ 3.2, 6.400000000000001 ], "wc_reply_authors_avg": [ 743.8, 492.7240201167384 ], "reply_reviewers_avg": [ 0.2, 0.4000000000000001 ], "reply_authors_avg": [ 1.6, 0.8 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.2721655269759087, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=9428183867229033194&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 2, "openreview": "https://openreview.net/forum?id=7vVWiCrFnd", "pdf": "https://openreview.net/pdf?id=7vVWiCrFnd", "email": "pku.edu.cn;pku.edu.cn", "author_num": 2, "aff_unique_index": "0;0", "aff_unique_norm": "Peking University", "aff_unique_dep": "", "aff_unique_url": "http://www.pku.edu.cn", "aff_unique_abbr": "Peking U", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "China" }, { "id": "7vnKTsj66A", "title": "When Self-Supervised Learning Meets Unbounded Pseudo-Label Generation", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Self-supervised learning (SSL) has demonstrated strong generalization abilities across diverse downstream tasks. However, it is difficult for SSL to accurately gather samples of the same category and separate samples of different categories in the training stage. In this paper, we present a novel approach of generating pseudo-labels for augmented samples to regulate their feature-space relationships. To align the pseudo-label space with the ground-truth label space, we propose an instance-level pseudo-label generation mechanism. Building upon our observations that pseudo-labels can encompass unbounded label noise and that learning remains robust to such noise in the early stages of training, we propose Precise Adjustment Regularization (PAR) for precise dynamic relationship mining. Finally, we propose a PAR-based bi-level optimization learning mechanism mechanism (PBOLM) to promote high-quality representations in SSL. Theoretically, from a data generation perspective, we demonstrate that the proposed PBOLM is more conducive to extracting critical generative factors in data generation. 
Empirically, based on various downstream tasks, we demonstrate that PBOLM can be considered a plug-and-play module to enhance the performance of SSL methods.", "keywords": "Self-supervised learning;contrastive learning;representation learning;bi-level optimization", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Wenwen Qiang;Lingyu Si;Jie Hu;Jiangmeng Li;Changwen Zheng;Fuchun Sun;Hui Xiong", "authorids": "~Wenwen_Qiang1;~Lingyu_Si1;~Jie_Hu4;~Jiangmeng_Li1;~Changwen_Zheng1;~Fuchun_Sun1;~Hui_Xiong1", "gender": "M;M;M;M;M;M;M", "homepage": ";;https://jiangmengli.github.io/;http://people.ucas.ac.cn/~cwzheng;https://www.cs.tsinghua.edu.cn/info/1121/3555.htm;https://www.hkust-gz.edu.cn/people/hui-xiong/;", "dblp": "261/6913;298/0368;293/0997;81/2728;;262/1686-1.html;90/5064-19", "google_scholar": "https://scholar.google.com/citations?hl=zh-CN;;https://scholar.google.com.sg/citations?user=-kU4VLcAAAAJ;-lErK1QAAAAJ;;cVDF1tkAAAAJ;DAJdHnkAAAAJ", "orcid": "0000-0002-7985-5743;0000-0002-7735-6676;0000-0002-3376-1522;0000-0002-2311-6757;;0000-0001-6016-6465;0000-0002-5150-1003", "linkedin": ";;jiangmeng-li-86aaa7125/;;;;%E6%9D%B0-%E8%83%A1-97093710a/", "or_profile": "~Wenwen_Qiang1;~Lingyu_Si1;~Jiangmeng_Li1;~Changwen_Zheng1;~Fuchun_Sun1;~Hui_Xiong1;~Jie_Hu3", "aff": "Institute of Software Chinese Academy of Sciences;Institute of Software Chinese Academy of Sciences;Institute of Software, Chinese Academy of Sciences;Institute of Software, Chinese Academy of Sciences;Tsinghua University;Hong Kong University of Science and Technology (Guangzhou);Meituan", "aff_domain": "iscas.ac.cn;iscas.ac.cn;iscas.ac.cn;iscas.ac.cn;cs.tsinghua.edu.cn;hkust.edu;meituan.com", "position": "Assistant Professor;Associate Professor;Assistant Professor;Full Professor;Full Professor;Full Professor;Principal Researcher", "bibtex": "@misc{\nqiang2024when,\ntitle={When Self-Supervised Learning Meets Unbounded Pseudo-Label Generation},\nauthor={Wenwen Qiang and Lingyu Si and Jie Hu and Jiangmeng Li and Changwen Zheng and Fuchun Sun and Hui Xiong},\nyear={2024},\nurl={https://openreview.net/forum?id=7vnKTsj66A}\n}", "github": "", "project": "", "reviewers": "fBvz;bjmg;ZMGw", "site": "https://openreview.net/forum?id=7vnKTsj66A", "pdf_size": 400215, "rating": "3;5;5", "confidence": "4;2;4", "soundness": "3;3;2", "contribution": "2;2;2", "presentation": "2;2;2", "wc_summary": "64;92;128", "wc_strengths": "49;33;88", "wc_weaknesses": "220;193;148", "wc_questions": "5;12;19", "wc_review": "338;330;383", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 4.333333333333333, 0.9428090415820634 ], "confidence_avg": [ 3.3333333333333335, 0.9428090415820634 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.0, 0.0 ], "wc_summary_avg": [ 94.66666666666667, 26.195843605851334 ], "wc_strengths_avg": [ 56.666666666666664, 23.098821518760552 ], "wc_weaknesses_avg": [ 187.0, 29.698484809834994 ], "wc_questions_avg": [ 12.0, 5.715476066494082 ], "wc_review_avg": [ 350.3333333333333, 23.32857094256359 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 3, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.5, "gs_citation": 0, "gs_cited_by_link": 
"https://scholar.google.com/scholar?q=related:YMKnU--v9AMJ:scholar.google.com/&scioq=When+Self-Supervised+Learning+Meets+Unbounded+Pseudo-Label+Generation&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;0;0;1;2;3", "aff_unique_norm": "Chinese Academy of Sciences;Tsinghua University;Hong Kong University of Science and Technology;Meituan", "aff_unique_dep": "Institute of Software;;;", "aff_unique_url": "http://www.is.cas.cn;https://www.tsinghua.edu.cn;https://www.ust.hk;https://www.meituan.com", "aff_unique_abbr": "CAS;THU;HKUST;Meituan", "aff_campus_unique_index": "1", "aff_campus_unique": ";Hong Kong SAR", "aff_country_unique_index": "0;0;0;0;0;0;0", "aff_country_unique": "China" }, { "id": "7vzyqs8UbA", "title": "LMCC-MBC: Metric-Constrained Model-Based Clustering with Wasserstein-2 Distance of Gaussian Markov Random Fields", "track": "main", "status": "Reject", "tldr": "", "abstract": "A wide range of temporal (1D) and spatial (2D) data analysis problems can be formulated as model-based clustering problems given metric constraints. For example, subsequence clustering of multivariate time series is constrained by 1D temporal continuity, while urban functional area identification is constrained by the spatial proximity in the 2D space. Existing works model such metric constraints independent of the model estimation process, failing to leverage the correlation between adjacent estimated models and their locations in the metric space. To solve this problem we propose a novel metric-constrained model-based clustering algorithm LMCC-MBC that softly requires the Wasserstein-2 distance between estimated model parameters (such as those of Gaussian Markov Random Fields) to be a locally monotonic continuous function of the metric distance. We theoretically prove that satisfaction of this requirement guarantees intra-cluster cohesion and inter-cluster separation. Moreover, without explicitly optimizing log-likelihood LMCC-MBC voids the expensive EM-step that is needed by previous approaches (e.g., TICC and STICC), and enables faster and more stable clustering. 
Experiments on both 1D and 2D synthetic as well as real-world datasets demonstrate that our algorithm successfully captures the latent correlation between the estimated models and the metric constraints, and outperforms strong baselines by a margin up to 14.3% in ARI (Adjusted Rand Index) and 32.1% in NMI (Normalized Mutual Information).", "keywords": "unsupervised learning;clustering;model-based clustering;metric-constrained clustering", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/0940559c62d56eef5dab3517bf8141b275d6cf62.zip", "author": "Zhangyu Wang;Gengchen Mai;Krzysztof Janowicz;Ni Lao", "authorids": "~Zhangyu_Wang1;~Gengchen_Mai1;~Krzysztof_Janowicz2;~Ni_Lao1", "gender": ";M;;M", "homepage": ";https://gengchenmai.github.io/;;http://www.cs.cmu.edu/~nlao", "dblp": ";151/5583;95/5567;82/283", "google_scholar": "8vNk5Z8AAAAJ;X2Wfl1UAAAAJ;;iUgWR3MAAAAJ", "orcid": ";0000-0002-7818-7309;;0000-0002-4034-7784", "linkedin": "zhangyu-wang-26aab0170/;gengchen-mai-144439121/;;ni-lao", "or_profile": "~Zhangyu_Wang1;~Gengchen_Mai1;~Krzysztof_Janowicz2;~Ni_Lao1", "aff": "University of California, Santa Barbara;University of Georgia;UC Santa Barbara;Google", "aff_domain": "ucsb.edu;uga.edu;ucsb.edu;google.com", "position": "PhD student;Assistant Professor;Full Professor;Researcher", "bibtex": "@misc{\nwang2024lmccmbc,\ntitle={{LMCC}-{MBC}: Metric-Constrained Model-Based Clustering with Wasserstein-2 Distance of Gaussian Markov Random Fields},\nauthor={Zhangyu Wang and Gengchen Mai and Krzysztof Janowicz and Ni Lao},\nyear={2024},\nurl={https://openreview.net/forum?id=7vzyqs8UbA}\n}", "github": "", "project": "", "reviewers": "FzKt;cTE9;FyBz", "site": "https://openreview.net/forum?id=7vzyqs8UbA", "pdf_size": 1404434, "rating": "5;6;6", "confidence": "2;5;3", "soundness": "2;3;2", "contribution": "1;3;2", "presentation": "3;2;3", "wc_summary": "71;133;166", "wc_strengths": "45;44;119", "wc_weaknesses": "221;189;186", "wc_questions": "1;2;163", "wc_review": "338;368;634", "wc_reply_reviewers": "0;59;0", "wc_reply_authors": "460;614;415", "reply_reviewers": "0;1;0", "reply_authors": "1;2;1", "rating_avg": [ 5.666666666666667, 0.4714045207910317 ], "confidence_avg": [ 3.3333333333333335, 1.247219128924647 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.816496580927726 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 123.33333333333333, 39.38132665222045 ], "wc_strengths_avg": [ 69.33333333333333, 35.122009560324926 ], "wc_weaknesses_avg": [ 198.66666666666666, 15.839472494022298 ], "wc_questions_avg": [ 55.333333333333336, 76.13292469242346 ], "wc_review_avg": [ 446.6666666666667, 133.02965417112415 ], "wc_reply_reviewers_avg": [ 19.666666666666668, 27.812866726670865 ], "wc_reply_authors_avg": [ 496.3333333333333, 85.20693764138119 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 1.3333333333333333, 0.4714045207910317 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.7559289460184542, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:JgrvziXnTrwJ:scholar.google.com/&scioq=LMCC-MBC:+Metric-Constrained+Model-Based+Clustering+with+Wasserstein-2+Distance+of+Gaussian+Markov+Random+Fields&hl=en&as_sdt=0,14", "gs_version_total": 0, "aff_unique_index": "0;1;0;2", "aff_unique_norm": "University of California, Santa Barbara;University of Georgia;Google", 
"aff_unique_dep": ";;Google", "aff_unique_url": "https://www.ucsb.edu;https://www.uga.edu;https://www.google.com", "aff_unique_abbr": "UCSB;UGA;Google", "aff_campus_unique_index": "0;0;2", "aff_campus_unique": "Santa Barbara;;Mountain View", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "title": "Cauchy-Schwarz Divergence Information Bottleneck for Regression", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19344", "id": "7wY67ZDQTE", "author_site": "Shujian Yu, Xi Yu, Sigurd L\u00f8kse, Robert Jenssen, Jose Principe", "tldr": "", "abstract": "The information bottleneck (IB) approach is popular to improve the generalization, robustness and explainability of deep neural networks. Essentially, it aims to find a minimum sufficient representation $\\mathbf{t}$ by striking a trade-off between a compression term $I(\\mathbf{x};\\mathbf{t})$ and a prediction term $I(y;\\mathbf{t})$, where $I(\\cdot;\\cdot)$ refers to the mutual information (MI). MI is for the IB for the most part expressed in terms of the Kullback-Leibler (KL) divergence, which in the regression case corresponds to prediction based on mean squared error (MSE) loss with Gaussian assumption and compression approximated by variational inference. \nIn this paper, we study the IB principle for the regression problem and develop a new way to parameterize the IB with deep neural networks by exploiting favorable properties of the Cauchy-Schwarz (CS) divergence. By doing so, we move away from MSE-based regression and ease estimation by avoiding variational approximations or distributional assumptions. We investigate the improved generalization ability of our proposed CS-IB and demonstrate strong adversarial robustness guarantees. We demonstrate its superior performance on six real-world regression tasks over other popular deep IB approaches. We additionally observe that the solutions discovered by CS-IB always achieve the best trade-off between prediction accuracy and compression ratio in the information plane. 
The code is available at \\url{https://github.com/SJYuCNEL/Cauchy-Schwarz-Information-Bottleneck}.", "keywords": "Information Bottleneck;Cauchy-Schwarz Divergence;Regression", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/f2602b561c7a9045ae501b67e9061b0c34bdb59b.zip", "author": "Shujian Yu;Xi Yu;Sigurd L\u00f8kse;Robert Jenssen;Jose C Principe", "authorids": "~Shujian_Yu1;~Xi_Yu1;~Sigurd_L\u00f8kse1;~Robert_Jenssen1;~Jose_C_Principe1", "gender": "M;M;M;M;M", "homepage": "https://sjyucnel.github.io/;https://www.bnl.gov/staff/xyu1;;https://uit.no/ansatte/robert.jenssen;http://www.cnel.ufl.edu", "dblp": "154/5763.html;;163/4540;45/5813;", "google_scholar": "O8kpnMoAAAAJ;;7nKP_jYAAAAJ;HiviXjIAAAAJ;", "orcid": ";0000-0002-2029-1680;0000-0002-1953-4315;0000-0002-7496-8474;", "linkedin": ";;;robert-jenssen-10b79318/?originalSubdomain=no;", "or_profile": "~Shujian_Yu1;~Xi_Yu1;~Sigurd_L\u00f8kse1;~Robert_Jenssen1;~Jose_C_Principe1", "aff": "University of Troms\u00f8;Brookhaven National Laboratory;NORCE Norwegian Research Centre;UiT The Arctic University of Norway;", "aff_domain": "uit.no;bnl.gov;norceresearch.no;uit.no;", "position": "Guest Associate Professor;Postdoc;Researcher;Full Professor;", "bibtex": "@inproceedings{\nyu2024cauchyschwarz,\ntitle={Cauchy-Schwarz Divergence Information Bottleneck for Regression},\nauthor={Shujian Yu and Xi Yu and Sigurd L{\\o}kse and Robert Jenssen and Jose C Principe},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=7wY67ZDQTE}\n}", "github": "", "project": "", "reviewers": "MhfL;aubm;uyPi;zqzB;SV68", "pdf_size": 2257629, "rating": "5;6;6;6;6", "confidence": "4;4;2;2;4", "soundness": "3;2;3;3;4", "contribution": "2;3;3;2;3", "presentation": "2;3;3;3;3", "wc_summary": "148;62;77;47;70", "wc_strengths": "151;79;40;39;39", "wc_weaknesses": "1217;497;106;78;91", "wc_questions": "435;2;3;50;22", "wc_review": "1951;640;226;214;222", "wc_reply_reviewers": "121;16;26;0;0", "wc_reply_authors": "1847;1205;204;478;386", "reply_reviewers": "1;1;1;0;0", "reply_authors": "3;3;1;1;1", "rating_avg": [ 5.8, 0.39999999999999997 ], "confidence_avg": [ 3.2, 0.9797958971132712 ], "soundness_avg": [ 3.0, 0.6324555320336759 ], "contribution_avg": [ 2.6, 0.4898979485566356 ], "presentation_avg": [ 2.8, 0.39999999999999997 ], "wc_summary_avg": [ 80.8, 35.05082024717824 ], "wc_strengths_avg": [ 69.6, 43.50448252766604 ], "wc_weaknesses_avg": [ 397.8, 438.7424757189575 ], "wc_questions_avg": [ 102.4, 167.20837299609133 ], "wc_review_avg": [ 650.6, 670.1873170987348 ], "wc_reply_reviewers_avg": [ 32.6, 45.297240534054616 ], "wc_reply_authors_avg": [ 824.0, 614.4346995409683 ], "reply_reviewers_avg": [ 0.6, 0.48989794855663565 ], "reply_authors_avg": [ 1.8, 0.9797958971132713 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.408248290463863, "gs_citation": 6, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12295463531972727817&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=7wY67ZDQTE", "pdf": "https://openreview.net/pdf?id=7wY67ZDQTE", "email": "uit.no;bnl.gov;norceresearch.no;uit.no;", "author_num": 5, "aff_unique_index": "0;1;2;3", "aff_unique_norm": "University of Troms\u00f8;Brookhaven National Laboratory;NORCE Norwegian Research Centre;Arctic University of Norway", "aff_unique_dep": ";;;", 
"aff_unique_url": "https://uit.no;https://www.bnl.gov;https://www.norce.no;https://www.uit.no", "aff_unique_abbr": "UIT;BNL;NORCE;UiT", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;0;0", "aff_country_unique": "Norway;United States" }, { "id": "7yyAoyfVEC", "title": "Hypothesis- and Structure-based prompting for medical and business diagnosis", "track": "main", "status": "Reject", "tldr": "", "abstract": "In real-world scenarios like healthcare and business, tackling many-to-one problems is challenging but crucial. Take medical diagnosis: A patient's chief complaint can be caused by various diseases, yet time and resource constraints make identifying the cause via difficult.\nTo tackle these issues, our study introduces Hypothesis-based and Structure-based (HS) prompting, a method designed to enhance the problem-solving capabilities of Large Language Models (LLMs). Our approach starts by efficiently breaking down the problem space using a Mutually Exclusive and Collectively Exhaustive (MECE) framework. Armed with this structure, LLMs generate, prioritize, and validate hypotheses through targeted questioning and data collection. The ability to ask the right questions is crucial for pinpointing the root cause of a problem accurately. We provide an easy-to-follow guide for crafting examples, enabling users to develop tailored HS prompts for specific tasks. We validate our method through diverse case studies in business consulting and medical diagnosis, which are further evaluated by domain experts. Interestingly, adding one sentence ``You can request one data in each response if needed'' initiates human interaction and improves performance.", "keywords": "Large Language Models;Prompting method;Medical diagnosis;Business consulting application", "primary_area": "generative models", "supplementary_material": "/attachment/b1902f38586375c759a0a65d630345a9f41ec8ad.pdf", "author": "Juyeon Heo;Kyunghyun Lee;Hyonkeun Joh;Umang Bhatt;Adrian Weller", "authorids": "~Juyeon_Heo1;~Kyunghyun_Lee3;~Hyonkeun_Joh1;~Umang_Bhatt1;~Adrian_Weller1", "gender": "F;M;M;M;M", "homepage": "https://sites.google.com/view/juyeonheo/%ED%99%88;https://www.linkedin.com/in/kyunghyun-kh-lee-5148bb232/;;https://umangsbhatt.github.io;http://mlg.eng.cam.ac.uk/adrian/", "dblp": ";;;207/7955;73/8324", "google_scholar": ";;;https://scholar.google.com/citations?hl=en;https://scholar.google.co.uk/citations?user=Ek4hM10AAAAJ", "orcid": ";;0000-0001-9163-8859;;", "linkedin": ";;;umangsbhatt/;", "or_profile": "~Juyeon_Heo1;~Kyunghyun_Lee3;~Hyonkeun_Joh1;~Umang_Bhatt1;~Adrian_Weller1", "aff": "University of Cambridge;;Yonsei University;New York University;University of Cambridge", "aff_domain": "cam.ac.uk;;yonsei.ac.kr;nyu.edu;cam.ac.uk", "position": "PhD student;;PhD student;Assistant Professor;Principal Researcher", "bibtex": "@misc{\nheo2024hypothesis,\ntitle={Hypothesis- and Structure-based prompting for medical and business diagnosis},\nauthor={Juyeon Heo and Kyunghyun Lee and Hyonkeun Joh and Umang Bhatt and Adrian Weller},\nyear={2024},\nurl={https://openreview.net/forum?id=7yyAoyfVEC}\n}", "github": "", "project": "", "reviewers": "hnXU;ueoZ;HT4V;y4hX", "site": "https://openreview.net/forum?id=7yyAoyfVEC", "pdf_size": 463113, "rating": "1;3;3;3", "confidence": "4;4;3;2", "soundness": "1;3;2;3", "contribution": "1;2;2;2", "presentation": "2;3;3;2", "wc_summary": "312;75;89;75", "wc_strengths": "19;17;45;110", "wc_weaknesses": "369;155;157;113", "wc_questions": "42;3;92;168", "wc_review": 
"742;250;383;466", "wc_reply_reviewers": "260;23;71;0", "wc_reply_authors": "884;706;775;742", "reply_reviewers": "2;1;1;0", "reply_authors": "3;2;2;1", "rating_avg": [ 2.5, 0.8660254037844386 ], "confidence_avg": [ 3.25, 0.82915619758885 ], "soundness_avg": [ 2.25, 0.82915619758885 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 137.75, 100.76550749140303 ], "wc_strengths_avg": [ 47.75, 37.599035891894886 ], "wc_weaknesses_avg": [ 198.5, 99.99374980467529 ], "wc_questions_avg": [ 76.25, 61.653771174195015 ], "wc_review_avg": [ 460.25, 179.99218733045055 ], "wc_reply_reviewers_avg": [ 88.5, 102.27536360238472 ], "wc_reply_authors_avg": [ 776.75, 66.55589755987069 ], "reply_reviewers_avg": [ 1.0, 0.7071067811865476 ], "reply_authors_avg": [ 2.0, 0.7071067811865476 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.5222329678670935, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:uNpwW_eFtD0J:scholar.google.com/&scioq=Hypothesis-+and+Structure-based+prompting+for+medical+and+business+diagnosis&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;1;2;0", "aff_unique_norm": "University of Cambridge;Yonsei University;New York University", "aff_unique_dep": ";;", "aff_unique_url": "https://www.cam.ac.uk;https://www.yonsei.ac.kr;https://www.nyu.edu", "aff_unique_abbr": "Cambridge;Yonsei;NYU", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Cambridge;", "aff_country_unique_index": "0;1;2;0", "aff_country_unique": "United Kingdom;South Korea;United States" }, { "title": "Free from Bellman Completeness: Trajectory Stitching via Model-based Return-conditioned Supervised Learning", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19343", "id": "7zY781bMDO", "author_site": "Zhaoyi Zhou, Chuning Zhu, Runlong Zhou, Qiwen Cui, Abhishek Gupta, Simon Du", "tldr": "", "abstract": "Off-policy dynamic programming (DP) techniques such as $Q$-learning have proven to be important in sequential decision-making problems. In the presence of function approximation, however, these techniques often diverge due to the absence of Bellman completeness in the function classes considered, a crucial condition for the success of DP-based methods. In this paper, we show how off-policy learning techniques based on return-conditioned supervised learning (RCSL) are able to circumvent these challenges of Bellman completeness, converging under significantly more relaxed assumptions inherited from supervised learning. We prove there exists a natural environment in which if one uses two-layer multilayer perceptron as the function approximator, the layer width needs to grow *linearly* with the state space size to satisfy Bellman completeness while a constant layer width is enough for RCSL. These findings take a step towards explaining the superior empirical performance of RCSL methods compared to DP-based methods in environments with near-optimal datasets. Furthermore, in order to learn from sub-optimal datasets, we propose a simple framework called MBRCSL, granting RCSL methods the ability of dynamic programming to stitch together segments from distinct trajectories. MBRCSL leverages learned dynamics models and forward sampling to accomplish trajectory stitching while avoiding the need for Bellman completeness that plagues all dynamic programming algorithms. 
We propose both theoretical analysis and experimental evaluation to back these claims, outperforming state-of-the-art model-free and model-based offline RL algorithms across several simulated robotics problems.", "keywords": "Offline Reinforcement Learning;Return-Conditioned Supervised Learning;Bellman Completeness;Trajectory Stitching", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Zhaoyi Zhou;Chuning Zhu;Runlong Zhou;Qiwen Cui;Abhishek Gupta;Simon Shaolei Du", "authorids": "~Zhaoyi_Zhou1;~Chuning_Zhu1;~Runlong_Zhou1;~Qiwen_Cui1;~Abhishek_Gupta1;~Simon_Shaolei_Du1", "gender": "M;M;M;M;M;M", "homepage": "https://zhaoyizhou1123.github.io/;https://homes.cs.washington.edu/~zchuning/;https://vectorzhou.com;;https://homes.cs.washington.edu/~abhgupta/;http://simonshaoleidu.com", "dblp": "211/3392;295/9468;290/8755;276/6268;18/6404-4;176/5602", "google_scholar": "9fPuoP4AAAAJ;;https://scholar.google.com/citations?hl=en;AnSVkUYAAAAJ;1wLVDP4AAAAJ;OttawxUAAAAJ", "orcid": ";;;;;", "linkedin": ";chuning-zhu-39b086167/;;;;", "or_profile": "~Zhaoyi_Zhou1;~Chuning_Zhu1;~Runlong_Zhou1;~Qiwen_Cui1;~Abhishek_Gupta1;~Simon_Shaolei_Du1", "aff": "Tsinghua University;University of Washington;Department of Computer Science, University of Washington;Department of Computer Science, University of Washington;University of Washington;University of Washington", "aff_domain": "tsinghua.edu.cn;cs.washington.edu;cs.washington.edu;cs.washington.edu;uw.edu;washington.edu", "position": "Undergrad student;PhD student;PhD student;PhD student;Assistant Professor;Assistant Professor", "bibtex": "@inproceedings{\nzhou2024free,\ntitle={Free from Bellman Completeness: Trajectory Stitching via Model-based Return-conditioned Supervised Learning},\nauthor={Zhaoyi Zhou and Chuning Zhu and Runlong Zhou and Qiwen Cui and Abhishek Gupta and Simon Shaolei Du},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=7zY781bMDO}\n}", "github": "", "project": "", "reviewers": "HXBB;YXKR;BsaB;9pmM", "pdf_size": 1132711, "rating": "5;5;6;8", "confidence": "5;3;3;4", "soundness": "3;2;3;3", "contribution": "3;2;3;3", "presentation": "3;3;3;4", "wc_summary": "160;104;92;66", "wc_strengths": "59;57;122;106", "wc_weaknesses": "33;30;114;97", "wc_questions": "291;234;182;250", "wc_review": "543;425;510;519", "wc_reply_reviewers": "0;147;21;39", "wc_reply_authors": "1813;1614;617;1161", "reply_reviewers": "0;2;1;1", "reply_authors": "4;5;1;2", "rating_avg": [ 6.0, 1.224744871391589 ], "confidence_avg": [ 3.75, 0.82915619758885 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 105.5, 34.332928800205785 ], "wc_strengths_avg": [ 86.0, 28.574464124459098 ], "wc_weaknesses_avg": [ 68.5, 37.5 ], "wc_questions_avg": [ 239.25, 39.04724702203729 ], "wc_review_avg": [ 499.25, 44.53299338692606 ], "wc_reply_reviewers_avg": [ 51.75, 56.69821425759368 ], "wc_reply_authors_avg": [ 1301.25, 460.3174855466605 ], "reply_reviewers_avg": [ 1.0, 0.7071067811865476 ], "reply_authors_avg": [ 3.0, 1.5811388300841898 ], "replies_avg": [ 23, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 9, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=17828791884504357290&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=7zY781bMDO", "pdf": 
"https://openreview.net/pdf?id=7zY781bMDO", "email": "tsinghua.edu.cn;cs.washington.edu;cs.washington.edu;cs.washington.edu;uw.edu;washington.edu", "author_num": 6, "aff_unique_index": "0;1;1;1;1;1", "aff_unique_norm": "Tsinghua University;University of Washington", "aff_unique_dep": ";", "aff_unique_url": "https://www.tsinghua.edu.cn;https://www.washington.edu", "aff_unique_abbr": "THU;UW", "aff_campus_unique_index": "1;1", "aff_campus_unique": ";Seattle", "aff_country_unique_index": "0;1;1;1;1;1", "aff_country_unique": "China;United States" }, { "id": "7zxGHwe7Vw", "title": "FedAnchor: Enhancing Federated Semi-Supervised Learning with Label Contrastive Loss", "track": "main", "status": "Reject", "tldr": "", "abstract": "Federated learning (FL) is a distributed learning paradigm that allows devices to collaboratively train a shared global model while keeping the data locally. Due to the nature of FL, it provides access to an astonishing amount of training data for meaningful research and applications. However, the assumption that all of these private data samples include correct and complete annotations is not realistic for real-world applications. Federated Semi-Supervised Learning (FSSL) provides a powerful approach for training models on a large amount of data without requiring all data points to be completely labeled. In this paper, we propose FedAnchor, an innovative method that tackles the label-at-server FSSL scenario where the server maintains a limited amount of labeled data, while clients' private data remain unlabeled. FedAnchor introduces a unique double-head structure, with one anchor head attached with a newly designed label contrastive loss based on the cosine similarity to train on labeled anchor data to provide better pseudo-labels for faster convergence and higher performance. Following this approach, we alleviate the confirmation bias and over-fitting easy-to-learn data problems coming from pseudo-labeling based on high-confidence model prediction samples. 
We conduct extensive experiments on three different datasets and demonstrate our method can outperform the state-of-the-art method by a significant margin, both in terms of convergence rate and model accuracy.", "keywords": "Federated Learning;Semi-supervised Learning", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Xinchi Qiu;Yan Gao;Lorenzo Sani;Heng Pan;Wanru Zhao;Pedro Porto Buarque de Gusmao;Nicholas Donald Lane", "authorids": "~Xinchi_Qiu1;~Yan_Gao4;~Lorenzo_Sani1;~Heng_Pan2;~Wanru_Zhao1;~Pedro_Porto_Buarque_de_Gusmao1;~Nicholas_Donald_Lane1", "gender": "F;M;M;;;M;", "homepage": ";https://www.cst.cam.ac.uk/people/yg381;https://relogu.github.io/;;;https://portobgusmao.com/;", "dblp": "265/6559;;237/2312;;;88/10808;", "google_scholar": "yW6vsS8AAAAJ;https://scholar.google.com/citations?hl=en;IoCEzUMAAAAJ;;;https://scholar.google.it/citations?user=TfdVttMAAAAJ;", "orcid": ";;;;;0000-0002-7072-9898;", "linkedin": "xinchi-qiu-686a7394/;;;heng-pan-117915247/;;pedropgusmao;", "or_profile": "~Xinchi_Qiu1;~Yan_Gao4;~Lorenzo_Sani1;~Heng_Pan2;~Wanru_Zhao1;~Pedro_Porto_Buarque_de_Gusmao1;~Nicholas_Donald_Lane1", "aff": "University of Cambridge;University of Cambridge;University of Cambridge;University of Cambridge;;University of Surrey;", "aff_domain": "cam.ac.uk;cam.ac.uk;cam.ac.uk;cam.ac.uk;;surrey.ac.uk;", "position": "PhD student;PhD student;PhD student;Researcher;;Lecturer;", "bibtex": "@misc{\nqiu2024fedanchor,\ntitle={FedAnchor: Enhancing Federated Semi-Supervised Learning with Label Contrastive Loss},\nauthor={Xinchi Qiu and Yan Gao and Lorenzo Sani and Heng Pan and Wanru Zhao and Pedro Porto Buarque de Gusmao and Nicholas Donald Lane},\nyear={2024},\nurl={https://openreview.net/forum?id=7zxGHwe7Vw}\n}", "github": "", "project": "", "reviewers": "6dEL;LCsM;WkFS;wVdB", "site": "https://openreview.net/forum?id=7zxGHwe7Vw", "pdf_size": 8124750, "rating": "3;3;3;5", "confidence": "4;3;4;3", "soundness": "3;2;2;2", "contribution": "2;2;2;2", "presentation": "1;1;3;3", "wc_summary": "81;56;100;83", "wc_strengths": "13;7;38;155", "wc_weaknesses": "493;156;127;367", "wc_questions": "9;42;3;5", "wc_review": "596;261;268;610", "wc_reply_reviewers": "85;17;91;0", "wc_reply_authors": "394;287;475;314", "reply_reviewers": "1;1;2;0", "reply_authors": "2;2;2;2", "rating_avg": [ 3.5, 0.8660254037844386 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.0, 1.0 ], "wc_summary_avg": [ 80.0, 15.700318468107582 ], "wc_strengths_avg": [ 53.25, 59.88478521294036 ], "wc_weaknesses_avg": [ 285.75, 151.31981859624338 ], "wc_questions_avg": [ 14.75, 15.880412463157246 ], "wc_review_avg": [ 433.75, 169.34044850537038 ], "wc_reply_reviewers_avg": [ 48.25, 40.25776322648838 ], "wc_reply_authors_avg": [ 367.5, 73.4863932983515 ], "reply_reviewers_avg": [ 1.0, 0.7071067811865476 ], "reply_authors_avg": [ 2.0, 0.0 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:dUuKApYhJtsJ:scholar.google.com/&scioq=FedAnchor:+Enhancing+Federated+Semi-Supervised+Learning+with+Label+Contrastive+Loss&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;0;0;0;1", "aff_unique_norm": "University of Cambridge;University of Surrey", "aff_unique_dep": ";", "aff_unique_url": 
"https://www.cam.ac.uk;https://www.surrey.ac.uk", "aff_unique_abbr": "Cambridge;Surrey", "aff_campus_unique_index": "0;0;0;0", "aff_campus_unique": "Cambridge;", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "United Kingdom" }, { "id": "80faVLl6ji", "title": "BRIDGING THE GAP BETWEEN HUMAN MOTION AND ACTION SEMANTICS VIA KINEMATIC PHRASES", "track": "main", "status": "Reject", "tldr": "", "abstract": "The goal of motion understanding is to establish a reliable mapping between motion and action semantics, while it is a challenging many-to-many problem. An abstract action semantic (i.e., walk forwards) could be conveyed by perceptually diverse motions (walk with arms up or swinging), while a motion could carry different semantics w.r.t. its context and intention. This makes an elegant mapping between them difficult. Previous attempts adopted direct-mapping paradigms with limited reliability. Also, current automatic metrics fail to provide reliable assessments of the consistency between motions and action semantics. We identify the source of these problems as the significant gap between the two modalities. To alleviate this gap, we propose Kinematic Phrases (KP) that take the objective kinematic facts of human motion with proper abstraction, interpretability, and generality characteristics. Based on KP as a mediator, we can unify a motion knowledge base and build a motion understanding system. Meanwhile, KP can be automatically converted from motions and to text descriptions with no subjective bias, inspiring Kinematic Prompt Generation (KPG) as a novel automatic motion generation benchmark. In extensive experiments, our approach shows superiority over other methods. Our code and data would be made publicly available.", "keywords": "Motion generation;Motion representation", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/d431a6b69944d0b4e6b748affb4f09d388269107.zip", "author": "Xinpeng Liu;Yong-Lu Li;Ailing Zeng;Zizheng Zhou;Yang You;Cewu Lu", "authorids": "~Xinpeng_Liu1;~Yong-Lu_Li1;~Ailing_Zeng1;~Zizheng_Zhou1;~Yang_You2;~Cewu_Lu3", "gender": "M;M;F;M;M;M", "homepage": "https://foruck.github.io/;https://dirtyharrylyl.github.io/;https://ailingzeng.site/;https://darth-zzz.github.io;https://qq456cvb.github.io;https://www.mvig.org/", "dblp": "27/5719-2;198/9345;226/4720;;33/8167;", "google_scholar": "DBE-ju8AAAAJ;https://scholar.google.com.hk/citations?user=UExAaVgAAAAJ;Tn7fzS8AAAAJ;h_UN0qUAAAAJ;1YV1_KUAAAAJ;https://scholar.google.com.tw/citations?user=QZVQEWAAAAAJ", "orcid": "0000-0002-7525-3243;0000-0003-0478-0692;;;;", "linkedin": ";%E6%B0%B8%E9%9C%B2-%E6%9D%8E-991b99139/;%E7%88%B1%E7%8E%B2-%E6%9B%BE-65504112a/;;;", "or_profile": "~Xinpeng_Liu1;~Yong-Lu_Li1;~Ailing_Zeng1;~Zizheng_Zhou1;~Yang_You2;~Cewu_Lu3", "aff": "Shanghai Jiaotong University;Shanghai Jiaotong University;International Digital Economy Academy;Shanghai Jiaotong University;Stanford University;Shanghai Jiaotong University", "aff_domain": "sjtu.edu;sjtu.edu.cn;idea.edu.cn;sjtu.edu.cn;stanford.edu;sjtu.edu.cn", "position": "PhD student;Assistant Professor;Researcher;Undergrad student;Postdoc;Full Professor", "bibtex": "@misc{\nliu2024bridging,\ntitle={{BRIDGING} {THE} {GAP} {BETWEEN} {HUMAN} {MOTION} {AND} {ACTION} {SEMANTICS} {VIA} {KINEMATIC} {PHRASES}},\nauthor={Xinpeng Liu and Yong-Lu Li and Ailing Zeng and Zizheng Zhou and Yang You and Cewu Lu},\nyear={2024},\nurl={https://openreview.net/forum?id=80faVLl6ji}\n}", 
"github": "", "project": "", "reviewers": "DPfm;HZyv;537a;87dC", "site": "https://openreview.net/forum?id=80faVLl6ji", "pdf_size": 2891901, "rating": "6;6;6;6", "confidence": "4;3;4;2", "soundness": "3;2;3;3", "contribution": "3;2;3;3", "presentation": "3;3;3;3", "wc_summary": "90;40;60;91", "wc_strengths": "190;31;47;84", "wc_weaknesses": "109;250;126;261", "wc_questions": "131;248;240;437", "wc_review": "520;569;473;873", "wc_reply_reviewers": "234;0;0;12", "wc_reply_authors": "1002;697;539;1362", "reply_reviewers": "2;0;0;1", "reply_authors": "3;1;1;3", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 3.25, 0.82915619758885 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 70.25, 21.45198126048035 ], "wc_strengths_avg": [ 88.0, 61.94755846681934 ], "wc_weaknesses_avg": [ 186.5, 69.37038272923107 ], "wc_questions_avg": [ 264.0, 110.05680351527569 ], "wc_review_avg": [ 608.75, 156.29519346416254 ], "wc_reply_reviewers_avg": [ 61.5, 99.71333912772153 ], "wc_reply_authors_avg": [ 900.0, 314.39545162104366 ], "reply_reviewers_avg": [ 0.75, 0.82915619758885 ], "reply_authors_avg": [ 2.0, 1.0 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 10, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=7699111375450909101&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 8, "aff_unique_index": "0;0;1;0;2;0", "aff_unique_norm": "Shanghai Jiao Tong University;International Digital Economy Academy;Stanford University", "aff_unique_dep": ";;", "aff_unique_url": "https://www.sjtu.edu.cn;;https://www.stanford.edu", "aff_unique_abbr": "SJTU;;Stanford", "aff_campus_unique_index": "1", "aff_campus_unique": ";Stanford", "aff_country_unique_index": "0;0;0;2;0", "aff_country_unique": "China;;United States" }, { "title": "Dynamic Neighborhood Construction for Structured Large Discrete Action Spaces", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19342", "id": "80wh3jjCZf", "author_site": "Fabian Akkerman, Julius Luy, Wouter van Heeswijk, Maximilian Schiffer", "tldr": "", "abstract": "Large discrete action spaces (LDAS) remain a central challenge in reinforcement learning. Existing solution approaches can handle unstructured LDAS with up to a few million actions. However, many real-world applications in logistics, production, and transportation systems have combinatorial action spaces, whose size grows well beyond millions of actions, even on small instances. Fortunately, such action spaces exhibit structure, e.g., equally spaced discrete resource units. With this work, we focus on handling structured LDAS (SLDAS) with sizes that cannot be handled by current benchmarks: we propose Dynamic Neighborhood Construction (DNC), a novel exploitation paradigm for SLDAS. We present a scalable neighborhood exploration heuristic that utilizes this paradigm and efficiently explores the discrete neighborhood around the continuous proxy action in structured action spaces with up to $10^{73}$ actions. We demonstrate the performance of our method by benchmarking it against three state-of-the-art approaches designed for large discrete action spaces across three distinct environments. Our results show that DNC matches or outperforms state-of-the-art approaches while being computationally more efficient. 
Furthermore, our method scales to action spaces that so far remained computationally intractable for existing methodologies.", "keywords": "Structured large discrete action space;Reinforcement learning;Neighborhood search", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/cd6e8b1d6539421502f8244cda3ae5e0b205e9b4.zip", "author": "Fabian Akkerman;Julius Luy;Wouter van Heeswijk;Maximilian Schiffer", "authorids": "~Fabian_Akkerman1;~Julius_Luy1;~Wouter_van_Heeswijk1;~Maximilian_Schiffer1", "gender": ";M;;M", "homepage": ";https://www.ot.mgt.tum.de/osm/team/alumni/julius-luy/;;https://www.professors.wi.tum.de/osm/team/maximilian-schiffer/", "dblp": ";;;198/6733", "google_scholar": ";BvEGvqoAAAAJ;;umGuS18AAAAJ", "orcid": ";;;0000-0003-2682-4975", "linkedin": ";julius-luy-b66a47a9/?originalSubdomain=de;;", "or_profile": "~Fabian_Akkerman1;~Julius_Luy1;~Wouter_van_Heeswijk1;~Maximilian_Schiffer1", "aff": ";Technische Universit\u00e4t M\u00fcnchen;;Technische Universit\u00e4t M\u00fcnchen", "aff_domain": ";tum.de;;tum.de", "position": ";PhD student;;Associate Professor", "bibtex": "@inproceedings{\nakkerman2024dynamic,\ntitle={Dynamic Neighborhood Construction for Structured Large Discrete Action Spaces},\nauthor={Fabian Akkerman and Julius Luy and Wouter van Heeswijk and Maximilian Schiffer},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=80wh3jjCZf}\n}", "github": "", "project": "", "reviewers": "x32f;kH6M;ZSBT", "pdf_size": 1651736, "rating": "6;8;8", "confidence": "2;2;4", "soundness": "3;3;3", "contribution": "3;3;3", "presentation": "3;4;3", "wc_summary": "98;52;142", "wc_strengths": "18;120;35", "wc_weaknesses": "224;76;211", "wc_questions": "2;25;148", "wc_review": "342;273;536", "wc_reply_reviewers": "72;29;29", "wc_reply_authors": "437;630;840", "reply_reviewers": "1;1;1", "reply_authors": "2;2;2", "rating_avg": [ 7.333333333333333, 0.9428090415820634 ], "confidence_avg": [ 2.6666666666666665, 0.9428090415820634 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 3.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 97.33333333333333, 36.745370078721784 ], "wc_strengths_avg": [ 57.666666666666664, 44.61937795273359 ], "wc_weaknesses_avg": [ 170.33333333333334, 66.91453919407617 ], "wc_questions_avg": [ 58.333333333333336, 64.09541498595841 ], "wc_review_avg": [ 383.6666666666667, 111.33832324147073 ], "wc_reply_reviewers_avg": [ 43.333333333333336, 20.270394394014364 ], "wc_reply_authors_avg": [ 635.6666666666666, 164.57284776724933 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 2.0, 0.0 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.5, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=8412935024885307152&as_sdt=400005&sciodt=0,14&hl=en", "gs_version_total": 7, "openreview": "https://openreview.net/forum?id=80wh3jjCZf", "pdf": "https://openreview.net/pdf?id=80wh3jjCZf", "email": ";tum.de;;tum.de", "author_num": 4, "aff_unique_index": "0;0", "aff_unique_norm": "Technische Universit\u00e4t M\u00fcnchen", "aff_unique_dep": "", "aff_unique_url": "https://www.tum.de", "aff_unique_abbr": "TUM", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "Germany" }, { "id": "816T4ab9Z5", "title": "Perfect Alignment May be Poisonous to Graph Contrastive Learning", "track": "main", "status": "Reject", 
"tldr": "", "abstract": "Graph Contrastive Learning (GCL) aims to learn node representations by aligning positive pairs and separating negative ones. However, limited research has been conducted on the inner law behind specific augmentations used in graph-based learning. What kind of augmentation will help downstream performance, how does contrastive learning actually influence downstream tasks, and why the magnitude of augmentation matters? This paper seeks to address these questions by establishing a connection between augmentation and downstream performance, as well as by investigating the generalization of contrastive learning. Our findings reveal that GCL contributes to downstream tasks mainly by separating different classes rather than gathering nodes of the same class. So perfect alignment and augmentation overlap which draw all intra-class samples the same can not explain the success of contrastive learning. Then in order to comprehend how augmentation aids the contrastive learning process, we conduct further investigations into its generalization, finding that perfect alignment that draw positive pair the same could help contrastive loss but is poisonous to generalization, on the contrary, imperfect alignment enhances the model's generalization ability. We analyse the result by information theory and graph spectrum theory respectively, and propose two simple but effective methods to verify the theories. The two methods could be easily applied to various GCL algorithms and extensive experiments are conducted to prove its effectiveness.", "keywords": "Graph Contrastive Learning;Alignment;Generalization", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/986cca6c5db8e20d8b0822ae1d37dbf799c743e2.zip", "author": "Jingyu Liu;Yong Liu", "authorids": "~Jingyu_Liu4;~Yong_Liu7", "gender": "M;M", "homepage": "https://github.com/somebodyhh1;https://iie-liuyong.github.io", "dblp": ";29/4867-18", "google_scholar": ";vVhmzbAAAAAJ", "orcid": ";0000-0002-6739-621X", "linkedin": ";", "or_profile": "~Jingyu_Liu4;~Yong_Liu7", "aff": "Renmin University of China;Renmin University of China", "aff_domain": "ruc.edu.cn;ruc.edu.cn", "position": "PhD student;Associate Professor", "bibtex": "@misc{\nliu2024perfect,\ntitle={Perfect Alignment May be Poisonous to Graph Contrastive Learning},\nauthor={Jingyu Liu and Yong Liu},\nyear={2024},\nurl={https://openreview.net/forum?id=816T4ab9Z5}\n}", "github": "", "project": "", "reviewers": "vy1b;yxaQ;J3pe;KFkN;yszY", "site": "https://openreview.net/forum?id=816T4ab9Z5", "pdf_size": 2808574, "rating": "3;6;6;6;8", "confidence": "5;3;3;4;4", "soundness": "2;3;3;3;3", "contribution": "2;3;3;2;3", "presentation": "3;3;2;2;3", "wc_summary": "50;200;110;55;122", "wc_strengths": "30;62;124;25;115", "wc_weaknesses": "459;77;223;284;102", "wc_questions": "4;4;6;290;15", "wc_review": "543;343;463;654;354", "wc_reply_reviewers": "25;0;11;273;0", "wc_reply_authors": "1833;399;703;2599;491", "reply_reviewers": "1;0;1;1;0", "reply_authors": "4;1;2;4;1", "rating_avg": [ 5.8, 1.6 ], "confidence_avg": [ 3.8, 0.7483314773547882 ], "soundness_avg": [ 2.8, 0.39999999999999997 ], "contribution_avg": [ 2.6, 0.4898979485566356 ], "presentation_avg": [ 2.6, 0.4898979485566356 ], "wc_summary_avg": [ 107.4, 54.47054249775744 ], "wc_strengths_avg": [ 71.2, 41.52782199923324 ], "wc_weaknesses_avg": [ 229.0, 137.9811581340003 ], "wc_questions_avg": [ 63.8, 113.17314169006708 ], "wc_review_avg": [ 
471.4, 117.31086906165174 ], "wc_reply_reviewers_avg": [ 61.8, 105.99886791848297 ], "wc_reply_authors_avg": [ 1205.0, 865.916393192784 ], "reply_reviewers_avg": [ 0.6, 0.48989794855663565 ], "reply_authors_avg": [ 2.4, 1.3564659966250538 ], "replies_avg": [ 23, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.5345224838248488, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12307682829642070275&as_sdt=8005&sciodt=0,7&hl=en", "gs_version_total": 7, "aff_unique_index": "0;0", "aff_unique_norm": "Renmin University of China", "aff_unique_dep": "", "aff_unique_url": "http://www.ruc.edu.cn", "aff_unique_abbr": "RUC", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "China" }, { "id": "82A2EfMu3e", "title": "Efficient Discrete Physics-informed Neural Networks for Solving Evolutionary Partial Differential Equations", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Physics-informed neural networks (PINNs) have shown promising potential for solving partial differential equations (PDEs) using deep learning. \nHowever, PINNs face training difficulties for evolutionary PDEs, particularly for dynamical systems whose solutions exhibit multi-scale or turbulent behavior over time.\nThe reason is that PINNs may violate the temporal causality property since all the temporal features in the PINNs loss are trained simultaneously. \nThis paper proposes to use implicit time differencing schemes to enforce temporal causality, and use transfer learning to sequentially update the PINNs in space as surrogates for PDE solutions in different time frames.\nThe evolving PINNs are better able to capture the varying complexities of the evolutionary equations, while only requiring minor updates between adjacent time frames.\nOur method is theoretically proven to be convergent if the time step is small and each PINN in different time frames is well-trained.\nIn addition, we provide state-of-the-art (SOTA) numerical results for a variety of benchmarks for which existing PINNs formulations may fail or be inefficient.\nWe demonstrate that the proposed method improves the accuracy of PINNs approximation for evolutionary PDEs and improves efficiency by a factor of 4\u201340x.\nAll code and data can be found in the supplemental materials.", "keywords": "Neural networks;Partial differential equation;Physics-informed machine learning", "primary_area": "applications to physical sciences (physics, chemistry, biology, etc.)", "supplementary_material": "/attachment/611bc55af46ccbe60fc9a6c1c0c47ac0aebb8283.zip", "author": "Ye Li;Siqi Chen;Bin Shan", "authorids": "~Ye_Li6;~Siqi_Chen5;~Bin_Shan2", "gender": "M;M;M", "homepage": ";https://github.com/kjzxcsq;", "dblp": ";;", "google_scholar": "https://scholar.google.com/citations?hl=zh-CN;;", "orcid": "0000-0003-3986-129X;0009-0003-0174-989X;0009-0003-1177-4597", "linkedin": ";;", "or_profile": "~Ye_Li6;~Siqi_Chen5;~Bin_Shan2", "aff": "Nanjing University of Aeronautics and Astronautics;Nanjing University of Aeronautics and Astronautics;Nanjing University of Aeronautics and Astronautics", "aff_domain": "nuaa.edu.cn;nuaa.edu.cn;nuaa.edu.cn", "position": "Assistant Professor;Undergrad student;MS student", "bibtex": "@misc{\nli2024efficient,\ntitle={Efficient Discrete Physics-informed Neural Networks for Solving Evolutionary Partial Differential Equations},\nauthor={Ye Li and Siqi Chen and Bin Shan},\nyear={2024},\nurl={https://openreview.net/forum?id=82A2EfMu3e}\n}", 
"github": "", "project": "", "reviewers": "HW8p;XCvN;rdRW;sf3Z", "site": "https://openreview.net/forum?id=82A2EfMu3e", "pdf_size": 2938444, "rating": "3;3;5;5", "confidence": "5;5;5;3", "soundness": "2;1;3;3", "contribution": "1;1;2;3", "presentation": "1;2;3;3", "wc_summary": "144;94;148;94", "wc_strengths": "44;45;99;53", "wc_weaknesses": "673;440;303;159", "wc_questions": "166;201;298;47", "wc_review": "1027;780;848;353", "wc_reply_reviewers": "245;0;0;12", "wc_reply_authors": "257;500;529;179", "reply_reviewers": "1;0;0;1", "reply_authors": "1;1;1;1", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 4.5, 0.8660254037844386 ], "soundness_avg": [ 2.25, 0.82915619758885 ], "contribution_avg": [ 1.75, 0.82915619758885 ], "presentation_avg": [ 2.25, 0.82915619758885 ], "wc_summary_avg": [ 120.0, 26.038433132583073 ], "wc_strengths_avg": [ 60.25, 22.64260364887395 ], "wc_weaknesses_avg": [ 393.75, 189.3823843444791 ], "wc_questions_avg": [ 178.0, 89.76914837515169 ], "wc_review_avg": [ 752.0, 247.3994745346077 ], "wc_reply_reviewers_avg": [ 64.25, 104.4709887959332 ], "wc_reply_authors_avg": [ 366.25, 151.14128324187274 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 10, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:YFYSz6HeFZQJ:scholar.google.com/&scioq=Efficient+Discrete+Physics-informed+Neural+Networks+for+Solving+Evolutionary+Partial+Differential+Equations&hl=en&as_sdt=0,21", "gs_version_total": 0, "aff_unique_index": "0;0;0", "aff_unique_norm": "Nanjing University of Aeronautics and Astronautics", "aff_unique_dep": "", "aff_unique_url": "http://www.nuaa.edu.cn", "aff_unique_abbr": "NUAA", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "China" }, { "title": "FreeDyG: Frequency Enhanced Continuous-Time Dynamic Graph Model for Link Prediction", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19341", "id": "82Mc5ilInM", "author_site": "Yuxing Tian, Yiyan Qi, Fan Guo", "tldr": "", "abstract": "Link prediction is a crucial task in dynamic graph learning. Recent advancements in continuous-time dynamic graph models, primarily by leveraging richer temporal details, have significantly improved link prediction performance. However, due to their complex modules, they still face several challenges, such as overfitting and optimization difficulties. More importantly, it is challenging for these methods to capture the 'shift' phenomenon, where node interaction patterns change over time. To address these issues, we propose a simple yet novel method called \\textbf{Fre}quency \\textbf{E}nhanced Continuous-Time \\textbf{Dy}namic \\textbf{G}raph ({\\bf FreeDyG}) model for link prediction. Specifically, we propose a node interaction frequency encoding module that both explicitly captures the proportion of common neighbors and the frequency of the interaction of the node pair. Unlike previous works that primarily focus on the time domain, we delve into the frequency domain, allowing a deeper and more nuanced extraction of interaction patterns, revealing periodic and \"shift\" behaviors. Extensive experiments conducted on seven real-world continuous-time dynamic graph datasets validate the effectiveness of FreeDyG. The results consistently demonstrate that FreeDyG outperforms existing methods in both transductive and inductive settings. 
Our code is available at this repository: \\href{https://github.com/Tianxzzz/FreeDyG}{https://github.com/Tianxzzz/FreeDyG}", "keywords": "Dynamic graph; fourier transform; link prediction", "primary_area": "learning on graphs and other geometries & topologies", "supplementary_material": "", "author": "Yuxing Tian;Yiyan Qi;Fan Guo", "authorids": "~Yuxing_Tian1;~Yiyan_Qi1;~Fan_Guo3", "gender": "M;;", "homepage": ";;https://jsjxy.jxnu.edu.cn/2012/0923/c3381a106151/page.htm", "dblp": "02/6504.html;209/8128;", "google_scholar": "hZGWZnQAAAAJ;ZG9GqnMAAAAJ;", "orcid": ";0000-0002-8078-5834;", "linkedin": ";;", "or_profile": "~Yuxing_Tian1;~Yiyan_Qi1;~Fan_Guo3", "aff": "International Digital Economy Academy;IDEA;Jiangxi Normal University", "aff_domain": "idea.edu.cn;idea.edu.cn;jxnu.edu.cn", "position": "Intern;Researcher;Associate Professor", "bibtex": "@inproceedings{\ntian2024freedyg,\ntitle={FreeDyG: Frequency Enhanced Continuous-Time Dynamic Graph Model for Link Prediction},\nauthor={Yuxing Tian and Yiyan Qi and Fan Guo},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=82Mc5ilInM}\n}", "github": "", "project": "", "reviewers": "VgR1;Gxoa;VGzm;Wgp4", "pdf_size": 908866, "rating": "5;6;8;8", "confidence": "3;5;3;3", "soundness": "3;3;3;3", "contribution": "2;2;3;3", "presentation": "3;4;3;3", "wc_summary": "67;56;65;125", "wc_strengths": "53;60;80;111", "wc_weaknesses": "326;170;126;151", "wc_questions": "276;63;65;44", "wc_review": "722;349;336;431", "wc_reply_reviewers": "0;27;8;0", "wc_reply_authors": "1123;1235;1033;554", "reply_reviewers": "0;1;1;0", "reply_authors": "2;3;3;1", "rating_avg": [ 6.75, 1.299038105676658 ], "confidence_avg": [ 3.5, 0.8660254037844386 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 78.25, 27.307279249313726 ], "wc_strengths_avg": [ 76.0, 22.5055548698538 ], "wc_weaknesses_avg": [ 193.25, 78.21564741149945 ], "wc_questions_avg": [ 112.0, 95.03946548671242 ], "wc_review_avg": [ 459.5, 155.86933630448294 ], "wc_reply_reviewers_avg": [ 8.75, 11.031205736455105 ], "wc_reply_authors_avg": [ 986.25, 259.61642378709405 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 2.25, 0.82915619758885 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.3333333333333333, "gs_citation": 22, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=7223783100460016618&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 2, "openreview": "https://openreview.net/forum?id=82Mc5ilInM", "pdf": "https://openreview.net/pdf?id=82Mc5ilInM", "email": "idea.edu.cn;idea.edu.cn;jxnu.edu.cn", "author_num": 3, "aff_unique_index": "0;1;2", "aff_unique_norm": "International Digital Economy Academy;Institute of Electrical and Electronics Engineers;Jiangxi Normal University", "aff_unique_dep": ";;", "aff_unique_url": ";https://www.ieee.org;http://www.jxnu.edu.cn", "aff_unique_abbr": ";IEEE;JXNU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "1;2", "aff_country_unique": ";United States;China" }, { "id": "83w0LPowHz", "title": "On Reconstructability of Graph Neural Networks", "track": "main", "status": "Reject", "tldr": "", "abstract": "Recently, the expressive power of GNNs has been analyzed based on their ability to determine if two given graphs are isomorphic using the WL-test. 
However, previous analyses only establish the expressiveness of GNNs for graph-level tasks from a global perspective. In this paper, we analyze the expressive power of GNNs in terms of Graph Reconstructability, which aims to examine whether the topological information of graphs can be recovered from a local (node-level) perspective. We answer this question by analyzing how the output node embeddings extracted from GNNs may maintain important information for reconstructing the input graph structure. Moreover, we generalize GNNs in the form of Graph Reconstructable Neural Network (GRNN) and explore Nearly Orthogonal Random Features (NORF) to retain graph reconstructability. Experimental results demonstrate that GRNN outperforms representative baselines in reconstructability and efficiency.", "keywords": "Graph Neural Network;Reconstructability", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/fa435ca30046d40fb88c9d805787039b2b370491.pdf", "author": "Hsi-Wen Chen;De-Nian Yang;Hong-Han Shuai;Wang-Chien Lee;Ming-Syan Chen", "authorids": "~Hsi-Wen_Chen1;~De-Nian_Yang1;~Hong-Han_Shuai1;~Wang-Chien_Lee1;~Ming-Syan_Chen2", "gender": "Not Specified;M;M;M;M", "homepage": ";https://homepage.iis.sinica.edu.tw/pages/dnyang/index_en.html;http://basiclab.lab.nycu.edu.tw/;http://www.cse.psu.edu/~wul2/;https://arbor.ee.ntu.edu.tw/~mschen", "dblp": "39/9713.html;85/318;86/10294;14/716;c/MingSyanChen", "google_scholar": "https://scholar.google.com.tw/citations?user=ZupA27cAAAAJ;;https://scholar.google.com.tw/citations?user=MSWL2noAAAAJ;https://scholar.google.com.tw/citations?user=9OdHL5wAAAAJ;KTmCrFkAAAAJ", "orcid": ";0000-0002-3765-9293;0000-0003-2216-077X;0000-0002-8949-489X;0000-0002-0711-8197", "linkedin": "hsi-wen-chen-674395134;;;;", "or_profile": "~Hsi-Wen_Chen1;~De-Nian_Yang1;~Hong-Han_Shuai1;~Wang-Chien_Lee1;~Ming-Syan_Chen2", "aff": "National Taiwan University;Academia Sinica;National Yang Ming Chiao Tung University;Pennsylvania State University;National Taiwan University", "aff_domain": "ntu.edu.tw;iis.sinica.edu.tw;nycu.edu.tw;psu.edu;ntu.edu", "position": "PhD student;Professor;Associate Professor;Associate Professor;Full Professor", "bibtex": "@misc{\nchen2024on,\ntitle={On Reconstructability of Graph Neural Networks},\nauthor={Hsi-Wen Chen and De-Nian Yang and Hong-Han Shuai and Wang-Chien Lee and Ming-Syan Chen},\nyear={2024},\nurl={https://openreview.net/forum?id=83w0LPowHz}\n}", "github": "", "project": "", "reviewers": "zmY8;9f9r;M2Jy;RshA", "site": "https://openreview.net/forum?id=83w0LPowHz", "pdf_size": 511522, "rating": "3;3;5;5", "confidence": "4;3;3;3", "soundness": "1;2;2;2", "contribution": "2;1;3;2", "presentation": "2;3;1;2", "wc_summary": "71;71;156;74", "wc_strengths": "53;78;59;48", "wc_weaknesses": "379;333;451;122", "wc_questions": "246;83;150;65", "wc_review": "749;565;816;309", "wc_reply_reviewers": "45;97;39;11", "wc_reply_authors": "1146;534;972;636", "reply_reviewers": "1;1;1;1", "reply_authors": "2;1;2;1", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 1.75, 0.4330127018922193 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 2.0, 0.7071067811865476 ], "wc_summary_avg": [ 93.0, 36.39368077015569 ], "wc_strengths_avg": [ 59.5, 11.368817000902073 ], "wc_weaknesses_avg": [ 321.25, 122.4834172449479 ], "wc_questions_avg": [ 136.0, 70.9683027837076 ], "wc_review_avg": [ 609.75, 196.45785171379637 ], 
"wc_reply_reviewers_avg": [ 48.0, 31.064449134018133 ], "wc_reply_authors_avg": [ 822.0, 247.49545450371406 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:QDNzCenuQhQJ:scholar.google.com/&scioq=On+Reconstructability+of+Graph+Neural+Networks&hl=en&as_sdt=0,11", "gs_version_total": 0, "aff_unique_index": "0;1;2;3;0", "aff_unique_norm": "National Taiwan University;Academia Sinica;National Yang Ming Chiao Tung University;Pennsylvania State University", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.ntu.edu.tw;https://www.sinica.edu.tw;https://www.nycu.edu.tw;https://www.psu.edu", "aff_unique_abbr": "NTU;Academia Sinica;NYCU;PSU", "aff_campus_unique_index": "0;0;0;0", "aff_campus_unique": "Taiwan;", "aff_country_unique_index": "0;0;0;1;0", "aff_country_unique": "China;United States" }, { "id": "84Hk01tFKq", "title": "HyperFields: Towards Zero-Shot Generation of NeRFs from Text", "track": "main", "status": "Reject", "tldr": "", "abstract": "We introduce HyperFields, a method for generating text-conditioned NeRFs with a single forward pass and (optionally) some finetuning. Key to our approach are: (i) a dynamic hypernetwork, which learns a smooth mapping from text token embeddings to the space of Neural Radiance Fields (NeRFs); (ii) NeRF distillation training, which distills scenes encoded in individual NeRFs into one dynamic hypernetwork. These techniques enable a single network to fit over a hundred unique scenes. We further demonstrate that HyperFields learns a more general map between text and NeRFs, and consequently is capable of predicting novel in-distribution and out-of-distribution scenes --- either zero-shot or with a few finetuning steps. Finetuning HyperFields benefits from accelerated convergence thanks to the learned general map, and is capable of synthesizing novel scenes 5 to 10 times faster than existing neural optimization-based methods. 
Our ablation experiments show that both the dynamic architecture and NeRF distillation are critical to the expressivity of HyperFields.", "keywords": "HyperNetworks;generative modelling", "primary_area": "generative models", "supplementary_material": "", "author": "Sudarshan Babu;Richard Liu;Avery Zhou;Michael Maire;Greg Shakhnarovich;Rana Hanocka", "authorids": "~Sudarshan_Babu1;~Richard_Liu1;~Avery_Zhou1;~Michael_Maire1;~Greg_Shakhnarovich1;~Rana_Hanocka1", "gender": "M;M;M;M;;M", "homepage": "https://people.cs.uchicago.edu/~sudarshan/;https://factoryofthesun.github.io/;https://www.linkedin.com/in/azhou/;http://people.cs.uchicago.edu/~mmaire/;https://people.cs.uchicago.edu/~ranahanocka/;http://ttic.edu/gregory/", "dblp": "164/6304;44/5359;;73/1498.html;167/2260;17/1926.html", "google_scholar": ";;;HXowq5YAAAAJ;3Bk5C9EAAAAJ;https://scholar.google.com.tw/citations?user=YLOz1kgAAAAJ", "orcid": ";;;;0000-0003-3214-3703;", "linkedin": ";;;;;", "or_profile": "~Sudarshan_Babu1;~Richard_Liu1;~Avery_Zhou1;~Michael_Maire1;~Rana_Hanocka1;~Gregory_Shakhnarovich2", "aff": "Toyota Technological Institute at Chicago;University of Chicago;;University of Chicago;University of Chicago;University of Chicago", "aff_domain": "ttic.edu;cs.uchicago.edu;;uchicago.edu;uchicago.edu;uchicago.edu", "position": "PhD student;PhD student;;Associate Professor;Assistant Professor;Professor, part time", "bibtex": "@misc{\nbabu2024hyperfields,\ntitle={HyperFields: Towards Zero-Shot Generation of Ne{RF}s from Text},\nauthor={Sudarshan Babu and Richard Liu and Avery Zhou and Michael Maire and Greg Shakhnarovich and Rana Hanocka},\nyear={2024},\nurl={https://openreview.net/forum?id=84Hk01tFKq}\n}", "github": "", "project": "", "reviewers": "VyWD;6JFZ;YDm2;ckby", "site": "https://openreview.net/forum?id=84Hk01tFKq", "pdf_size": 6003306, "rating": "5;5;5;8", "confidence": "5;4;4;4", "soundness": "3;3;3;4", "contribution": "3;2;2;4", "presentation": "2;3;3;3", "wc_summary": "92;98;64;104", "wc_strengths": "51;57;33;140", "wc_weaknesses": "162;125;164;99", "wc_questions": "107;82;21;18", "wc_review": "412;362;282;361", "wc_reply_reviewers": "100;0;0;0", "wc_reply_authors": "377;494;128;492", "reply_reviewers": "1;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 5.75, 1.299038105676658 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.82915619758885 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 89.5, 15.321553446044563 ], "wc_strengths_avg": [ 70.25, 41.227266462864115 ], "wc_weaknesses_avg": [ 137.5, 27.115493725912497 ], "wc_questions_avg": [ 57.0, 38.54218468120353 ], "wc_review_avg": [ 354.25, 46.53157530107916 ], "wc_reply_reviewers_avg": [ 25.0, 43.30127018922193 ], "wc_reply_authors_avg": [ 372.75, 149.03250484374206 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.3333333333333333, "gs_citation": 10, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11413657046320631001&as_sdt=5,40&sciodt=0,40&hl=en", "gs_version_total": 9, "aff_unique_index": "0;1;1;1;1", "aff_unique_norm": "Toyota Technological Institute at Chicago;University of Chicago", "aff_unique_dep": ";", "aff_unique_url": "https://www.tti-chicago.org;https://www.uchicago.edu", "aff_unique_abbr": "TTI Chicago;UChicago", "aff_campus_unique_index": "0", "aff_campus_unique": "Chicago;", "aff_country_unique_index": "0;0;0;0;0", 
"aff_country_unique": "United States" }, { "id": "84fOBZlOiV", "title": "Estimating uncertainty from feed-forward network based sensing using quasilinear approximation", "track": "main", "status": "Reject", "tldr": "", "abstract": "Artificial neural networks are increasingly integrated into both sensing hardware (e.g., \"smart sensors\") and dedicated decision-making circuits that operate on this information. As this technology is deployed in safety-critical environments (pedestrian-detection, power management, and flight-controls) it is critical to assess the real-time confidence of information built on these networks. However, while stand-alone confidence of sensing (e.g. object detection) neural networks are common, tools are much more limited for integrating such information into formal estimation of latent variables upstream of the sensor. To make this distinction clear, consider the common problem of target-tracking from a mobile camera. The geographic position of the target is a function of the camera position and orientation in addition to position within the image, whereas the neural network only reports confidence in pixel-space. Likewise, optimally leveraging an image-sequence requires consideration of uncertainty in the camera and target dynamics, as well as the sensing neural network. As we will demonstrate, fusing dynamical system models with large sensing networks presents a major computational challenge. Specifically, popular approaches such as first-order (Jacobian) linearization prove inaccurate, whereas nonlinear sampling-based approaches, while effective, are intractable for high-dimensional measurements such as images. In this work, we borrow an analytic approach from control engineering, quasilinear system approximation, to propagate the dynamics of environmental uncertainty through feedforward neural network architectures. The approximation enables direct Bayesian (i.e., Kalman-style) filtering to estimate latent variables, thus obviating the need for taxing sampling-based approaches. Thus, the proposed framework may enable real-time confidence estimation in high-dimensional network-based sensing deployments.", "keywords": "Uncertainty propagation;quasilinear approximation;stochastic linearization;neural networks;Kalman filter.", "primary_area": "probabilistic methods (Bayesian methods, variational inference, sampling, UQ, etc.)", "supplementary_material": "/attachment/6116d624dba3dc0f924acb132a34ce744df6b47f.pdf", "author": "Songhan Zhang;Matthew Singh;ShiNung Ching", "authorids": "~Songhan_Zhang1;~Matthew_Singh1;~ShiNung_Ching1", "gender": "M;;", "homepage": "https://www.linkedin.com/in/songhan-zhang-7a58338b/;https://sites.wustl.edu/ccplab/people/matthew-singh/;http://braindynamics.engineering.wustl.edu", "dblp": ";;13/9188", "google_scholar": ";;z_vUo8EAAAAJ", "orcid": ";;", "linkedin": ";;", "or_profile": "~Songhan_Zhang1;~Matthew_Singh1;~ShiNung_Ching1", "aff": "Washington University, St. Louis;Washington University, St. Louis;Washington University, St. 
Louis", "aff_domain": "wustl.edu;wustl.edu;wustl.edu", "position": "PhD student;Postdoc;Associate Professor", "bibtex": "@misc{\nzhang2024estimating,\ntitle={Estimating uncertainty from feed-forward network based sensing using quasilinear approximation},\nauthor={Songhan Zhang and Matthew Singh and ShiNung Ching},\nyear={2024},\nurl={https://openreview.net/forum?id=84fOBZlOiV}\n}", "github": "", "project": "", "reviewers": "vnNG;Woe1;Lszd;gBbv", "site": "https://openreview.net/forum?id=84fOBZlOiV", "pdf_size": 1331208, "rating": "3;3;5;5", "confidence": "4;4;4;3", "soundness": "2;3;2;3", "contribution": "1;1;2;2", "presentation": "2;3;2;2", "wc_summary": "33;75;82;132", "wc_strengths": "9;17;49;173", "wc_weaknesses": "104;194;27;325", "wc_questions": "3;49;12;5", "wc_review": "149;335;170;635", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 1.5, 0.5 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 80.5, 35.14612354157995 ], "wc_strengths_avg": [ 62.0, 65.81033353509159 ], "wc_weaknesses_avg": [ 162.5, 110.88394834239986 ], "wc_questions_avg": [ 17.25, 18.632968094214082 ], "wc_review_avg": [ 322.25, 194.40341432186833 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 6, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:wRkjZyULNGEJ:scholar.google.com/&scioq=Estimating+uncertainty+from+feed-forward+network+based+sensing+using+quasilinear+approximation&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;0", "aff_unique_norm": "Washington University in St. Louis", "aff_unique_dep": "", "aff_unique_url": "https://wustl.edu", "aff_unique_abbr": "WUSTL", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "St. Louis", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "title": "Detecting, Explaining, and Mitigating Memorization in Diffusion Models", "status": "Oral", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19340", "id": "84n3UwkH7b", "author_site": "Yuxin Wen, Yuchen Liu, Chen Chen, Lingjuan Lyu", "tldr": "", "abstract": "Recent breakthroughs in diffusion models have exhibited exceptional image-generation capabilities. However, studies show that some outputs are merely replications of training data. Such replications present potential legal challenges for model owners, especially when the generated content contains proprietary information. In this work, we introduce a straightforward yet effective method for detecting memorized prompts by inspecting the magnitude of text-conditional predictions. Our proposed method seamlessly integrates without disrupting sampling algorithms, and delivers high accuracy even at the first generation step, with a single generation per prompt. Building on our detection strategy, we unveil an explainable approach that shows the contribution of individual words or tokens to memorization. This offers an interactive medium for users to adjust their prompts. Moreover, we propose two strategies i.e., to mitigate memorization by leveraging the magnitude of text-conditional predictions, either through minimization during inference or filtering during training. 
These proposed strategies effectively counteract memorization while maintaining high-generation quality. Code is available at https://github.com/YuxinWenRick/diffusion_memorization.", "keywords": "Diffusion Model;Memorization", "primary_area": "generative models", "supplementary_material": "/attachment/5a7cc8c3e384ae4896dc9e7840e66453f612bdb4.zip", "author": "Yuxin Wen;Yuchen Liu;Chen Chen;Lingjuan Lyu", "authorids": "~Yuxin_Wen2;~Yuchen_Liu8;~Chen_Chen20;~Lingjuan_Lyu1", "gender": ";;M;F", "homepage": "https://yuxinwenrick.github.io/;;https://cc233.github.io/;https://sites.google.com/view/lingjuan-lyu", "dblp": ";;65/4423-43;178/9876", "google_scholar": "oUYfjg0AAAAJ;;;", "orcid": ";0000-0002-3629-128X;0000-0001-7359-8515;", "linkedin": ";;;", "or_profile": "~Yuxin_Wen2;~Yuchen_Liu8;~Chen_Chen20;~Lingjuan_Lyu1", "aff": "University of Maryland, College Park;Zhejiang University;Sony AI;Sony", "aff_domain": "umd.edu;zju.edu.cn;sony.com;sony.com", "position": "PhD student;PhD student;Researcher;scientist", "bibtex": "@inproceedings{\nwen2024detecting,\ntitle={Detecting, Explaining, and Mitigating Memorization in Diffusion Models},\nauthor={Yuxin Wen and Yuchen Liu and Chen Chen and Lingjuan Lyu},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=84n3UwkH7b}\n}", "github": "", "project": "", "reviewers": "hCP2;VQfz;Mwfj;5xmi", "pdf_size": 44556169, "rating": "8;8;8;8", "confidence": "2;3;4;4", "soundness": "2;3;4;4", "contribution": "3;3;4;4", "presentation": "3;3;4;3", "wc_summary": "204;322;81;133", "wc_strengths": "225;61;56;177", "wc_weaknesses": "271;2;59;276", "wc_questions": "82;116;33;2", "wc_review": "782;501;229;588", "wc_reply_reviewers": "21;0;0;0", "wc_reply_authors": "879;234;436;636", "reply_reviewers": "1;0;0;0", "reply_authors": "2;1;1;1", "rating_avg": [ 8.0, 0.0 ], "confidence_avg": [ 3.25, 0.82915619758885 ], "soundness_avg": [ 3.25, 0.82915619758885 ], "contribution_avg": [ 3.5, 0.5 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 185.0, 90.34655499796325 ], "wc_strengths_avg": [ 129.75, 73.26450368357108 ], "wc_weaknesses_avg": [ 152.0, 123.1726430665511 ], "wc_questions_avg": [ 58.25, 43.87695864574025 ], "wc_review_avg": [ 525.0, 198.87810336987832 ], "wc_reply_reviewers_avg": [ 5.25, 9.093266739736606 ], "wc_reply_authors_avg": [ 546.25, 238.97319410343914 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 55, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5536743981762017609&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=84n3UwkH7b", "pdf": "https://openreview.net/pdf?id=84n3UwkH7b", "email": "umd.edu;zju.edu.cn;sony.com;sony.com", "author_num": 4, "aff_unique_index": "0;1;2;3", "aff_unique_norm": "University of Maryland;Zhejiang University;Sony;Sony Corporation", "aff_unique_dep": ";;Sony AI;", "aff_unique_url": "https://www/umd.edu;https://www.zju.edu.cn;https://www.sony.com;https://www.sony.com", "aff_unique_abbr": "UMD;ZJU;Sony AI;Sony", "aff_campus_unique_index": "0", "aff_campus_unique": "College Park;", "aff_country_unique_index": "0;1;2;2", "aff_country_unique": "United States;China;Japan" }, { "id": "85Af6AcMo5", "title": "SciRE-Solver: Accelerating Diffusion Models Sampling by Score-integrand Solver with Recursive Difference", "track": 
"main", "status": "Reject", "tldr": "", "abstract": "One downside of Diffusion models (DMs) is their slow iterative process. Recent algorithms for fast sampling are designed from the \ndifferential equations. However, in the fast algorithms, estimating the derivative of the score function evaluations becomes intractable due to the complexity of large-scale, well-trained neural networks. In this work, we introduce the recursive difference method to calculate the derivative of the score function networks. Building upon, we propose \\emph{SciRE-Solver} with the convergence order guarantee for accelerating DMs sampling. Our proposed sampling algorithms attain SOTA FIDs in comparison to existing training-free sampling algorithms, \nunder various number of score function evaluations (NFE). Such as, we achieve $3.48$ FID with $12$ NFE, and $2.42$ FID with $20$ NFE for continuous-time model on CIFAR-10; $1.79$ FID with $20$ NFE and $1.76$ FID with $100$ NFE for the pretrained model of EDM. Experiments demonstrate also that demonstrate that SciRE-Solver with multi-step methods can achieve high-quality samples on popular text-to-image generation tasks with only 6$\\sim$20 NFEs.", "keywords": "Diffusion Models;Sampler;Accelerating", "primary_area": "generative models", "supplementary_material": "/attachment/66d650a108b6c2b1946203983df892e7a90ac5de.zip", "author": "Shigui Li;Wei Chen;Delu Zeng", "authorids": "~Shigui_Li2;~Wei_Chen52;~Delu_Zeng4", "gender": "M;M;M", "homepage": ";;", "dblp": "236/7957;;38/5665", "google_scholar": "Fm039ikAAAAJ;https://scholar.google.com.hk/citations?user=r5fgeWQAAAAJ;08RCdoIAAAAJ", "orcid": "0000-0003-2606-3600;0009-0002-2880-3078;", "linkedin": ";;", "or_profile": "~Shigui_Li2;~Wei_Chen52;~Delu_zeng1", "aff": "South China University of Technology;South China University of Technology;South China University of Technology", "aff_domain": "scut.edu.cn;scut.edu.cn;scut.edu.cn", "position": "PhD student;PhD student;Full Professor", "bibtex": "@misc{\nli2024sciresolver,\ntitle={Sci{RE}-Solver: Accelerating Diffusion Models Sampling by Score-integrand Solver with Recursive Difference},\nauthor={Shigui Li and Wei Chen and Delu Zeng},\nyear={2024},\nurl={https://openreview.net/forum?id=85Af6AcMo5}\n}", "github": "", "project": "", "reviewers": "zqdo;MTm2;eocv;gjHa", "site": "https://openreview.net/forum?id=85Af6AcMo5", "pdf_size": 41322172, "rating": "5;6;6;6", "confidence": "4;4;4;2", "soundness": "3;3;3;2", "contribution": "2;3;3;3", "presentation": "1;3;3;2", "wc_summary": "29;53;59;90", "wc_strengths": "29;23;47;69", "wc_weaknesses": "200;12;132;131", "wc_questions": "2;36;34;308", "wc_review": "260;124;272;598", "wc_reply_reviewers": "47;0;0;64", "wc_reply_authors": "748;375;432;853", "reply_reviewers": "1;0;0;1", "reply_authors": "2;1;1;3", "rating_avg": [ 5.75, 0.4330127018922193 ], "confidence_avg": [ 3.5, 0.8660254037844386 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 2.25, 0.82915619758885 ], "wc_summary_avg": [ 57.75, 21.741377601246892 ], "wc_strengths_avg": [ 42.0, 17.916472867168917 ], "wc_weaknesses_avg": [ 118.75, 67.68077644353676 ], "wc_questions_avg": [ 95.0, 123.71337841963576 ], "wc_review_avg": [ 313.5, 174.23762509859918 ], "wc_reply_reviewers_avg": [ 27.75, 28.39344114403888 ], "wc_reply_authors_avg": [ 602.0, 202.9445737141055 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.75, 0.82915619758885 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 3, 0 ], 
"corr_rating_confidence": -0.3333333333333333, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=791203681200403792&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "aff_unique_index": "0;0;0", "aff_unique_norm": "South China University of Technology", "aff_unique_dep": "", "aff_unique_url": "https://www.scut.edu.cn", "aff_unique_abbr": "SCUT", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "China" }, { "id": "85gNpcUhmx", "title": "Context-Aware Unsupervised Domain Adaptive Lane Detection", "track": "main", "status": "Reject", "tldr": "", "abstract": "This paper focuses on two crucial issues in domain-adaptive lane detection, i.e., how to effectively learn discriminative features and transfer knowledge across domains. Existing lane detection methods usually exploit a pixel-wise cross-entropy loss to train detection models. However, the loss ignores the difference in feature representation among lanes, which leads to inefficient feature learning. On the other hand, cross-domain context dependency crucial for transferring knowledge across domains remains unexplored in existing lane detection methods. This paper proposes a Context-aware Unsupervised Domain-Adaptive Lane Detection (CUDALD) method, consisting of two key components, i.e., cross-domain contrastive loss and domain-level feature aggregation, to realize domain-adaptive lane detection. The former can effectively differentiate feature representations among categories by taking domain-level features as positive samples. The latter fuses the domain-level and pixel-level features to strengthen cross-domain context dependency. Extensive experiments show that CUDALD significantly improves the detection model\u2019s performance and outperforms existing unsupervised domain adaptive lane detection methods on datasets, TuLane, MuLane, and MoLane, especially achieving the best accuracy of 92.24\\% when using RTFormer on TuLane.", "keywords": "Unsupervised domain adaptive;Lane detection;Cross-domain contrastive loss;Domain-level feature aggregation", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Kunyang Zhou;Yunjian Feng;Jun Li", "authorids": "~Kunyang_Zhou1;~Yunjian_Feng2;~Jun_Li40", "gender": ";M;", "homepage": ";https://blog.csdn.net/qq_36104364?type=blog;", "dblp": ";;", "google_scholar": ";;", "orcid": ";;0000-0002-5272-9130", "linkedin": ";;", "or_profile": "~Kunyang_Zhou1;~Yunjian_Feng2;~Jun_Li40", "aff": ";Southeast University;Southeast University", "aff_domain": ";seu.edu.cn;seu.edu.cn", "position": ";PhD student;Full Professor", "bibtex": "@misc{\nzhou2024contextaware,\ntitle={Context-Aware Unsupervised Domain Adaptive Lane Detection},\nauthor={Kunyang Zhou and Yunjian Feng and Jun Li},\nyear={2024},\nurl={https://openreview.net/forum?id=85gNpcUhmx}\n}", "github": "", "project": "", "reviewers": "1nVJ;YuT7;cVkk;ZmgM", "site": "https://openreview.net/forum?id=85gNpcUhmx", "pdf_size": 2809368, "rating": "3;3;5;6", "confidence": "4;4;4;4", "soundness": "3;3;3;3", "contribution": "2;2;2;3", "presentation": "3;2;3;3", "wc_summary": "78;47;82;86", "wc_strengths": "98;30;36;56", "wc_weaknesses": "93;215;118;278", "wc_questions": "4;3;22;32", "wc_review": "273;295;258;452", "wc_reply_reviewers": "0;0;0;210", "wc_reply_authors": "309;540;451;775", "reply_reviewers": "0;0;0;1", "reply_authors": "1;1;1;2", "rating_avg": [ 4.25, 1.299038105676658 
], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 73.25, 15.417117110536587 ], "wc_strengths_avg": [ 55.0, 26.627053911388696 ], "wc_weaknesses_avg": [ 176.0, 74.46139939592862 ], "wc_questions_avg": [ 15.25, 12.275483697190918 ], "wc_review_avg": [ 319.5, 77.62248385616117 ], "wc_reply_reviewers_avg": [ 52.5, 90.93266739736606 ], "wc_reply_authors_avg": [ 518.75, 169.3374958477891 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:D54Hn5mETXoJ:scholar.google.com/&scioq=Context-Aware+Unsupervised+Domain+Adaptive+Lane+Detection&hl=en&as_sdt=0,10", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "Southeast University", "aff_unique_dep": "", "aff_unique_url": "https://www.seu.edu.cn/", "aff_unique_abbr": "SEU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "China" }, { "title": "CompA: Addressing the Gap in Compositional Reasoning in Audio-Language Models", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19339", "id": "86NGO8qeWs", "author_site": "Sreyan Ghosh, Ashish Seth, Sonal Kumar, Utkarsh Tyagi, Chandra Kiran Evuru, Ramaneswaran S, S Sakshi, Oriol Nieto, Ramani Duraiswami, Dinesh Manocha", "tldr": "", "abstract": "A fundamental characteristic of audio is its compositional nature. Audio-language models (ALMs) trained using a contrastive approach (e.g., CLAP) that learns a shared representation between audio and language modalities have improved performance in many downstream applications, including zero-shot audio classification, audio retrieval, etc. However, the ability of these models to effectively perform compositional reasoning remains largely unexplored and necessitates additional research. In this paper, we propose CompA, a collection of two expert-annotated benchmarks with a majority of real-world audio samples, to evaluate compositional reasoning in ALMs. Our proposed CompA-order evaluates how well an ALM understands the order or occurrence of acoustic events in audio, and CompA-attribute evaluates attribute-binding of acoustic events. An instance from either benchmark consists of two audio-caption pairs, where both audios have the same acoustic events but with different compositions. An ALM is evaluated on how well it matches the right audio to the right caption. Using this benchmark, we first show that current ALMs perform only marginally better than random chance, thereby struggling with compositional reasoning. Next, we propose CompA-CLAP, where we fine-tune CLAP using a novel learning method to improve its compositional reasoning abilities. To train CompA-CLAP, we first propose improvements to contrastive training with composition-aware hard negatives, allowing for more focused training. Next, we propose a novel modular contrastive loss that helps the model learn fine-grained compositional understanding and overcomes the acute scarcity of openly available compositional audios. 
CompA-CLAP significantly improves over all our baseline models on the CompA benchmark, indicating its superior compositional reasoning capabilities.", "keywords": "audio;audio-language;compositional reasoning", "primary_area": "datasets and benchmarks", "supplementary_material": "/attachment/8a89ee1502f56c41795ace8c403fa62fedc8d16c.zip", "author": "Sreyan Ghosh;Ashish Seth;Sonal Kumar;Utkarsh Tyagi;Chandra Kiran Reddy Evuru;Ramaneswaran S;S Sakshi;Oriol Nieto;Ramani Duraiswami;Dinesh Manocha", "authorids": "~Sreyan_Ghosh1;~Ashish_Seth1;~Sonal_Kumar1;~Utkarsh_Tyagi1;~Chandra_Kiran_Reddy_Evuru1;~Ramaneswaran_S1;~S_Sakshi1;~Oriol_Nieto1;~Ramani_Duraiswami1;~Dinesh_Manocha3", "gender": "M;M;M;M;M;M;F;M;M;M", "homepage": "https://sreyan88.github.io/;https://cs20s030.github.io/;https://sonalkum.github.io;https://utkarsh4430.github.io;;;https://sakshi113.github.io/;https://www.urinieto.com/;http://www.umiacs.umd.edu/~ramani/;https://www.cs.umd.edu/people/dmanocha", "dblp": "173/5626;36/10405;;286/2046;355/1221;;;120/3843.html;d/RamaniDuraiswami;m/DineshManocha", "google_scholar": "5HKZJHAAAAAJ;aBn1e34AAAAJ;jiJ2DcEAAAAJ;https://scholar.google.co.in/citations?user=RLjKaTwAAAAJ;;YIhHxbwAAAAJ;F_-YNVAAAAAJ;7CyUUcMAAAAJ;GNEcpkAAAAAJ;X08l_4IAAAAJ", "orcid": ";0000-0003-3100-9342;;;;;;;0000-0002-5596-8460;0000-0001-7047-9801", "linkedin": ";;realsonalkumar/;utkarsh4430/;ckevuru/;;sakshi113/;urinieto;ramani-duraiswami-32a50b1/;dinesh-manocha-2311846", "or_profile": "~Sreyan_Ghosh1;~Ashish_Seth1;~Sonal_Kumar1;~Utkarsh_Tyagi1;~Chandra_Kiran_Reddy_Evuru1;~Ramaneswaran_S1;~S_Sakshi1;~Oriol_Nieto1;~Ramani_Duraiswami1;~Dinesh_Manocha3", "aff": "University of Maryland, College Park;University of Maryland, College Park;University of Maryland, College Park;University of Maryland, College Park;University of Maryland, College Park;NVIDIA;University of Maryland, College Park;Adobe Systems;University of Maryland, College Park;University of Maryland, College Park", "aff_domain": "umd.edu;umd.edu;umd.edu;umd.edu;umd.edu;nvidia.com;umd.edu;adobe.com;umd.edu;umd.edu", "position": "PhD student;PhD student;PhD student;MS student;MS student;Researcher;PhD student;Researcher;Full Professor;Professor", "bibtex": "@inproceedings{\nghosh2024compa,\ntitle={CompA: Addressing the Gap in Compositional Reasoning in Audio-Language Models},\nauthor={Sreyan Ghosh and Ashish Seth and Sonal Kumar and Utkarsh Tyagi and Chandra Kiran Reddy Evuru and Ramaneswaran S and S Sakshi and Oriol Nieto and Ramani Duraiswami and Dinesh Manocha},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=86NGO8qeWs}\n}", "github": "", "project": "", "reviewers": "Cw3v;Xast;x6Uk;jJm8", "pdf_size": 3917096, "rating": "6;6;6;8", "confidence": "4;4;4;4", "soundness": "3;3;3;4", "contribution": "3;3;2;4", "presentation": "3;3;2;3", "wc_summary": "41;106;128;190", "wc_strengths": "63;1483;57;32", "wc_weaknesses": "181;2;91;73", "wc_questions": "129;2;130;50", "wc_review": "414;1593;406;345", "wc_reply_reviewers": "22;994;115;0", "wc_reply_authors": "1244;6047;1739;348", "reply_reviewers": "1;3;2;0", "reply_authors": "5;11;9;1", "rating_avg": [ 6.5, 0.8660254037844386 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 3.0, 0.7071067811865476 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 116.25, 53.25586822125802 ], "wc_strengths_avg": [ 408.75, 620.3274840759516 ], "wc_weaknesses_avg": [ 86.75, 
63.782344735827955 ], "wc_questions_avg": [ 77.75, 54.46271660503174 ], "wc_review_avg": [ 689.5, 522.3181501728616 ], "wc_reply_reviewers_avg": [ 282.75, 412.90275792249196 ], "wc_reply_authors_avg": [ 2344.5, 2195.0084851772212 ], "reply_reviewers_avg": [ 1.5, 1.118033988749895 ], "reply_authors_avg": [ 6.5, 3.840572873934304 ], "replies_avg": [ 39, 0 ], "authors#_avg": [ 10, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 12, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5900022586925230025&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=86NGO8qeWs", "pdf": "https://openreview.net/pdf?id=86NGO8qeWs", "email": "umd.edu;umd.edu;umd.edu;umd.edu;umd.edu;nvidia.com;umd.edu;adobe.com;umd.edu;umd.edu", "author_num": 10, "aff_unique_index": "0;0;0;0;0;1;0;2;0;0", "aff_unique_norm": "University of Maryland;NVIDIA;Adobe", "aff_unique_dep": ";NVIDIA Corporation;Adobe Systems Incorporated", "aff_unique_url": "https://www/umd.edu;https://www.nvidia.com;https://www.adobe.com", "aff_unique_abbr": "UMD;NVIDIA;Adobe", "aff_campus_unique_index": "0;0;0;0;0;0;0;0", "aff_campus_unique": "College Park;", "aff_country_unique_index": "0;0;0;0;0;0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "86w3LbTNI1", "title": "Preventing Reward Hacking with Occupancy Measure Regularization", "track": "main", "status": "Reject", "tldr": "", "abstract": "Reward hacking occurs when an agent performs very well with respect to a specified or learned reward function (often called a \"proxy\"), but poorly with respect to the true desired reward function. Since ensuring good alignment between the proxy and the true reward is remarkably difficult, prior work has proposed regularizing to a \"safe\" policy using the KL divergence between action distributions. The challenge with this divergence measure is that a small change in action distribution at a single state can lead to potentially calamitous outcomes. Our insight is that when this happens, the state occupancy measure of the policy shifts significantly\u2014the agent spends time in drastically different states than the safe policy does. We thus propose regularizing based on occupancy measure (OM) rather than action distribution. We show theoretically that there is a direct relationship between the returns of two policies under *any* reward function and their OM divergence, whereas no such relationship holds for their action distribution divergence. 
We then empirically find that OM regularization more effectively prevents reward hacking while allowing for performance improvement on top of the safe policy.", "keywords": "reward hacking;safety;occupancy measures;reinforcement learning", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Cassidy Laidlaw;Shivam Singhal;Anca Dragan", "authorids": "~Cassidy_Laidlaw1;~Shivam_Singhal1;~Anca_Dragan1", "gender": "M;M;F", "homepage": "https://cassidylaidlaw.com;;http://www.ancadragan.com/", "dblp": "241/5375;;", "google_scholar": "DzeJ67UAAAAJ;;", "orcid": ";;", "linkedin": ";shivam-singhal5601/;", "or_profile": "~Cassidy_Laidlaw1;~Shivam_Singhal1;~Anca_Dragan1", "aff": "University of California, Berkeley;University of California, Berkeley;University of California, Berkeley", "aff_domain": "berkeley.edu;berkeley.edu;berkeley.edu", "position": "PhD student;MS student;Associate Professor", "bibtex": "@misc{\nlaidlaw2024preventing,\ntitle={Preventing Reward Hacking with Occupancy Measure Regularization},\nauthor={Cassidy Laidlaw and Shivam Singhal and Anca Dragan},\nyear={2024},\nurl={https://openreview.net/forum?id=86w3LbTNI1}\n}", "github": "", "project": "", "reviewers": "jdVB;y14X;rjUA;Jr8S;M4hZ", "site": "https://openreview.net/forum?id=86w3LbTNI1", "pdf_size": 495818, "rating": "3;5;5;6;6", "confidence": "4;4;2;4;4", "soundness": "2;2;3;3;3", "contribution": "2;1;2;2;2", "presentation": "2;3;3;4;3", "wc_summary": "73;138;186;214;163", "wc_strengths": "22;59;110;218;129", "wc_weaknesses": "145;140;177;172;299", "wc_questions": "188;55;37;171;85", "wc_review": "428;392;510;775;676", "wc_reply_reviewers": "0;0;0;16;196", "wc_reply_authors": "911;723;1049;1126;934", "reply_reviewers": "0;0;0;1;1", "reply_authors": "2;1;2;2;2", "rating_avg": [ 5.0, 1.0954451150103321 ], "confidence_avg": [ 3.6, 0.8 ], "soundness_avg": [ 2.6, 0.4898979485566356 ], "contribution_avg": [ 1.8, 0.4000000000000001 ], "presentation_avg": [ 3.0, 0.6324555320336759 ], "wc_summary_avg": [ 154.8, 47.997499934892446 ], "wc_strengths_avg": [ 107.6, 66.84489509304356 ], "wc_weaknesses_avg": [ 186.6, 58.03654021390317 ], "wc_questions_avg": [ 107.2, 61.22875141630768 ], "wc_review_avg": [ 556.2, 146.80381466433357 ], "wc_reply_reviewers_avg": [ 42.4, 77.04959441814084 ], "wc_reply_authors_avg": [ 948.6, 137.16646820560774 ], "reply_reviewers_avg": [ 0.4, 0.48989794855663565 ], "reply_authors_avg": [ 1.8, 0.4000000000000001 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 15, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=7760325786457688938&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 3, "aff_unique_index": "0;0;0", "aff_unique_norm": "University of California, Berkeley", "aff_unique_dep": "", "aff_unique_url": "https://www.berkeley.edu", "aff_unique_abbr": "UC Berkeley", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Berkeley", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "title": "CPPO: Continual Learning for Reinforcement Learning with Human Feedback", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19338", "id": "86zAUE80pP", "author_site": "Han Zhang, Yu Lei, Lin Gui, Min Yang, Yulan He, HUI WANG, Ruifeng Xu", "tldr": "", "abstract": "The approach of Reinforcement Learning from Human Feedback (RLHF) is widely used for enhancing pre-trained Language Models (LM), enabling them to better align with human preferences. 
Existing RLHF-based LMs however require complete retraining whenever new queries or feedback are introduced, as human preferences may differ across different domains or topics. LM retraining is often impracticable in most real-world scenarios, due to the substantial time and computational costs involved, as well as data privacy concerns. To address this limitation, we propose Continual Proximal Policy Optimization (CPPO), a novel method that is able to continually align LM with dynamic human preferences. Specifically, CPPO adopts a weighting strategy to decide which samples should be utilized for enhancing policy learning and which should be used for solidifying past experiences. This seeks a good trade-off between policy learning and knowledge retention. Our experimental results show that CPPO outperforms strong Continuous learning (CL) baselines when it comes to consistently aligning with human preferences. Furthermore, compared to PPO, CPPO offers more efficient and stable learning in non-continual scenarios.", "keywords": "lifelong learning;reinforcement learning;human feedback;proximal policy optimization", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "/attachment/e53518d4f66f4c373da1c927bbf41ce523a3e4b9.zip", "author": "Han Zhang;Yu Lei;Lin Gui;Min Yang;Yulan He;Hui Wang;Ruifeng Xu", "authorids": "~Han_Zhang3;~Yu_Lei5;~Lin_Gui3;~Min_Yang6;~Yulan_He1;~Hui_Wang13;~Ruifeng_Xu1", "gender": "M;M;F;F;M;M;M", "homepage": ";;https://minyang.me/;https://www.kcl.ac.uk/people/yulan-he;https://openi.pcl.ac.cn;http://faculty.hitsz.edu.cn/xuruifeng;", "dblp": "26/4189-25;34/8605-3;02/1640-7;75/5430;39/721-73;93/5407-1;284/8639-4", "google_scholar": "lhdgPb8AAAAJ;https://scholar.google.com.ph/citations?user=1b3Eyx4AAAAJ;_wop6KgAAAAJ;https://scholar.google.co.uk/citations?user=SP9r32UAAAAJ;;mObXnNIAAAAJ;nHlrzV0AAAAJ", "orcid": "0000-0001-5660-6237;;;0000-0003-3948-5845;;0000-0002-4009-5679;0000-0001-8482-3140", "linkedin": ";;;yulan-he-277234a/?originalSubdomain=uk;;;", "or_profile": "~Han_Zhang3;~Lin_Gui3;~Min_Yang6;~Yulan_He1;~Hui_Wang13;~Ruifeng_Xu1;~Yu_Lei4", "aff": "Harbin Institute of Technology;King's College London, University of London;Shenzhen Institutes of Advanced Technology, Chinese Academy of Sciences, Chinese Academy of Sciences;King's College London, University of London;Cloud Computing;Harbin Institute of Technology;Peng Cheng Laboratory, Shenzhen, China", "aff_domain": "hit.edu.cn;kcl.ac.uk;siat.ac.cn;kcl.ac.uk;pcl.ac.cn;hit.edu.cn;pcl.ac.cn", "position": "PhD student;Lecturer;Associate Professor;Full Professor;Full Professor;Full Professor;Researcher", "bibtex": "@inproceedings{\nzhang2024cppo,\ntitle={{CPPO}: Continual Learning for Reinforcement Learning with Human Feedback},\nauthor={Han Zhang and Yu Lei and Lin Gui and Min Yang and Yulan He and Hui Wang and Ruifeng Xu},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=86zAUE80pP}\n}", "github": "", "project": "", "reviewers": "Loz4;CUAu;qeM7;za1s", "pdf_size": 2705011, "rating": "5;6;6;8", "confidence": "4;4;2;2", "soundness": "2;3;2;4", "contribution": "2;3;2;3", "presentation": "2;2;3;4", "wc_summary": "159;61;158;127", "wc_strengths": "156;58;50;47", "wc_weaknesses": "612;327;163;90", "wc_questions": "212;2;23;1", "wc_review": "1139;448;394;265", "wc_reply_reviewers": "0;16;13;244", "wc_reply_authors": "1763;1081;347;590", "reply_reviewers": "0;1;1;2", "reply_authors": 
"5;3;2;2", "rating_avg": [ 6.25, 1.0897247358851685 ], "confidence_avg": [ 3.0, 1.0 ], "soundness_avg": [ 2.75, 0.82915619758885 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.75, 0.82915619758885 ], "wc_summary_avg": [ 126.25, 39.808133591013785 ], "wc_strengths_avg": [ 77.75, 45.35622889967816 ], "wc_weaknesses_avg": [ 298.0, 200.5779150355293 ], "wc_questions_avg": [ 59.5, 88.48304922413107 ], "wc_review_avg": [ 561.5, 339.9841908089257 ], "wc_reply_reviewers_avg": [ 68.25, 101.64736838698776 ], "wc_reply_authors_avg": [ 945.25, 541.1212317956116 ], "reply_reviewers_avg": [ 1.0, 0.7071067811865476 ], "reply_authors_avg": [ 3.0, 1.224744871391589 ], "replies_avg": [ 31, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.6882472016116854, "gs_citation": 17, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10293528444348719373&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=86zAUE80pP", "pdf": "https://openreview.net/pdf?id=86zAUE80pP", "email": "hit.edu.cn;kcl.ac.uk;siat.ac.cn;kcl.ac.uk;pcl.ac.cn;hit.edu.cn;pcl.ac.cn", "author_num": 7, "aff_unique_index": "0;1;2;1;3;0;4", "aff_unique_norm": "Harbin Institute of Technology;King's College London;Chinese Academy of Sciences;Cloud Computing;Pengcheng Laboratory", "aff_unique_dep": ";;Shenzhen Institutes of Advanced Technology;;Peng Cheng Laboratory", "aff_unique_url": "http://www.hit.edu.cn/;https://www.kcl.ac.uk;http://www.cas.cn;;", "aff_unique_abbr": "HIT;KCL;CAS;;", "aff_campus_unique_index": "0;2;0;2", "aff_campus_unique": "Harbin;;Shenzhen", "aff_country_unique_index": "0;1;0;1;0;0", "aff_country_unique": "China;United Kingdom;" }, { "id": "87XbxDnPqj", "title": "Gradient Descent Provably Solves Nonlinear Tomographic Reconstruction", "track": "main", "status": "Reject", "tldr": "", "abstract": "In computed tomography (CT), the forward model consists of a linear Radon transform followed by an exponential nonlinearity based on the attenuation of light according to the Beer\u2013Lambert Law. Conventional reconstruction often involves inverting this nonlinearity as a preprocessing step and then solving a convex inverse problem. However, this nonlinear measurement preprocessing required to use the Radon transform is poorly conditioned in the vicinity of high-density materials, such as metal. This preprocessing makes CT reconstruction methods numerically sensitive and susceptible to artifacts near high-density regions. In this paper, we study a technique where the signal is directly reconstructed from raw measurements through the nonlinear forward model. Though this optimization is nonconvex, we show that gradient descent provably converges to the global optimum at a geometric rate, perfectly reconstructing the underlying signal with a near minimal number of random measurements. We also prove similar results in the under-determined setting where the number of measurements is significantly smaller than the dimension of the signal. This is achieved by enforcing prior structural information about the signal through constraints on the optimization variables. We illustrate the benefits of direct nonlinear CT reconstruction with cone-beam CT experiments on synthetic and real 3D volumes. 
We show that this approach reduces metal artifacts compared to a commercial reconstruction of a human skull with metal dental crowns.", "keywords": "computed tomography;nonconvex optimization;compressive sensing", "primary_area": "optimization", "supplementary_material": "/attachment/8b984c2545ff3e41b798bb48357af00cb160610a.zip", "author": "Sara Fridovich-Keil;Fabrizio Valdivia;Gordon Wetzstein;Benjamin Recht;Mahdi Soltanolkotabi", "authorids": "~Sara_Fridovich-Keil1;fabriziovaldivia2001@gmail.com;~Gordon_Wetzstein3;~Benjamin_Recht1;~Mahdi_Soltanolkotabi1", "gender": "F;;M;M;M", "homepage": "https://sarafridov.github.io;;http://web.stanford.edu/~gordonwz/;http://www.eecs.berkeley.edu/~brecht/;http://www-bcf.usc.edu/~soltanol/", "dblp": "236/7023;;13/4660;r/BenRecht;75/6691", "google_scholar": "9xF7M6wAAAAJ;;VOf45S0AAAAJ;https://scholar.google.com.tw/citations?user=a_dbdxAAAAAJ;narJyMAAAAAJ", "orcid": ";;0000-0002-9243-6885;;", "linkedin": "sara-fridovich-keil-3aa744160/;;gordon-wetzstein-2406723/;;", "or_profile": "~Sara_Fridovich-Keil1;fabriziovaldivia2001@gmail.com;~Gordon_Wetzstein3;~Benjamin_Recht1;~Mahdi_Soltanolkotabi1", "aff": "Stanford University;;Stanford University;University of California, Berkeley;University of Southern California", "aff_domain": "stanford.edu;;stanford.edu;berkeley.edu;usc.edu", "position": "Postdoc;;Associate Professor;Full Professor;Associate Professor", "bibtex": "@misc{\nfridovich-keil2024gradient,\ntitle={Gradient Descent Provably Solves Nonlinear Tomographic Reconstruction},\nauthor={Sara Fridovich-Keil and Fabrizio Valdivia and Gordon Wetzstein and Benjamin Recht and Mahdi Soltanolkotabi},\nyear={2024},\nurl={https://openreview.net/forum?id=87XbxDnPqj}\n}", "github": "", "project": "", "reviewers": "MBT4;TLot;1R2J;qFK5", "site": "https://openreview.net/forum?id=87XbxDnPqj", "pdf_size": 609659, "rating": "3;5;6;8", "confidence": "2;4;4;1", "soundness": "2;2;3;2", "contribution": "2;2;3;2", "presentation": "2;4;3;2", "wc_summary": "49;158;54;12", "wc_strengths": "26;97;37;1", "wc_weaknesses": "66;149;70;1", "wc_questions": "32;224;86;1", "wc_review": "173;628;247;15", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "535;1151;564;12", "reply_reviewers": "0;0;0;0", "reply_authors": "2;3;2;1", "rating_avg": [ 5.5, 1.8027756377319946 ], "confidence_avg": [ 2.75, 1.299038105676658 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.82915619758885 ], "wc_summary_avg": [ 68.25, 54.29721447735602 ], "wc_strengths_avg": [ 40.25, 35.26595383652624 ], "wc_weaknesses_avg": [ 71.5, 52.461890930464946 ], "wc_questions_avg": [ 85.75, 85.41772357069696 ], "wc_review_avg": [ 265.75, 225.30798365792543 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 565.5, 403.1454452179759 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 2.0, 0.7071067811865476 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.2668802563418119, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=8804626619442851423&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 8, "aff_unique_index": "0;0;1;2", "aff_unique_norm": "Stanford University;University of California, Berkeley;University of Southern California", "aff_unique_dep": ";;", "aff_unique_url": "https://www.stanford.edu;https://www.berkeley.edu;https://www.usc.edu", "aff_unique_abbr": "Stanford;UC Berkeley;USC", "aff_campus_unique_index": "0;0;1;2", "aff_campus_unique": 
"Stanford;Berkeley;Los Angeles", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "id": "87YOFayjcG", "title": "JudgeLM : Fine-tuned Large Language Models are Scalable Judges", "track": "main", "status": "Reject", "tldr": "", "abstract": "Evaluating Large Language Models (LLMs) in open-ended scenarios is challenging due to existing benchmarks and metrics can not measure them comprehensively. To address this problem, we propose to fine-tune LLMs as scalable judges (JudgeLM) to evaluate LLMs efficiently and effectively in open-ended benchmarks. We first propose a comprehensive, large-scale, high-quality dataset containing task seeds, LLMs-generated answers, and GPT-4-generated judgments for fine-tuning high-performance judges, as well as a new benchmark for evaluating the judges. We train JudgeLM at different scales from 7B, 13B, to 33B parameters, and conduct a systematic analysis of its capabilities and behaviors. We then analyze the key biases in fine-tuning LLM as a judge and consider them as position bias, knowledge bias, and format bias. To address these issues, JudgeLM introduces a bag of techniques including swap augmentation, reference support, and reference drop, which clearly enhance the judge's performance. JudgeLM obtains the state-of-the-art judge performance on both the existing PandaLM benchmark and our proposed new benchmark. Our JudgeLM is efficient and the JudgeLM-7B only needs 3 mins to judge 5K samples with 8 A100 GPUs. JudgeLM obtains high agreement with the teacher judge, achieving an agreement exceeding 90% that even surpasses human-to-human agreement. JudgeLM also demonstrates extended capabilities in being judges of the single answer, multimodal models, multiple answers, and multi-turn chat.", "keywords": "Large Language Model;Evaluation of Open-ended Tasks;Scalable Judges;Judge Dataset", "primary_area": "generative models", "supplementary_material": "", "author": "Lianghui Zhu;Xinggang Wang;Xinlong Wang", "authorids": "~Lianghui_Zhu3;~Xinggang_Wang1;~Xinlong_Wang2", "gender": "M;M;M", "homepage": "https://xwcv.github.io/index.htm;;https://github.com/Unrealluver", "dblp": "95/3056;;", "google_scholar": "qNCTLV0AAAAJ;DPz0DjYAAAAJ;NvMHcs0AAAAJ", "orcid": "0000-0001-6732-7823;;", "linkedin": ";;", "or_profile": "~Xinggang_Wang1;~Xinlong_Wang2;~Lianghui_Zhu2", "aff": "Huazhong University of Science and Technology;Beijing Academy of Artificial Intelligence;Huazhong University of Science and Technology", "aff_domain": "hust.edu.cn;baai.ac.cn;hust.edu.cn", "position": "Full Professor;Researcher;PhD student", "bibtex": "@misc{\nzhu2024judgelm,\ntitle={Judge{LM} : Fine-tuned Large Language Models are Scalable Judges},\nauthor={Lianghui Zhu and Xinggang Wang and Xinlong Wang},\nyear={2024},\nurl={https://openreview.net/forum?id=87YOFayjcG}\n}", "github": "", "project": "", "reviewers": "CPpo;UdgT;rHPM;jzHn", "site": "https://openreview.net/forum?id=87YOFayjcG", "pdf_size": 2686654, "rating": "5;5;5;6", "confidence": "4;4;4;4", "soundness": "3;3;2;3", "contribution": "2;3;2;2", "presentation": "3;3;3;3", "wc_summary": "86;78;116;47", "wc_strengths": "80;46;74;100", "wc_weaknesses": "189;102;159;248", "wc_questions": "43;57;39;137", "wc_review": "398;283;388;532", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "679;655;597;1249", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;1;2", "rating_avg": [ 5.25, 0.4330127018922193 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.25, 
0.4330127018922193 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 81.75, 24.55987581401828 ], "wc_strengths_avg": [ 75.0, 19.313207915827967 ], "wc_weaknesses_avg": [ 174.5, 52.69962049199216 ], "wc_questions_avg": [ 69.0, 39.824615503479755 ], "wc_review_avg": [ 400.25, 88.40354913689835 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 795.0, 263.80674744971935 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 107, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=17023951720589094623&as_sdt=5,48&sciodt=0,48&hl=en", "gs_version_total": 4, "aff_unique_index": "0;1;0", "aff_unique_norm": "Huazhong University of Science and Technology;Beijing Academy of Artificial Intelligence", "aff_unique_dep": ";", "aff_unique_url": "http://www.hust.edu.cn;https://www.baaic.cn", "aff_unique_abbr": "HUST;BAAI", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "China" }, { "id": "87zTciMFHM", "title": "EXPLAIN, AGREE and LEARN: A Recipe for Scalable Neural-Symbolic Learning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Recent progress in neural-symbolic AI (NeSy) has demonstrated that neural networks can benefit greatly from an integration with symbolic reasoning methods in terms of interpretability, data-efficiency and generalisation performance. Unfortunately, the symbolic component can lead to intractable computations for more complicated domains. This computational bottleneck has prevented the successful application of NeSy to more practical problems. We present EXPLAIN, AGREE and LEARN, an alternative paradigm that addresses the scalability problem of probabilistic NeSy learning. EXPLAIN leverages sampling to obtain a representative set of possible explanations for the symbolic component driven by a newly introduced diversity criterion. Then AGREE assigns importance to the sampled explanations based on the neural predictions. This defines the learning objective, which for sufficiently many samples is guaranteed to coincide with the objective used by exact probabilistic NeSy approaches. Using this objective, LEARN updates the neural component with direct supervision on its outputs, without the need to propagate the gradient through the symbolic component. 
Our approximate paradigm and its theoretical guarantees are experimentally evaluated and shown to be competitive with existing exact probabilistic NeSy frameworks, while outperforming them in terms of speed.", "keywords": "neuro-symbolic learning;variational inference;sampling;discrete latent variable model", "primary_area": "neurosymbolic & hybrid AI systems (physics-informed, logic & formal reasoning, etc.)", "supplementary_material": "/attachment/7836706a1e46eb52fbc34bce7411947546e1b893.pdf", "author": "Victor Verreet;Lennert De Smet;Luc De Raedt;Emanuele Sansone", "authorids": "~Victor_Verreet1;~Lennert_De_Smet1;~Luc_De_Raedt1;~Emanuele_Sansone1", "gender": "M;M;M;", "homepage": ";;https://people.cs.kuleuven.be/~luc.deraedt/;", "dblp": "303/4998;342/2788;r/LucDeRaedt;", "google_scholar": ";;https://scholar.google.com.tw/citations?user=dgobB6AAAAAJ;", "orcid": "0000-0003-2595-7207;0000-0003-3136-0634;0000-0002-6860-6303;", "linkedin": ";;;", "or_profile": "~Victor_Verreet1;~Lennert_De_Smet1;~Luc_De_Raedt1;~Emanuele_Sansone1", "aff": "KU Leuven;KU Leuven;KU Leuven, Belgium;", "aff_domain": "kuleuven.be;kuleuven.be;cs.kuleuven.be;", "position": "PhD student;PhD student;Full Professor;", "bibtex": "@misc{\nverreet2024explain,\ntitle={{EXPLAIN}, {AGREE} and {LEARN}: A Recipe for Scalable Neural-Symbolic Learning},\nauthor={Victor Verreet and Lennert De Smet and Luc De Raedt and Emanuele Sansone},\nyear={2024},\nurl={https://openreview.net/forum?id=87zTciMFHM}\n}", "github": "", "project": "", "reviewers": "GwsC;WFyQ;Pp9a;fkWq", "site": "https://openreview.net/forum?id=87zTciMFHM", "pdf_size": 1213246, "rating": "3;3;5;5", "confidence": "4;4;2;4", "soundness": "2;2;3;2", "contribution": "2;2;2;3", "presentation": "2;2;2;2", "wc_summary": "74;63;62;31", "wc_strengths": "23;39;53;16", "wc_weaknesses": "155;124;473;542", "wc_questions": "32;344;31;2", "wc_review": "284;570;619;591", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 3.5, 0.8660254037844386 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.0, 0.0 ], "wc_summary_avg": [ 57.5, 16.00781059358212 ], "wc_strengths_avg": [ 32.75, 14.359230480774379 ], "wc_weaknesses_avg": [ 323.5, 185.93345583837245 ], "wc_questions_avg": [ 102.25, 140.09349556635382 ], "wc_review_avg": [ 516.0, 135.06850113923676 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:B48ZpoaYh58J:scholar.google.com/&scioq=EXPLAIN,+AGREE+and+LEARN:+A+Recipe+for+Scalable+Neural-Symbolic+Learning&hl=en&as_sdt=0,33", "gs_version_total": 3, "aff_unique_index": "0;0;1", "aff_unique_norm": "Katholieke Universiteit Leuven;KU Leuven", "aff_unique_dep": ";", "aff_unique_url": "https://www.kuleuven.be;https://www.kuleuven.be", "aff_unique_abbr": "KU Leuven;KU Leuven", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "Belgium" }, { "id": "88FcNOwNvM", "title": "Compositional Image Decomposition with Diffusion Models", "track": "main", "status": "Reject", "tldr": "", "abstract": "Given an image of a natural scene, we are able to quickly decompose it into a set of 
components such as objects, lighting, shadows, and foreground. We can then picture how the image would look if we were to recombine certain components with those from other images, for instance producing a scene with a set of objects from our bedroom and animals from a zoo under the lighting conditions of a forest even if we have never seen such a scene in real life before. We present a method to decompose an image into such compositional components. Our approach, Decomp Diffusion, is an unsupervised method which, when given a single image, infers a set of different components in the image, each represented by a diffusion model. We demonstrate how components can capture different factors of the scene, ranging from global scene descriptors (shadows, foreground, facial expression) to local scene descriptors (objects). We further illustrate how inferred factors can be flexibly composed, even with factors inferred from other models, to generate a variety of scenes sharply different than those seen in training time.", "keywords": "Image Decomposition;Compositional Decomposition", "primary_area": "generative models", "supplementary_material": "/attachment/a931bdad2b84cb88335b8450372e276f9f454278.pdf", "author": "Jocelin Su;Nan Liu;Joshua B. Tenenbaum;Yilun Du", "authorids": "~Jocelin_Su1;~Nan_Liu4;~Joshua_B._Tenenbaum1;~Yilun_Du1", "gender": ";;;", "homepage": ";;;https://yilundu.github.io", "dblp": ";;t/JoshuaBTenenbaum;204/4379", "google_scholar": ";;;", "orcid": ";;;", "linkedin": ";;;", "or_profile": "~Jocelin_Su1;~Nan_Liu4;~Joshua_B._Tenenbaum1;~Yilun_Du1", "aff": ";;Massachusetts Institute of Technology;Massachusetts Institute of Technology", "aff_domain": ";;mit.edu;mit.edu", "position": ";;Professor;PhD student", "bibtex": "@misc{\nsu2024compositional,\ntitle={Compositional Image Decomposition with Diffusion Models},\nauthor={Jocelin Su and Nan Liu and Joshua B. 
Tenenbaum and Yilun Du},\nyear={2024},\nurl={https://openreview.net/forum?id=88FcNOwNvM}\n}", "github": "", "project": "", "reviewers": "Rmft;t1av;W4iB", "site": "https://openreview.net/forum?id=88FcNOwNvM", "pdf_size": 2766866, "rating": "5;6;8", "confidence": "4;4;4", "soundness": "2;3;3", "contribution": "2;3;3", "presentation": "2;3;3", "wc_summary": "46;55;98", "wc_strengths": "28;57;79", "wc_weaknesses": "44;117;36", "wc_questions": "46;73;216", "wc_review": "164;302;429", "wc_reply_reviewers": "115;0;44", "wc_reply_authors": "731;831;399", "reply_reviewers": "3;0;1", "reply_authors": "5;1;1", "rating_avg": [ 6.333333333333333, 1.247219128924647 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 66.33333333333333, 22.69116323349001 ], "wc_strengths_avg": [ 54.666666666666664, 20.885933597094056 ], "wc_weaknesses_avg": [ 65.66666666666667, 36.444783196257625 ], "wc_questions_avg": [ 111.66666666666667, 74.59371436134697 ], "wc_review_avg": [ 298.3333333333333, 108.21686046494274 ], "wc_reply_reviewers_avg": [ 53.0, 47.37791327893902 ], "wc_reply_authors_avg": [ 653.6666666666666, 184.64620825303246 ], "reply_reviewers_avg": [ 1.3333333333333333, 1.247219128924647 ], "reply_authors_avg": [ 2.3333333333333335, 1.8856180831641267 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 6, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=16868049165076129421&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 7, "aff_unique_index": "0;0", "aff_unique_norm": "Massachusetts Institute of Technology", "aff_unique_dep": "", "aff_unique_url": "https://web.mit.edu", "aff_unique_abbr": "MIT", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "id": "88MalncLgU", "title": "GInX-Eval: Towards In-Distribution Evaluation of Graph Neural Networks Explanations", "track": "main", "status": "Reject", "tldr": "", "abstract": "Diverse explainability methods of graph neural networks (GNN) have recently been developed to highlight the edges and nodes in the graph that contribute the most to the model predictions. However, it is not clear yet how to evaluate the *correctness* of those explanations, whether it is from a human or a model perspective. One unaddressed bottleneck in the current evaluation procedure is the problem of out-of-distribution explanations, whose distribution differs from those of the training data. This important issue affects existing evaluation metrics such as the popular faithfulness or fidelity score. In this paper, we show the limitations of faithfulness metrics. We propose **GInX-Eval** (**G**raph **In**-distribution e**X**planation **Eval**uation), an evaluation procedure of graph explanations that overcomes the pitfalls of faithfulness and offers new insights on explainability methods. Using a retraining strategy, the GInX score measures how informative removed edges are for the model and the EdgeRank score evaluates if explanatory edges are correctly ordered by their importance. GInX-Eval verifies if ground-truth explanations are instructive to the GNN model. 
In addition, it shows that many popular methods, including gradient-based methods, produce explanations that are not better than a random designation of edges as important subgraphs, challenging the findings of current works in the area. Results with GInX-Eval are consistent across multiple datasets and align with human evaluation.", "keywords": "Evaluation;explainability;graph neural networks;out-of-distribution explanations;faithfulness", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/15109512a07d95ca40cf9dfe1c9457f196d56b2e.pdf", "author": "Kenza Amara;Mennatallah El-Assady;Zhitao Ying", "authorids": "~Kenza_Amara1;~Mennatallah_El-Assady1;~Zhitao_Ying1", "gender": "F;;M", "homepage": "https://ai.ethz.ch/people/kenza-amara.html;;https://www.cs.yale.edu/homes/ying-rex", "dblp": ";183/8957;209/4936", "google_scholar": "e4wlh1AAAAAJ;;6fqNXooAAAAJ", "orcid": "0000-0001-7139-5562;0000-0001-8526-2613;", "linkedin": "kenza-amara/;;rex-ying-92770148/", "or_profile": "~Kenza_Amara1;~Mennatallah_El-Assady1;~Zhitao_Ying1", "aff": "ETH AI Center;Department of Computer Science, ETHZ - ETH Zurich;Yale University", "aff_domain": "infk.ethz.ch;inf.ethz.ch;yale.edu", "position": "PhD student;Assistant Professor;Assistant Professor", "bibtex": "@misc{\namara2024ginxeval,\ntitle={{GI}nX-Eval: Towards In-Distribution Evaluation of Graph Neural Networks Explanations},\nauthor={Kenza Amara and Mennatallah El-Assady and Zhitao Ying},\nyear={2024},\nurl={https://openreview.net/forum?id=88MalncLgU}\n}", "github": "", "project": "", "reviewers": "EeHX;DCst;qa24", "site": "https://openreview.net/forum?id=88MalncLgU", "pdf_size": 766028, "rating": "5;6;6", "confidence": "4;4;3", "soundness": "2;3;3", "contribution": "2;2;3", "presentation": "2;4;3", "wc_summary": "94;69;145", "wc_strengths": "52;77;73", "wc_weaknesses": "215;241;152", "wc_questions": "2;494;23", "wc_review": "363;881;393", "wc_reply_reviewers": "36;0;49", "wc_reply_authors": "548;645;417", "reply_reviewers": "1;0;1", "reply_authors": "1;1;1", "rating_avg": [ 5.666666666666667, 0.4714045207910317 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 3.0, 0.816496580927726 ], "wc_summary_avg": [ 102.66666666666667, 31.626290048347787 ], "wc_strengths_avg": [ 67.33333333333333, 10.96458946893235 ], "wc_weaknesses_avg": [ 202.66666666666666, 37.36605708691007 ], "wc_questions_avg": [ 173.0, 227.1431266844762 ], "wc_review_avg": [ 545.6666666666666, 237.43256352535602 ], "wc_reply_reviewers_avg": [ 28.333333333333332, 20.725722075613085 ], "wc_reply_authors_avg": [ 536.6666666666666, 93.42495502927588 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.4999999999999999, "gs_citation": 7, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5722598543388739124&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 7, "aff_unique_index": "0;0;1", "aff_unique_norm": "ETH Zurich;Yale University", "aff_unique_dep": "AI Center;", "aff_unique_url": "https://www.ethz.ch;https://www.yale.edu", "aff_unique_abbr": "ETH;Yale", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Zurich;", "aff_country_unique_index": "0;0;1", "aff_country_unique": "Switzerland;United States" }, { "title": "Local Graph 
Clustering with Noisy Labels", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19337", "id": "89A5c6enfc", "author_site": "Artur Back de Luca, Kimon Fountoulakis, Shenghao Yang", "tldr": "", "abstract": "The growing interest in machine learning problems over graphs with additional node information such as texts, images, or labels has popularized methods that require the costly operation of processing the entire graph. Yet, little effort has been made to the development of fast local methods (i.e. without accessing the entire graph) that extract useful information from such data. To that end, we propose a study of local graph clustering using noisy node labels as a proxy for additional node information. In this setting, nodes receive initial binary labels based on cluster affiliation: 1 if they belong to the target cluster and 0 otherwise. Subsequently, a fraction of these labels is flipped. We investigate the benefits of incorporating noisy labels for local graph clustering. By constructing a weighted graph with such labels, we study the performance of graph diffusion-based local clustering method on both the original and the weighted graphs. From a theoretical perspective, we consider recovering an unknown target cluster with a single seed node in a random graph with independent noisy node labels. We provide sufficient conditions on the label noise under which, with high probability, using diffusion in the weighted graph yields a more accurate recovery of the target cluster. This approach proves more effective than using the given labels alone or using diffusion in the label-free original graph. Empirically, we show that reliable node labels can be obtained with just a few samples from an attributed graph. Moreover, utilizing these labels via diffusion in the weighted graph leads to significantly better local clustering performance across several real-world datasets, improving F1 scores by up to 13\\%.", "keywords": "local graph clustering;graph diffusion;attributed graphs;noisy labels", "primary_area": "learning on graphs and other geometries & topologies", "supplementary_material": "/attachment/074bb46f3424c6bb86d5032d9a3cbba9d3838e91.zip", "author": "Artur Back de Luca;Kimon Fountoulakis;Shenghao Yang", "authorids": "~Artur_Back_de_Luca1;~Kimon_Fountoulakis1;~Shenghao_Yang1", "gender": "M;M;M", "homepage": "https://artur-deluca.github.io/;https://opallab.ca;https://cs.uwaterloo.ca/~s286yang/", "dblp": ";149/5799;41/4482-2", "google_scholar": "tL9d0UoAAAAJ;https://scholar.google.ca/citations?user=K-SafJUAAAAJ;ocLDM-AAAAAJ", "orcid": ";;", "linkedin": "https://linkedin.com/in/arturbackdeluca;;", "or_profile": "~Artur_Back_de_Luca1;~Kimon_Fountoulakis1;~Shenghao_Yang1", "aff": "University of Waterloo;University of Waterloo;University of Waterloo", "aff_domain": "uwaterloo.ca;uwaterloo.ca;uwaterloo.ca", "position": "PhD student;Assistant Professor;PhD student", "bibtex": "@inproceedings{\nluca2024local,\ntitle={Local Graph Clustering with Noisy Labels},\nauthor={Artur Back de Luca and Kimon Fountoulakis and Shenghao Yang},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=89A5c6enfc}\n}", "github": "", "project": "", "reviewers": "LuBd;PWgh;oYEs;CYJN", "pdf_size": 764106, "rating": "3;6;6;8", "confidence": "4;2;3;3", "soundness": "2;3;3;3", "contribution": "2;2;3;3", "presentation": "2;3;3;4", "wc_summary": "38;95;59;91", "wc_strengths": "31;46;32;73", "wc_weaknesses": 
"201;98;46;67", "wc_questions": "2;269;125;209", "wc_review": "272;508;262;440", "wc_reply_reviewers": "0;11;11;24", "wc_reply_authors": "1588;1082;816;1404", "reply_reviewers": "0;1;1;1", "reply_authors": "4;4;2;3", "rating_avg": [ 5.75, 1.7853571071357126 ], "confidence_avg": [ 3.0, 0.7071067811865476 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 70.75, 23.498670175139697 ], "wc_strengths_avg": [ 45.5, 16.948451256678293 ], "wc_weaknesses_avg": [ 103.0, 59.5273046592906 ], "wc_questions_avg": [ 151.25, 100.20572588430264 ], "wc_review_avg": [ 370.5, 106.31439225241331 ], "wc_reply_reviewers_avg": [ 11.5, 8.5 ], "wc_reply_authors_avg": [ 1222.5, 296.4435022057323 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 3.25, 0.82915619758885 ], "replies_avg": [ 22, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.5940885257860046, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11045825304576235979&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=89A5c6enfc", "pdf": "https://openreview.net/pdf?id=89A5c6enfc", "email": "uwaterloo.ca;uwaterloo.ca;uwaterloo.ca", "author_num": 3, "aff_unique_index": "0;0;0", "aff_unique_norm": "University of Waterloo", "aff_unique_dep": "", "aff_unique_url": "https://uwaterloo.ca", "aff_unique_abbr": "UW", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "Canada" }, { "id": "89AOrk05uy", "title": "Understanding and addressing spurious correlation via Neural Tangent Kernels: A spectral bias perspective", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "The existence of spurious correlations can prompt neural networks to depend heavily on features that exhibit strong correlations with the target labels exclusively in the training set, while such correlations may not persist in real-world scenarios. As a consequence, this results in suboptimal performance within certain subgrouping of the data. In this work, we leverage the theoretical insights of the Neural Tangent Kernel (NTK) to investigate the group robustness problem in the presence of spurious correlations. Specifically, we identify that poor generalization is not solely a consequence of statistical biases inherent in the dataset; rather, it also arises from the disparity in complexity between spurious and core features. 
Building upon this observation, we propose a method that adjusts the spectral properties of neural networks to mitigate bias without requiring knowledge of the spurious attributes.", "keywords": "NTK;spurious correlation", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Yeat Jeng Ng;Ainhize Barrainkua;Novi Quadrianto", "authorids": "~Yeat_Jeng_Ng2;~Ainhize_Barrainkua1;~Novi_Quadrianto1", "gender": "M;F;M", "homepage": "https://profiles.sussex.ac.uk/p515010-yeat-jeng-ng;;http://www.sussex.ac.uk/profiles/335583", "dblp": ";333/2278;http://dblp.uni-trier.de/pers/hd/q/Quadrianto:Novi", "google_scholar": ";;I-rLzGcAAAAJ", "orcid": ";0000-0002-2300-312X;", "linkedin": ";ainhize-barrainkua-agirre-07a000151;", "or_profile": "~Yeat_Jeng_Ng2;~Ainhize_Barrainkua1;~Novi_Quadrianto1", "aff": "University of Sussex;Basque Center for Applied Mathematics;Monash Indonesia", "aff_domain": "sussex.ac.uk;bcamath.org;monash.edu", "position": "PhD student;PhD student;Full Professor", "bibtex": "@misc{\nng2024understanding,\ntitle={Understanding and addressing spurious correlation via Neural Tangent Kernels: A spectral bias perspective},\nauthor={Yeat Jeng Ng and Ainhize Barrainkua and Novi Quadrianto},\nyear={2024},\nurl={https://openreview.net/forum?id=89AOrk05uy}\n}", "github": "", "project": "", "reviewers": "hgH8;cfRQ;XMhp", "site": "https://openreview.net/forum?id=89AOrk05uy", "pdf_size": 36589025, "rating": "3;3;6", "confidence": "4;4;4", "soundness": "1;2;3", "contribution": "1;1;3", "presentation": "3;3;4", "wc_summary": "188;118;175", "wc_strengths": "104;55;130", "wc_weaknesses": "826;356;217", "wc_questions": "130;62;22", "wc_review": "1248;591;544", "wc_reply_reviewers": "111;202;56", "wc_reply_authors": "307;630;238", "reply_reviewers": "1;1;1", "reply_authors": "1;1;1", "rating_avg": [ 4.0, 1.4142135623730951 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.0, 0.816496580927726 ], "contribution_avg": [ 1.6666666666666667, 0.9428090415820634 ], "presentation_avg": [ 3.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 160.33333333333334, 30.40102337458761 ], "wc_strengths_avg": [ 96.33333333333333, 31.09483701338357 ], "wc_weaknesses_avg": [ 466.3333333333333, 260.5767108208679 ], "wc_questions_avg": [ 71.33333333333333, 44.58200932613463 ], "wc_review_avg": [ 794.3333333333334, 321.3641064102973 ], "wc_reply_reviewers_avg": [ 123.0, 60.20520464766037 ], "wc_reply_authors_avg": [ 391.6666666666667, 170.86511899416126 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 9, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:Te8q6S72rikJ:scholar.google.com/&scioq=Understanding+and+addressing+spurious+correlation+via+Neural+Tangent+Kernels:+A+spectral+bias+perspective&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1;2", "aff_unique_norm": "University of Sussex;Basque Center for Applied Mathematics;Monash University", "aff_unique_dep": ";;", "aff_unique_url": "https://www.sussex.ac.uk;https://www.bcamath.org/;https://www.monash.edu.id", "aff_unique_abbr": "Sussex;BCAM;Monash", "aff_campus_unique_index": "1", "aff_campus_unique": ";Indonesia", "aff_country_unique_index": "0;1;2", "aff_country_unique": "United Kingdom;Spain;Indonesia" }, { "id": "89XNDtqhpL", "title": "MatFormer: Nested Transformer for Elastic Inference", "track": "main", "status": "Reject", "tldr": "", 
"abstract": "Transformer models are deployed in a wide range of settings, from multi-accelerator clusters to standalone mobile phones. The diverse inference constraints in these scenarios necessitate practitioners to train foundation models such as PaLM 2, Llama, & ViTs as a series of models of varying sizes. Due to significant training costs, only a select few model sizes are trained and supported, limiting more fine-grained control over relevant tradeoffs, including latency, cost, and accuracy. This work introduces MatFormer, a nested Transformer architecture designed to offer elasticity in a variety of deployment constraints. Each Feed Forward Network (FFN) block of a MatFormer model is jointly optimized with a few nested smaller FFN blocks. This training procedure allows for the Mix'n'Match of model granularities across layers -- i.e., a trained universal MatFormer model enables extraction of hundreds of accurate smaller models, which were never explicitly optimized. We empirically demonstrate MatFormer's effectiveness across different model classes (decoders & encoders), modalities (language & vision), and scales (up to 2.6B parameters). We find that a 2.6B decoder-only MatFormer language model (MatLM) allows us to extract smaller models spanning from 1.5B to 2.6B, each exhibiting comparable validation loss and one-shot downstream evaluations to their independently trained counterparts. Furthermore, we observe that smaller encoders extracted from a universal MatFormer-based ViT (MatViT) encoder preserve the metric-space structure for adaptive large-scale retrieval. Finally, we showcase that speculative decoding with the accurate and consistent submodels extracted from MatFormer can further reduce inference latency.", "keywords": "Transformer;Neural Architecture Design;Large-scale deployment;Efficiency", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/9c05c9481de346aa885b02c262fbf2fc546fce1e.pdf", "author": "Fnu Devvrit;Sneha Kudugunta;Aditya Kusupati;Tim Dettmers;Kaifeng Chen;Inderjit S Dhillon;Yulia Tsvetkov;Hannaneh Hajishirzi;Sham M. 
Kakade;Ali Farhadi;Prateek Jain", "authorids": "~Fnu_Devvrit1;~Sneha_Kudugunta1;~Aditya_Kusupati1;~Tim_Dettmers2;~Kaifeng_Chen2;~Inderjit_S_Dhillon1;~Yulia_Tsvetkov1;~Hannaneh_Hajishirzi1;~Sham_M._Kakade1;~Ali_Farhadi3;~Prateek_Jain1", "gender": "M;F;M;M;M;M;F;F;M;M;M", "homepage": ";;http://www.adityakusupati.com/;https://timdettmers.com/;;http://www.cs.utexas.edu/users/inderjit/;https://homes.cs.washington.edu/~yuliats/;https://homes.cs.washington.edu/~hannaneh/;https://shamulent.github.io;https://homes.cs.washington.edu/~ali/;http://prateekjain.org", "dblp": ";;231/7662;172/1045;186/7404;d/InderjitSDhillon;75/8157;52/1296;s/SMKakade;37/5826;https://dblp.uni-trier.de/pers/j/Jain_0002:Prateek.html", "google_scholar": "c86HtPoAAAAJ;LeEwxtgAAAAJ;https://scholar.google.co.in/citations?user=qULx8g8AAAAJ;lHI3w5kAAAAJ;xjEcoNQAAAAJ;xBv5ZfkAAAAJ;SEDPkrsAAAAJ;LOV6_WIAAAAJ;https://scholar.google.com.tw/citations?user=wb-DKCIAAAAJ;jeOFRDsAAAAJ;qYhRbJoAAAAJ", "orcid": ";;0000-0001-8455-1851;;;;0000-0002-4634-7128;;;;", "linkedin": "devvrit/;;adityakusupati/;;kaifeng-chen-b37a2b69/;inderjit-dhillon-a20888b0/;;;;;", "or_profile": "~Fnu_Devvrit1;~Sneha_Kudugunta1;~Aditya_Kusupati1;~Tim_Dettmers2;~Kaifeng_Chen2;~Inderjit_S_Dhillon1;~Yulia_Tsvetkov1;~Hannaneh_Hajishirzi1;~Sham_M._Kakade1;~Ali_Farhadi3;~Prateek_Jain1", "aff": ", University of Texas at Austin;Google DeepMind;Department of Computer Science, University of Washington;University of Washington;Google;University of Texas, Austin;Department of Computer Science, University of Washington;University of Washington;Harvard University;University of Washington;Google", "aff_domain": "cs.utexas.edu;google.com;cs.washington.edu;cs.washington.edu;google.com;utexas.edu;cs.washington.edu;uw.edu;harvard.edu;cs.uw.edu;google.com", "position": "PhD student;Researcher;PhD student;PhD student;Researcher;Full Professor;Associate Professor;Associate Professor;Full Professor;Full Professor;Researcher", "bibtex": "@misc{\ndevvrit2024matformer,\ntitle={MatFormer: Nested Transformer for Elastic Inference},\nauthor={Fnu Devvrit and Sneha Kudugunta and Aditya Kusupati and Tim Dettmers and Kaifeng Chen and Inderjit S Dhillon and Yulia Tsvetkov and Hannaneh Hajishirzi and Sham M. 
Kakade and Ali Farhadi and Prateek Jain},\nyear={2024},\nurl={https://openreview.net/forum?id=89XNDtqhpL}\n}", "github": "", "project": "", "reviewers": "J4dY;CZp9;UoXf;EdnT", "site": "https://openreview.net/forum?id=89XNDtqhpL", "pdf_size": 639959, "rating": "5;5;6;8", "confidence": "4;3;4;3", "soundness": "2;3;2;4", "contribution": "2;2;3;4", "presentation": "2;3;3;4", "wc_summary": "48;131;104;62", "wc_strengths": "27;95;116;45", "wc_weaknesses": "172;425;381;173", "wc_questions": "53;81;11;42", "wc_review": "300;732;612;322", "wc_reply_reviewers": "0;117;0;0", "wc_reply_authors": "968;935;811;549", "reply_reviewers": "0;1;0;0", "reply_authors": "4;4;3;3", "rating_avg": [ 6.0, 1.224744871391589 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.75, 0.82915619758885 ], "contribution_avg": [ 2.75, 0.82915619758885 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 86.25, 33.04826016600571 ], "wc_strengths_avg": [ 70.75, 36.09968836430586 ], "wc_weaknesses_avg": [ 287.75, 116.2956899459305 ], "wc_questions_avg": [ 46.75, 25.063668925358872 ], "wc_review_avg": [ 491.5, 185.58219203361082 ], "wc_reply_reviewers_avg": [ 29.25, 50.66248612138966 ], "wc_reply_authors_avg": [ 815.75, 164.75644903918027 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 3.5, 0.5 ], "replies_avg": [ 22, 0 ], "authors#_avg": [ 11, 0 ], "corr_rating_confidence": -0.40824829046386296, "gs_citation": 11, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=15483101880052662391&as_sdt=5,47&sciodt=0,47&hl=en", "gs_version_total": 4, "aff_unique_index": "0;1;2;2;1;0;2;2;3;2;1", "aff_unique_norm": "University of Texas at Austin;Google;University of Washington;Harvard University", "aff_unique_dep": ";Google DeepMind;Department of Computer Science;", "aff_unique_url": "https://www.utexas.edu;https://deepmind.com;https://www.washington.edu;https://www.harvard.edu", "aff_unique_abbr": "UT Austin;DeepMind;UW;Harvard", "aff_campus_unique_index": "0;2;3;0;2;3", "aff_campus_unique": "Austin;;Seattle;Mountain View", "aff_country_unique_index": "0;1;0;0;0;0;0;0;0;0;0", "aff_country_unique": "United States;United Kingdom" }, { "id": "89ZekEEsSJ", "title": "Stealthy Targeted Backdoor Attack Against Image Captioning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "We study backdoor attacks against image caption models, whose security issues have received less scrutiny compared with other multimodal tasks. Existing backdoor attacks typically pair a trigger either with a predefined sentence or a single word as the targeted output, yet they are unrelated to the image content, making them easily noticeable as anomalies by humans. In this paper, we present a novel method to craft targeted backdoor attacks against image caption models, which are designed to be stealthier than prior attacks. Specifically, our method first learns a special trigger by leveraging universal perturbation techniques for object detection, then places the learned trigger in the center of some specific source object and modifies the corresponding object name in the output caption to a predefined target name. During the prediction phase, the caption produced by the backdoored model for input images with the trigger can accurately convey the semantic information of the rest of the whole image, while incorrectly recognizing the source object as the predefined target. 
Extensive experiments demonstrate that our approach can achieve a high attack success rate while having a negligible impact on model clean performance. In addition, we show our method is stealthy in that the produced backdoor samples are indistinguishable from clean samples in both image and text domains, which can successfully bypass existing backdoor defenses, highlighting the need for better defensive mechanisms against such stealthy backdoor attacks.", "keywords": "Machine Learning;Image Caption;Backdoor Attack", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/9fcd6274e7f84de436036ee93df2145fbdfd328b.pdf", "author": "Wenshu Fan;Hongwei Li;Wenbo Jiang;Meng Hao;Xiao Zhang", "authorids": "~Wenshu_Fan1;~Hongwei_Li2;~Wenbo_Jiang1;~Meng_Hao1;~Xiao_Zhang2", "gender": "M;M;M;;M", "homepage": "https://github.com/meIody97;https://faculty.uestc.edu.cn/lihongwei/zh_CN/index.htm;https://wenbo-jiang.github.io/;;https://xiao-zhang.net", "dblp": "285/2460;39/5544-1;34/10703-1.html;;", "google_scholar": ";-o6u2gwAAAAJ;https://scholar.google.com.sg/citations?user=OjHzvJkAAAAJ;;L-lz7CUAAAAJ", "orcid": ";;0000-0002-4592-8094;;0009-0008-1837-7670", "linkedin": ";;;;", "or_profile": "~Wenshu_Fan1;~Hongwei_Li2;~Wenbo_Jiang1;~Meng_Hao1;~Xiao_Zhang2", "aff": "University of Electronic Science and Technology of China;University of Electronic Science and Technology of China, Tsinghua University;University of Electronic Science and Technology of China;;CISPA Helmholtz Center for Information Security", "aff_domain": "uestc.edu.cn;uestc.edu.cn;uestc.edu.cn;;cispa.de", "position": "PhD student;Full Professor;Postdoc;;Tenure-Track Faculty", "bibtex": "@misc{\nfan2024stealthy,\ntitle={Stealthy Targeted Backdoor Attack Against Image Captioning},\nauthor={Wenshu Fan and Hongwei Li and Wenbo Jiang and Meng Hao and Xiao Zhang},\nyear={2024},\nurl={https://openreview.net/forum?id=89ZekEEsSJ}\n}", "github": "", "project": "", "reviewers": "nNC3;1VPN;MmsG;sNE8", "site": "https://openreview.net/forum?id=89ZekEEsSJ", "pdf_size": 840700, "rating": "5;5;5;5", "confidence": "4;3;5;4", "soundness": "2;3;2;2", "contribution": "2;2;2;2", "presentation": "3;3;3;2", "wc_summary": "131;82;71;66", "wc_strengths": "81;39;53;24", "wc_weaknesses": "443;57;155;389", "wc_questions": "7;86;5;5", "wc_review": "662;264;284;484", "wc_reply_reviewers": "0;0;55;15", "wc_reply_authors": "592;202;926;916", "reply_reviewers": "0;0;1;1", "reply_authors": "1;1;2;2", "rating_avg": [ 5.0, 0.0 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 87.5, 25.773047937719745 ], "wc_strengths_avg": [ 49.25, 21.00446381129497 ], "wc_weaknesses_avg": [ 261.0, 159.968746947646 ], "wc_questions_avg": [ 25.75, 34.79493497622894 ], "wc_review_avg": [ 423.5, 162.35993964029427 ], "wc_reply_reviewers_avg": [ 17.5, 22.5 ], "wc_reply_authors_avg": [ 659.0, 296.08951349211947 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 8, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10372884778743723752&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 9, "aff_unique_index": "0;0;0;1", "aff_unique_norm": "University of Electronic Science and Technology of China;CISPA Helmholtz Center for Information Security", "aff_unique_dep": 
";", "aff_unique_url": "https://www.uestc.edu.cn;https://www.cispa.de/", "aff_unique_abbr": "UESTC;CISPA", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;1", "aff_country_unique": "China;Germany" }, { "id": "89bUur0Q4J", "title": "Vision-Language Subspace Prompting", "track": "main", "status": "Reject", "tldr": "", "abstract": "Prompting vision-language models like CLIP to adapt to downstream tasks is currently topical. A seminal technique to this end is context optimization, which replaces a subset of textual tokens with trainable parameters (a.k.a soft prompts). However, current pipelines use a single vector embedding induced by soft prompts as the classifier weight for visual recognition. This can lead to problems where the learned soft prompts overfit to base classes\u2019 training data, resulting in poor performance when applied to novel classes. Several approaches were proposed to address this issue by regularizing the learned soft prompts to align them with handcrafted text/hard prompts. However, excessive regularization of the soft prompts can hurt the model\u2019s performance on the base classes it is trained on. Maintaining the right balance to ensure strong base- and novel-class performance is crucial but non-trivial. In this paper, we introduce a novel subspace-based prompt learning method, named SuPr, which can effectively model subspaces spanning the embeddings\nof both the learnable soft and the textual/hard prompts. Our subspace-based alignment between hand-crafted and learnable prompts balances these effects to achieve excellent fitting of base classes as well as generalization to novel classes. With the advantages of subspace modelling, our SuPr shows its effectiveness on generalization from base to new, domain generalization, cross-dataset transfer and few-shot learning, leading to new state-of-the-art results in all settings.", "keywords": "Prompt Learning; Vision Language Models", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Yujun Tong;Da Li;Dongliang Chang;Tianwei Cao;Timothy Hospedales;Yi-Zhe Song;Zhanyu Ma", "authorids": "~Yujun_Tong1;~Da_Li3;~Dongliang_Chang2;~Tianwei_Cao1;~Timothy_Hospedales1;~Yi-Zhe_Song2;~Zhanyu_Ma1", "gender": "M;M;M;M;M;M;M", "homepage": ";https://dali-dl.github.io/;https://www.dongliangchang.cn/;https://github.com/caotianwei;http://homepages.inf.ed.ac.uk/thospeda/;http://personal.ee.surrey.ac.uk/Personal/Y.Song/;https://zhanyuma.cn/", "dblp": "294/5100;43/4804-1;236/3116;;32/3545;98/1684;", "google_scholar": "8jks3_kAAAAJ;RPvaE3oAAAAJ;tIf50PgAAAAJ;;https://scholar.google.fr/citations?user=nHhtvqkAAAAJ;https://scholar.google.co.uk/citations?user=irZFP_AAAAAJ;5GAAs7IAAAAJ", "orcid": ";0000-0002-2101-2989;0000-0002-4081-3001;;0000-0003-4867-7486;;0000-0003-2950-2488", "linkedin": ";;;;timothyhospedales/;;", "or_profile": "~Yujun_Tong1;~Da_Li3;~Dongliang_Chang2;~Tianwei_Cao1;~Timothy_Hospedales1;~Yi-Zhe_Song2;~Zhanyu_Ma1", "aff": "Beijing University of Posts and Telecommunications;University of Edinburgh;Tsinghua University;University of Chinese Academy of Sciences;Samsung AI Research Centre;University of Surrey;Beijing University of Post and Telecommunication", "aff_domain": "bupt.edu.cn;ed.ac.uk;tsinghua.edu.cn;ucas.ac.cn;samsung.com;surrey.ac.uk;bupt.edu.cn", "position": "PhD student;Visiting Scholar;Postdoc;PhD student;Principal Researcher;Professor;Full Professor", "bibtex": 
"@misc{\ntong2024visionlanguage,\ntitle={Vision-Language Subspace Prompting},\nauthor={Yujun Tong and Da Li and Dongliang Chang and Tianwei Cao and Timothy Hospedales and Yi-Zhe Song and Zhanyu Ma},\nyear={2024},\nurl={https://openreview.net/forum?id=89bUur0Q4J}\n}", "github": "", "project": "", "reviewers": "SWVW;nXYV;kdeh;Keaq", "site": "https://openreview.net/forum?id=89bUur0Q4J", "pdf_size": 47646175, "rating": "3;5;5;6", "confidence": "4;5;3;3", "soundness": "2;3;3;3", "contribution": "2;2;2;3", "presentation": "2;3;3;3", "wc_summary": "52;48;47;37", "wc_strengths": "27;33;41;22", "wc_weaknesses": "68;207;17;32", "wc_questions": "4;6;37;3", "wc_review": "151;294;142;94", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "55;934;471;469", "reply_reviewers": "0;0;0;0", "reply_authors": "1;3;1;1", "rating_avg": [ 4.75, 1.0897247358851685 ], "confidence_avg": [ 3.75, 0.82915619758885 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 46.0, 5.522680508593631 ], "wc_strengths_avg": [ 30.75, 7.084313657652377 ], "wc_weaknesses_avg": [ 81.0, 75.0699673637867 ], "wc_questions_avg": [ 12.5, 14.186260959111108 ], "wc_review_avg": [ 170.25, 74.66048151465405 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 482.25, 311.01557436887305 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.5, 0.8660254037844386 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.3458572319330373, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:Po3-QoSvbEkJ:scholar.google.com/&scioq=Vision-Language+Subspace+Prompting&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1;2;3;4;5;0", "aff_unique_norm": "Beijing University of Posts and Telecommunications;University of Edinburgh;Tsinghua University;University of Chinese Academy of Sciences;Samsung;University of Surrey", "aff_unique_dep": ";;;;AI Research;", "aff_unique_url": "http://www.bupt.edu.cn/;https://www.ed.ac.uk;https://www.tsinghua.edu.cn;http://www.ucas.ac.cn;https://www.samsung.com/global/researchers/samsung-ai-research-centre/;https://www.surrey.ac.uk", "aff_unique_abbr": "BUPT;Edinburgh;THU;UCAS;SARC;Surrey", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Beijing;", "aff_country_unique_index": "0;1;0;0;2;1;0", "aff_country_unique": "China;United Kingdom;South Korea" }, { "id": "89l6VLPrin", "title": "Graph layouts and graph contrastive learning via neighbour embeddings", "track": "main", "status": "Reject", "tldr": "", "abstract": "In node-level graph representation learning, there are two distinct paradigms. One is known as graph layouts, where nodes are embedded into 2D space for visualization purposes. Another is graph contrastive learning, where nodes are parametrically embedded into a high-dimensional vector space based on node features. In this work, we show that these two paradigms are intimately related, and that both can be successfully approached via neighbour embedding methods. First, we introduce graph t-SNE for two-dimensional graph drawing, and show that the resulting layouts outperform all existing algorithms in terms of local structure preservation, as measured by kNN classification accuracy. Second, we introduce graph contrastive neighbor embedding (graph CNE)}, which uses a fully-connected neural network to transform graph node features into an embedding space by optimizing the contrastive InfoNCE objective. 
We show that graph CNE, while being conceptually simpler than most existing graph contrastive learning methods, produces competitive node representations, with state-of-the-art linear classification accuracy.", "keywords": "Graph Layout;Contrastive Learning;t-SNE", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Marius Keute;Alica Leonie Guzm\u00e1n;Dmitry Kobak", "authorids": "~Marius_Keute1;~Alica_Leonie_Guzm\u00e1n1;~Dmitry_Kobak2", "gender": "M;F;", "homepage": ";;https://dkobak.github.io/", "dblp": ";;236/5191", "google_scholar": "https://scholar.google.de/citations?user=cn2rZJ8AAAAJ;https://scholar.google.com/citations?hl=en;BUQbD5kAAAAJ", "orcid": ";;", "linkedin": ";;", "or_profile": "~Marius_Keute1;~Alica_Leonie_Guzm\u00e1n1;~Dmitry_Kobak2", "aff": ";Eberhard-Karls-Universit\u00e4t T\u00fcbingen;Eberhard-Karls-Universit\u00e4t T\u00fcbingen", "aff_domain": ";uni-tuebingen.de;uni-tuebingen.de", "position": ";MS student;Researcher", "bibtex": "@misc{\nkeute2024graph,\ntitle={Graph layouts and graph contrastive learning via neighbour embeddings},\nauthor={Marius Keute and Alica Leonie Guzm{\\'a}n and Dmitry Kobak},\nyear={2024},\nurl={https://openreview.net/forum?id=89l6VLPrin}\n}", "github": "", "project": "", "reviewers": "WEvC;pX5U;JHfU", "site": "https://openreview.net/forum?id=89l6VLPrin", "pdf_size": 13744935, "rating": "5;5;6", "confidence": "4;3;2", "soundness": "2;2;3", "contribution": "2;2;3", "presentation": "2;2;2", "wc_summary": "51;29;64", "wc_strengths": "22;52;16", "wc_weaknesses": "346;83;51", "wc_questions": "5;155;9", "wc_review": "424;319;140", "wc_reply_reviewers": "185;0;15", "wc_reply_authors": "1418;627;395", "reply_reviewers": "1;0;1", "reply_authors": "3;2;1", "rating_avg": [ 5.333333333333333, 0.4714045207910317 ], "confidence_avg": [ 3.0, 0.816496580927726 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.0, 0.0 ], "wc_summary_avg": [ 48.0, 14.445299120013633 ], "wc_strengths_avg": [ 30.0, 15.748015748023622 ], "wc_weaknesses_avg": [ 160.0, 132.16908362649212 ], "wc_questions_avg": [ 56.333333333333336, 69.78697745440923 ], "wc_review_avg": [ 294.3333333333333, 117.24712742275987 ], "wc_reply_reviewers_avg": [ 66.66666666666667, 83.8980863243548 ], "wc_reply_authors_avg": [ 813.3333333333334, 437.9287105860446 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 2.0, 0.816496580927726 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.8660254037844385, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:zivpkVhNyAkJ:scholar.google.com/&scioq=Graph+layouts+and+graph+contrastive+learning+via+neighbour+embeddings&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "Eberhard Karls University of T\u00fcbingen", "aff_unique_dep": "", "aff_unique_url": "https://www.uni-tuebingen.de/", "aff_unique_abbr": "Uni T\u00fcbingen", "aff_campus_unique_index": "0;0", "aff_campus_unique": "T\u00fcbingen", "aff_country_unique_index": "0;0", "aff_country_unique": "Germany" }, { "title": "A Policy Gradient Method for Confounded POMDPs", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19336", "id": "8BAkNCqpGW", "author_site": "Mao Hong, Zhengling Qi, Yanxun Xu", "tldr": "", "abstract": "In this paper, we 
propose a policy gradient method for confounded partially observable Markov decision processes (POMDPs) with continuous state and observation spaces in the offline setting. We first establish a novel identification result to non-parametrically estimate any history-dependent policy gradient under POMDPs using the offline data. The identification enables us to solve a sequence of conditional moment restrictions and adopt the min-max learning procedure with general function approximation for estimating the policy gradient. We then provide a finite-sample non-asymptotic bound for estimating the gradient uniformly over a pre-specified policy class in terms of the sample size, length of horizon, concentratability coefficient and the measure of ill-posedness in solving the conditional moment restrictions. Lastly, by deploying the proposed gradient estimation in the gradient ascent algorithm, we show the global convergence of the proposed algorithm in finding the history-dependent optimal policy under some technical conditions. To the best of our knowledge, this is the first work studying the policy gradient method for POMDPs under the offline setting.", "keywords": "Offline Reinforcement Learning;Confounded POMDP;Policy Gradient;Statistical Guarantee;Function Approximation", "primary_area": "learning theory", "supplementary_material": "", "author": "Mao Hong;Zhengling Qi;Yanxun Xu", "authorids": "~Mao_Hong1;~Zhengling_Qi1;~Yanxun_Xu1", "gender": "M;;F", "homepage": ";https://sites.google.com/view/statsqizl/home?authuser=0;http://www.ams.jhu.edu/~yxu70", "dblp": ";173/0201;", "google_scholar": "GUKNcVUAAAAJ;;https://scholar.google.com/citations?hl=en", "orcid": ";;", "linkedin": "mao-hong-a45624195/;;", "or_profile": "~Mao_Hong1;~Zhengling_Qi1;~Yanxun_Xu1", "aff": "Johns Hopkins University;George Washington University;Johns Hopkins University", "aff_domain": "jh.edu;gwu.edu;jhu.edu", "position": "PhD student;Assistant Professor;Associate Professor", "bibtex": "@inproceedings{\nhong2024a,\ntitle={A Policy Gradient Method for Confounded {POMDP}s},\nauthor={Mao Hong and Zhengling Qi and Yanxun Xu},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=8BAkNCqpGW}\n}", "github": "", "project": "", "reviewers": "4mko;KDFK;YGPH;5Pwh", "pdf_size": 961571, "rating": "8;8;8;8", "confidence": "2;3;3;1", "soundness": "4;3;3;4", "contribution": "3;3;3;4", "presentation": "3;2;3;3", "wc_summary": "65;94;50;191", "wc_strengths": "113;90;53;106", "wc_weaknesses": "259;273;34;94", "wc_questions": "105;79;48;204", "wc_review": "542;536;185;595", "wc_reply_reviewers": "59;0;0;117", "wc_reply_authors": "1406;698;536;1197", "reply_reviewers": "1;0;0;1", "reply_authors": "3;2;1;3", "rating_avg": [ 8.0, 0.0 ], "confidence_avg": [ 2.25, 0.82915619758885 ], "soundness_avg": [ 3.5, 0.5 ], "contribution_avg": [ 3.25, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 100.0, 54.868023474515645 ], "wc_strengths_avg": [ 90.5, 23.200215516240362 ], "wc_weaknesses_avg": [ 165.0, 103.32231124011889 ], "wc_questions_avg": [ 109.0, 58.44227921633447 ], "wc_review_avg": [ 464.5, 162.99463181344348 ], "wc_reply_reviewers_avg": [ 44.0, 48.54379466007988 ], "wc_reply_authors_avg": [ 959.25, 354.78963837744755 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 2.25, 0.82915619758885 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 6, "gs_cited_by_link": 
"https://scholar.google.com/scholar?cites=16526567701232919548&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 7, "openreview": "https://openreview.net/forum?id=8BAkNCqpGW", "pdf": "https://openreview.net/pdf?id=8BAkNCqpGW", "email": "jh.edu;gwu.edu;jhu.edu", "author_num": 3, "aff_unique_index": "0;1;0", "aff_unique_norm": "Johns Hopkins University;George Washington University", "aff_unique_dep": ";", "aff_unique_url": "https://www.jhu.edu;https://www.gwu.edu", "aff_unique_abbr": "JHU;GWU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "8Cc6qOPvFo", "title": "Text-Driven Image Editing using Cycle-Consistency-Driven Metric Learning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "We present a simple but effective training-free method for text-driven image-to-image translation based on pretrained text-to-image diffusion models. Since a naive application of the pre-trained diffusion models for the manipulation tasks often significantly destroys the structure or background of the source image, we revise the original backward process for the target image by meaningfully aligning better with a given target task while preserving the background or structure of a source image. We derive a new guidance objective term that is a combination of maximizing the similarity with target prompts rather than the source prompt based on the pre-trained CLIP and minimizing the distance with the source latents. Moreover, contrary to existing methods based on the diffusion models, we exploit the cycle-consistency objective in order to further maintain the background of the source image, where we perform an iterative optimization process by alternately optimizing the source and target latents. 
Experimental results demonstrate that the proposed method achieves outstanding editing performance on various tasks when combined with the pre-trained Stable Diffusion.", "keywords": "Diffusion Models;Text-Driven Image-to-Image Translation", "primary_area": "generative models", "supplementary_material": "", "author": "Hyunsoo Lee;Minsoo Kang;Bohyung Han", "authorids": "~Hyunsoo_Lee1;~Minsoo_Kang1;~Bohyung_Han1", "gender": "M;M;Not Specified", "homepage": ";https://kminsoo.github.io;http://cvlab.snu.ac.kr/~bhhan", "dblp": ";29/5268;73/4880.html", "google_scholar": "https://scholar.google.co.kr/citations?user=6JNXaH0AAAAJ;in5F4IUAAAAJ;9aaeCToAAAAJ", "orcid": ";;", "linkedin": "philip21/;;", "or_profile": "~Hyunsoo_Lee1;~Minsoo_Kang1;~Bohyung_Han1", "aff": "Seoul National University;Seoul National University;Seoul National University", "aff_domain": "snu.ac.kr;snu.ac.kr;snu.ac.kr", "position": "Undergrad student;PhD student;Full Professor", "bibtex": "@misc{\nlee2024textdriven,\ntitle={Text-Driven Image Editing using Cycle-Consistency-Driven Metric Learning},\nauthor={Hyunsoo Lee and Minsoo Kang and Bohyung Han},\nyear={2024},\nurl={https://openreview.net/forum?id=8Cc6qOPvFo}\n}", "github": "", "project": "", "reviewers": "q62i;Cs1x;k61j;GXjj", "site": "https://openreview.net/forum?id=8Cc6qOPvFo", "pdf_size": 11275276, "rating": "3;3;5;6", "confidence": "4;4;4;5", "soundness": "2;2;2;2", "contribution": "2;2;2;3", "presentation": "2;3;2;3", "wc_summary": "69;78;85;16", "wc_strengths": "22;20;121;52", "wc_weaknesses": "103;52;236;84", "wc_questions": "1;53;2;2", "wc_review": "195;203;444;154", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "161;137;255;95", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 4.25, 1.299038105676658 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 62.0, 27.15695122800054 ], "wc_strengths_avg": [ 53.75, 40.84345112744514 ], "wc_weaknesses_avg": [ 118.75, 70.104832215761 ], "wc_questions_avg": [ 14.5, 22.23173407541571 ], "wc_review_avg": [ 249.0, 114.10740554407501 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 162.0, 58.66003750424986 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 8, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.7777777777777777, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:ArsSUTvMqkgJ:scholar.google.com/&scioq=Text-Driven+Image+Editing+using+Cycle-Consistency-Driven+Metric+Learning&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;0", "aff_unique_norm": "Seoul National University", "aff_unique_dep": "", "aff_unique_url": "https://www.snu.ac.kr", "aff_unique_abbr": "SNU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "South Korea" }, { "id": "8Cw3yFqPDX", "title": "Buffered Asynchronous Federated Learning with Local Differential Privacy", "track": "main", "status": "Reject", "tldr": "", "abstract": "Federated Learning (FL) allows multiple parties to collaboratively train a machine learning (ML) model without having to disclose their training data.\nClients train their own models locally and share only model updates with an aggregation server.\nThe first FL deployments have been in synchronous settings, with all clients performing training and sharing model updates simultaneously.\nMore 
recently, {\\em Asynchronous FL} (Async-FL) has emerged as a new approach that allows clients to train at their own pace and send/receive updates when they are ready.\n\nWhile FL is inherently less privacy-invasive than alternative centralized ML approaches, (aggregate) model updates can still leak sensitive information about clients' data.\nTherefore, FL algorithms need to satisfy Differential Privacy (DP) to provably limit leakage.\nAlas, previous work on Async-FL has only considered Central DP, which requires trust in the server, and thus may not always be viable.\nIn this paper, we present the first technique that satisfies {\\em Local DP} (LDP) in the context of the state-of-the-art aggregation algorithm for Async-FL, namely, FedBuff.\nWe experimentally demonstrate on three benchmark FL datasets that our LDP technique performs equally well and, in some cases, better than FedBuff with Central DP.\nFinally, we study how the {\\em staleness} of the model updates received by the asynchronous FL clients can be used to improve utility while preserving privacy under different attack setups.", "keywords": "Asynchronous Federated Learning;Differential Privacy", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Mohammad Naseri;Nicolas Kourtellis;Emiliano De Cristofaro", "authorids": "~Mohammad_Naseri1;~Nicolas_Kourtellis1;~Emiliano_De_Cristofaro1", "gender": "M;;M", "homepage": ";https://emilianodc.com;", "dblp": ";36/6225;96/8779", "google_scholar": "FqFAeIYAAAAJ;https://scholar.google.com/citations?hl=en;Q5oWwiQAAAAJ", "orcid": ";;0000-0002-5674-1698", "linkedin": ";;", "or_profile": "~Mohammad_Naseri1;~Emiliano_De_Cristofaro1;~Nicolas_Kourtellis2", "aff": "Flower Labs;University of California, Riverside;Telefonica Research", "aff_domain": "flower.ai;ucr.edu;telefonica.com", "position": "Researcher;Full Professor;Director of Research", "bibtex": "@misc{\nnaseri2024buffered,\ntitle={Buffered Asynchronous Federated Learning with Local Differential Privacy},\nauthor={Mohammad Naseri and Nicolas Kourtellis and Emiliano De Cristofaro},\nyear={2024},\nurl={https://openreview.net/forum?id=8Cw3yFqPDX}\n}", "github": "", "project": "", "reviewers": "g7c5;gsJz;fiZQ;xZb7", "site": "https://openreview.net/forum?id=8Cw3yFqPDX", "pdf_size": 366060, "rating": "1;3;3;5", "confidence": "4;4;4;5", "soundness": "1;1;2;3", "contribution": "1;1;2;2", "presentation": "2;3;2;2", "wc_summary": "26;45;21;140", "wc_strengths": "24;31;26;68", "wc_weaknesses": "109;65;85;47", "wc_questions": "78;58;3;26", "wc_review": "237;199;135;281", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 3.0, 1.4142135623730951 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 1.75, 0.82915619758885 ], "contribution_avg": [ 1.5, 0.5 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 58.0, 48.181946826586405 ], "wc_strengths_avg": [ 37.25, 17.93564885918544 ], "wc_weaknesses_avg": [ 76.5, 23.08137777516758 ], "wc_questions_avg": [ 41.25, 28.838992700855556 ], "wc_review_avg": [ 213.0, 53.5723809439155 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 6, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.816496580927726, "gs_citation": 0, "gs_cited_by_link": 
"https://scholar.google.com/scholar?q=related:V00-zUNGZJ8J:scholar.google.com/&scioq=Buffered+Asynchronous+Federated+Learning+with+Local+Differential+Privacy&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;1;2", "aff_unique_norm": "Flower Labs;University of California, Riverside;Telefonica", "aff_unique_dep": ";;Research", "aff_unique_url": ";https://www.ucr.edu;https://www.telefonica.com", "aff_unique_abbr": ";UCR;Telefonica", "aff_campus_unique_index": "1", "aff_campus_unique": ";Riverside", "aff_country_unique_index": "0;0;1", "aff_country_unique": "United States;Spain" }, { "id": "8DLVrWL78S", "title": "Streamlining Generative Models for Structure-Based Drug Design", "track": "main", "status": "Reject", "tldr": "", "abstract": "Generative models for structure-based drug design (SBDD) aim to generate novel 3D molecules for specified protein targets $\\textit{in silico}$. The prevailing paradigm focuses on model expressivity - typically with powerful Graph Neural Network (GNN) models - but is agnostic to binding affinity during training, potentially overlooking better molecules. We address this issue with a two-pronged approach: learn an economical surrogate for affinity to infer an unlabeled molecular graph, and optimize for labels conditioned on this graph and desired molecular properties (e.g., QED, SA). The resulting model FastSBDD achieves state-of-the-art results as well as streamlined computation and model size (up to 1000x faster and with 100x fewer trainable parameters compared to existing methods), paving way for improved docking software. We also establish rigorous theoretical results to expose the representation limits of GNNs in SBDD contexts and the generalizability of our affinity scoring model, advocating more emphasis on generalization going forward.", "keywords": "drug design;binding;docking;graph neural networks;generalization bounds", "primary_area": "applications to physical sciences (physics, chemistry, biology, etc.)", "supplementary_material": "/attachment/2e87e16cc7197b69e1920028c29e14f2093dd5f6.zip", "author": "Rafal Karczewski;Markus Heinonen;Vikas Garg", "authorids": "~Rafal_Karczewski1;~Markus_Heinonen1;~Vikas_Garg2", "gender": ";M;", "homepage": ";https://users.aalto.fi/~heinom10/;", "dblp": "228/6790;22/7709;", "google_scholar": ";hFtfHZoAAAAJ;", "orcid": ";;", "linkedin": "rafal-karczewski-906ab010a;;", "or_profile": "~Rafal_Karczewski1;~Markus_Heinonen1;~Vikas_Garg2", "aff": "Aalto University;Aalto University;", "aff_domain": "aalto.fi;aalto.fi;", "position": "PhD student;Researcher;", "bibtex": "@misc{\nkarczewski2024streamlining,\ntitle={Streamlining Generative Models for Structure-Based Drug Design},\nauthor={Rafal Karczewski and Markus Heinonen and Vikas Garg},\nyear={2024},\nurl={https://openreview.net/forum?id=8DLVrWL78S}\n}", "github": "", "project": "", "reviewers": "A4Na;aZds;zMwy;jdjh", "site": "https://openreview.net/forum?id=8DLVrWL78S", "pdf_size": 1101616, "rating": "3;3;5;5", "confidence": "3;4;4;4", "soundness": "2;1;2;3", "contribution": "2;2;2;3", "presentation": "3;2;3;2", "wc_summary": "69;71;115;31", "wc_strengths": "34;69;22;44", "wc_weaknesses": "210;220;166;130", "wc_questions": "35;19;58;25", "wc_review": "348;379;361;230", "wc_reply_reviewers": "112;0;206;0", "wc_reply_authors": "1142;716;2052;575", "reply_reviewers": "1;0;1;0", "reply_authors": "3;2;5;2", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.0, 0.7071067811865476 ], "contribution_avg": [ 2.25, 
0.4330127018922193 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 71.5, 29.744747435471695 ], "wc_strengths_avg": [ 42.25, 17.297037318569906 ], "wc_weaknesses_avg": [ 181.5, 36.010415160061676 ], "wc_questions_avg": [ 34.25, 14.85555451674558 ], "wc_review_avg": [ 329.5, 58.4914523669912 ], "wc_reply_reviewers_avg": [ 79.5, 86.16698903872643 ], "wc_reply_authors_avg": [ 1121.25, 576.4856351202517 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 3.0, 1.224744871391589 ], "replies_avg": [ 22, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.5773502691896257, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:JEfpuRRtM_sJ:scholar.google.com/&scioq=Streamlining+Generative+Models+for+Structure-Based+Drug+Design&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "Aalto University", "aff_unique_dep": "", "aff_unique_url": "https://www.aalto.fi", "aff_unique_abbr": "Aalto", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "Finland" }, { "id": "8DW3aSOnou", "title": "Video Deblurring with Adaptive High-frequency Extraction", "track": "main", "status": "Reject", "tldr": "", "abstract": "State-of-the-art video deblurring methods use deep network architectures to recover sharpened video frames. Blurring especially degrades high-frequency information yet this aspect is often overlooked by recent models that focus more on enhancing architectural design. The recovery of high frequency detailing can be non-trivial, in part due to the spectral bias of neural networks. Neural networks are biased towards learning low frequency functions, making it to prioritize learning low frequency components. To enhance the learning of latent high frequencies, it is necessary to enforce explicit structures to capture the fine details or edges. This work merges the principles of the classic unsharp masking with a deep learning framework to emphasize the essential role of high-frequency information in deblurring. We generate an adaptive kernel, constructed from a convex combination of dynamic coefficients and predefined high-pass filtering kernels. This kernel is then employed in a spatio-temporal 3D convolution process to extract high-frequency components from the data. This method significantly improves video deblurring, achieving a noteworthy enhancement with an increase of up to 0.61dB in PSNR over top models on GORPO dataset. 
Additionally, it outpaces the majority of them in inference time.", "keywords": "video deblurring;deep learning;unsharp masking", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Bo Ji;Angela Yao", "authorids": "~Bo_Ji2;~Angela_Yao1", "gender": ";", "homepage": ";http://www.angelayao.com", "dblp": ";64/8484", "google_scholar": ";https://scholar.google.ch/citations?user=-LJCZMMAAAAJ", "orcid": ";", "linkedin": ";", "or_profile": "~Bo_Ji2;~Angela_Yao1", "aff": ";National University of Singapore", "aff_domain": ";nus.edu.sg", "position": ";Associate Professor", "bibtex": "@misc{\nji2024video,\ntitle={Video Deblurring with Adaptive High-frequency Extraction},\nauthor={Bo Ji and Angela Yao},\nyear={2024},\nurl={https://openreview.net/forum?id=8DW3aSOnou}\n}", "github": "", "project": "", "reviewers": "Ebb6;HuzH;a8DG;5xHX", "site": "https://openreview.net/forum?id=8DW3aSOnou", "pdf_size": 16821352, "rating": "3;3;5;8", "confidence": "5;5;4;2", "soundness": "2;2;2;3", "contribution": "1;2;2;3", "presentation": "1;2;3;3", "wc_summary": "28;51;62;22", "wc_strengths": "18;12;54;41", "wc_weaknesses": "95;8;65;166", "wc_questions": "4;226;48;4", "wc_review": "145;297;229;233", "wc_reply_reviewers": "0;0;138;0", "wc_reply_authors": "528;603;104;233", "reply_reviewers": "0;0;1;0", "reply_authors": "1;1;1;1", "rating_avg": [ 4.75, 2.0463381929681126 ], "confidence_avg": [ 4.0, 1.224744871391589 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 2.25, 0.82915619758885 ], "wc_summary_avg": [ 40.75, 16.361158271956175 ], "wc_strengths_avg": [ 31.25, 17.020208576865326 ], "wc_weaknesses_avg": [ 83.5, 56.967095765889276 ], "wc_questions_avg": [ 70.5, 91.55735907069403 ], "wc_review_avg": [ 226.0, 53.99073994677235 ], "wc_reply_reviewers_avg": [ 34.5, 59.75575286112627 ], "wc_reply_authors_avg": [ 367.0, 205.39109036177786 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.9975093361076329, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:NjfiiTs63KYJ:scholar.google.com/&scioq=Video+Deblurring+with+Adaptive+High-frequency+Extraction&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0", "aff_unique_norm": "National University of Singapore", "aff_unique_dep": "", "aff_unique_url": "https://www.nus.edu.sg", "aff_unique_abbr": "NUS", "aff_country_unique_index": "0", "aff_country_unique": "Singapore" }, { "title": "CLAP: Collaborative Adaptation for Patchwork Learning", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19335", "id": "8EyRkd3Qj2", "author_site": "Sen Cui, Abudukelimu Wuerkaixi, Weishen Pan, Jian Liang, Lei Fang, Changshui Zhang, Fei Wang", "tldr": "", "abstract": "In this paper, we investigate a new practical learning scenario, where the data distributed in different sources/clients are typically generated with various modalities. Existing research on learning from multi-source data mostly assume that each client owns the data of all modalities, which may largely limit its practicability. In light of the expensiveness and sparsity of multimodal data, we propose patchwork learning to jointly learn from fragmented multimodal data in distributed clients. 
Considering the concerns on data privacy, patchwork learning aims to impute incomplete multimodal data for diverse downstream tasks without accessing the raw data directly. Local clients could miss different modality combinations. Due to the statistical heterogeneity induced by non-i.i.d. data, the imputation is more challenging since the learned dependencies fail to adapt to the imputation of other clients. In this paper, we provide a novel imputation framework to tackle modality combination heterogeneity and statistical heterogeneity simultaneously, called ``collaborative adaptation''. In particular, for two observed modality combinations from two clients, we learn the transformations between their maximal intersection and other modalities by proposing a novel ELBO. We improve the worst-performing required transformations through a Pareto min-max optimization framework. In extensive experiments, we demonstrate the superiority of the proposed method compared to existing related methods on benchmark data sets and a real-world clinical data set.", "keywords": "Patchwork learning;robustness", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Sen Cui;Abudukelimu Wuerkaixi;Weishen Pan;Jian Liang;Lei Fang;Changshui Zhang;Fei Wang", "authorids": "~Sen_Cui1;~Abudukelimu_Wuerkaixi1;~Weishen_Pan1;~Jian_Liang3;~Lei_Fang6;~Changshui_Zhang2;~Fei_Wang3", "gender": "M;M;M;M;;M;", "homepage": ";https://www.baidu.com;https://scholar.google.com/citations?user=PtTBMhUAAAAJ;;https://linkedin.com/in/leifang;http://bigeye.au.tsinghua.edu.cn/english/Introduction.html;https://wcm-wanglab.github.io/index.html", "dblp": "267/5483;293/3368;161/2032;19/2208;;z/ChangshuiZhang;52/3194-9.html", "google_scholar": "UzQuG1UAAAAJ;;PtTBMhUAAAAJ;mrunnpoAAAAJ;;GL9M37YAAAAJ;https://scholar.google.com/citations?hl=en", "orcid": ";;0009-0006-0431-5642;;;;", "linkedin": ";;;;;;fei-wang-50682425/", "or_profile": "~Sen_Cui1;~Abudukelimu_Wuerkaixi1;~Weishen_Pan1;~Jian_Liang3;~Lei_Fang6;~Changshui_Zhang2;~Fei_Wang3", "aff": "Tsinghua University;Tsinghua University, Beijing;Weill Cornell Medicine, Cornell University;Kuaishou Technology;;Tsinghua University;Cornell University", "aff_domain": "tsinghua.edu.cn;tsinghua.edu.cn;med.cornell.edu;kuaishou.com;;mail.tsinghua.edu.cn;cornell.edu", "position": "PhD student;PhD student;Postdoc;Senior Algorithm Engineer;;Full Professor;Full Professor", "bibtex": "@inproceedings{\ncui2024clap,\ntitle={{CLAP}: Collaborative Adaptation for Patchwork Learning},\nauthor={Sen Cui and Abudukelimu Wuerkaixi and Weishen Pan and Jian Liang and Lei Fang and Changshui Zhang and Fei Wang},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=8EyRkd3Qj2}\n}", "github": "", "project": "", "reviewers": "QCRo;ccS1;scKN;DjdF", "pdf_size": 4277230, "rating": "6;8;8;8", "confidence": "4;4;5;2", "soundness": "4;3;3;3", "contribution": "3;4;4;3", "presentation": "3;3;3;3", "wc_summary": "128;126;143;104", "wc_strengths": "158;173;166;67", "wc_weaknesses": "145;146;85;33", "wc_questions": "76;146;102;60", "wc_review": "507;591;496;264", "wc_reply_reviewers": "0;22;0;62", "wc_reply_authors": "1720;1152;683;1040", "reply_reviewers": "0;1;0;1", "reply_authors": "3;2;1;2", "rating_avg": [ 7.5, 0.8660254037844386 ], "confidence_avg": [ 3.75, 1.0897247358851685 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 3.5, 0.5 ], 
"presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 125.25, 13.91716565971678 ], "wc_strengths_avg": [ 141.0, 43.05229378325852 ], "wc_weaknesses_avg": [ 102.25, 46.99667541433117 ], "wc_questions_avg": [ 96.0, 32.526911934581186 ], "wc_review_avg": [ 464.5, 121.45060724426206 ], "wc_reply_reviewers_avg": [ 21.0, 25.317977802344327 ], "wc_reply_authors_avg": [ 1148.75, 372.5207209001937 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 2.0, 0.7071067811865476 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.13245323570650439, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=16746551509627980679&as_sdt=5,34&sciodt=0,34&hl=en", "gs_version_total": 2, "openreview": "https://openreview.net/forum?id=8EyRkd3Qj2", "pdf": "https://openreview.net/pdf?id=8EyRkd3Qj2", "email": "tsinghua.edu.cn;tsinghua.edu.cn;med.cornell.edu;kuaishou.com;;mail.tsinghua.edu.cn;cornell.edu", "author_num": 7, "aff_unique_index": "0;0;1;2;0;1", "aff_unique_norm": "Tsinghua University;Cornell University;Kuaishou Technology", "aff_unique_dep": ";;", "aff_unique_url": "https://www.tsinghua.edu.cn;https://www.weill.cornell.edu;https://www.kuaishou.com", "aff_unique_abbr": "THU;Cornell;Kuaishou", "aff_campus_unique_index": "1;2", "aff_campus_unique": ";Beijing;Weill Cornell Medicine", "aff_country_unique_index": "0;0;1;0;0;1", "aff_country_unique": "China;United States" }, { "title": "Language-Interfaced Tabular Oversampling via Progressive Imputation and Self-Authentication", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19334", "id": "8F6bws5JBy", "author_site": "June Yong Yang, Geondo Park, Joowon Kim, Hyeongwon Jang, Eunho Yang", "tldr": "", "abstract": "Tabular data in the wild are frequently afflicted with class-imbalance, biasing machine learning model predictions towards major classes. A data-centric solution to this problem is oversampling - where the classes are balanced by adding synthetic minority samples via generative methods. However, although tabular generative models are capable of generating synthetic samples under a balanced distribution, their integrity suffers when the number of minority samples is low. To this end, pre-trained generative language models with rich prior knowledge are a fitting candidate for the task at hand. Nevertheless, an oversampling strategy tailored for tabular data that utilizes the extensive capabilities of such language models is yet to emerge. In this paper, we propose a novel oversampling framework for tabular data to channel the abilities of generative language models. By leveraging its conditional sampling capabilities, we synthesize minority samples by progressively masking the important features of the majority class samples and imputing them towards the minority distribution. To reduce the inclusion of imperfectly converted samples, we utilize the power of the language model itself to self-authenticate the labels of the samples generated by itself, sifting out ill-converted samples. 
Extensive experiments on a variety of datasets and imbalance ratios reveal that the proposed method successfully generates reliable minority samples to boost the performance of machine learning classifiers, even under heavy imbalance ratios.", "keywords": "Tabular data;imbalanced learning;language models", "primary_area": "generative models", "supplementary_material": "", "author": "June Yong Yang;Geondo Park;Joowon Kim;Hyeongwon Jang;Eunho Yang", "authorids": "~June_Yong_Yang1;~Geondo_Park1;~Joowon_Kim1;~Hyeongwon_Jang1;~Eunho_Yang1", "gender": ";M;M;;M", "homepage": "http://mli.kaist.ac.kr/people/;;https://github.com/kjwispro;https://github.com/HyeongWon-Jang;https://sites.google.com/site/hleehome2/", "dblp": "277/5624;256/5123;;206/3852;96/2621", "google_scholar": "nkLNWg0AAAAJ;;;MT2tKmQAAAAJ;", "orcid": ";;;;", "linkedin": ";;;hyeongwon-jang-478591292?trk=contact-info;", "or_profile": "~June_Yong_Yang1;~Geondo_Park1;~Joowon_Kim1;~Hyeongwon_Jang1;~Eunho_Yang1", "aff": "Korea Advanced Institute of Science & Technology;Korea Advanced Institute of Science & Technology;Korea Advanced Institute of Science and Technology (KAIST);Seoul National University;Korea Advanced Institute of Science & Technology", "aff_domain": "kaist.ac.kr;kaist.ac.kr;kaist.ac.kr;snu.ac.kr;kaist.ac.kr", "position": "PhD student;PhD student;MS student;Undergrad student;Associate Professor", "bibtex": "@inproceedings{\nyang2024languageinterfaced,\ntitle={Language-Interfaced Tabular Oversampling via Progressive Imputation and Self-Authentication},\nauthor={June Yong Yang and Geondo Park and Joowon Kim and Hyeongwon Jang and Eunho Yang},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=8F6bws5JBy}\n}", "github": "", "project": "", "reviewers": "tYE6;gyRK;puAc", "pdf_size": 4395848, "rating": "6;6;6", "confidence": "3;3;3", "soundness": "2;3;3", "contribution": "2;2;3", "presentation": "3;2;4", "wc_summary": "52;104;78", "wc_strengths": "54;28;71", "wc_weaknesses": "106;134;119", "wc_questions": "21;5;39", "wc_review": "233;271;307", "wc_reply_reviewers": "86;28;25", "wc_reply_authors": "696;1459;1355", "reply_reviewers": "1;1;1", "reply_authors": "2;4;3", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 3.0, 0.0 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 3.0, 0.816496580927726 ], "wc_summary_avg": [ 78.0, 21.228911104120876 ], "wc_strengths_avg": [ 51.0, 17.682382946499793 ], "wc_weaknesses_avg": [ 119.66666666666667, 11.440668201153676 ], "wc_questions_avg": [ 21.666666666666668, 13.888444437333106 ], "wc_review_avg": [ 270.3333333333333, 30.214051182999096 ], "wc_reply_reviewers_avg": [ 46.333333333333336, 28.075295585660754 ], "wc_reply_authors_avg": [ 1170.0, 337.8471054584702 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 3.0, 0.816496580927726 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=16290416663341375138&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=8F6bws5JBy", "pdf": "https://openreview.net/pdf?id=8F6bws5JBy", "email": "kaist.ac.kr;kaist.ac.kr;kaist.ac.kr;snu.ac.kr;kaist.ac.kr", "author_num": 5, "aff_unique_index": "0;0;0;1;0", "aff_unique_norm": "Korea Advanced Institute of Science and Technology;Seoul National University", 
"aff_unique_dep": ";", "aff_unique_url": "https://www.kaist.ac.kr;https://www.snu.ac.kr", "aff_unique_abbr": "KAIST;SNU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "South Korea" }, { "title": "Learning Personalized Causally Invariant Representations for Heterogeneous Federated Clients", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19333", "id": "8FHWkY0SwF", "author_site": "Xueyang Tang, Song Guo, Jie ZHANG, Jingcai Guo", "tldr": "", "abstract": "Personalized federated learning (PFL) has gained great success in tackling the scenarios where target datasets are heterogeneous across the local clients. However, the application of the existing PFL methods to real-world setting is hindered by the common assumption that the test data on each client is in-distribution (IND) with respect to its training data. Due to the bias of training dataset, the modern machine learning model prefers to rely on shortcut which can perform well on the training data but fail to generalize to the unseen test data that is out-of-distribution (OOD). This pervasive phenomenon is called shortcut learning and has attracted plentiful efforts in centralized situations. In PFL, the limited data diversity on federated clients makes mitigating shortcut and meanwhile preserving personalization knowledge rather difficult. In this paper, we analyse this challenging problem by formulating the structural causal models (SCMs) for heterogeneous federated clients. From the proposed SCMs, we derive two significant causal signatures which inspire a provable shortcut discovery and removal method under federated learning, namely FedSDR. Specifically, FedSDR is divided into two steps: 1) utilizing the available training data distributed among local clients to discover all the shortcut features in a collaborative manner. 2) developing the optimal personalized causally invariant predictor for each client by eliminating the discovered shortcut features. We provide theoretical analysis to prove that our method can draw complete shortcut features and produce the optimal personalized invariant predictor that can generalize to unseen OOD data on each client. 
The experimental results on diverse datasets validate the superiority of FedSDR over the state-of-the-art PFL methods on OOD generalization performance.", "keywords": "Personalized Federated Learning;Invariant Learning;Causality;Out-of-distribution Generalization;Shortcut Learning", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Xueyang Tang;Song Guo;Jie ZHANG;Jingcai Guo", "authorids": "~Xueyang_Tang1;~Song_Guo5;~Jie_ZHANG18;~Jingcai_Guo1", "gender": "M;M;F;M", "homepage": ";https://cse.hkust.edu.hk/~songguo/;https://cugzj.github.io/zhangjie.github.io/;https://jingcaiguo.github.io/", "dblp": ";01/267-1;84/6889-76;192/7270", "google_scholar": "wAGIpRAAAAAJ;https://scholar.google.com/citations?hl=en;JRCNlI8AAAAJ;YjSHPjcAAAAJ", "orcid": "0000-0003-4284-9806;;0000-0002-8073-2118;0000-0002-0449-4525", "linkedin": ";;;jingcai-guo", "or_profile": "~Xueyang_Tang1;~Song_Guo5;~Jie_ZHANG18;~Jingcai_Guo1", "aff": "The Hong Kong Polytechnic University;Department of Computer Science and Engineering, Hong Kong University of Science and Technology;The Hong Kong Polytechnic University;The Hong Kong Polytechnic University", "aff_domain": "polyu.edu.hk;cse.ust.hk;polyu.edu.hk;polyu.edu.hk", "position": "PhD student;Full Professor;Postdoc;Assistant Professor", "bibtex": "@inproceedings{\ntang2024learning,\ntitle={Learning Personalized Causally Invariant Representations for Heterogeneous Federated Clients},\nauthor={Xueyang Tang and Song Guo and Jie ZHANG and Jingcai Guo},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=8FHWkY0SwF}\n}", "github": "", "project": "", "reviewers": "Qvuh;2uxd;zjFS", "pdf_size": 2607041, "rating": "3;6;6", "confidence": "4;3;4", "soundness": "2;3;3", "contribution": "2;3;3", "presentation": "2;3;3", "wc_summary": "39;72;59", "wc_strengths": "33;27;36", "wc_weaknesses": "349;117;47", "wc_questions": "3;66;69", "wc_review": "424;282;211", "wc_reply_reviewers": "0;18;39", "wc_reply_authors": "1091;1171;523", "reply_reviewers": "0;1;1", "reply_authors": "3;3;2", "rating_avg": [ 5.0, 1.4142135623730951 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 56.666666666666664, 13.572848714334887 ], "wc_strengths_avg": [ 32.0, 3.7416573867739413 ], "wc_weaknesses_avg": [ 171.0, 129.0684572878543 ], "wc_questions_avg": [ 46.0, 30.430248109405877 ], "wc_review_avg": [ 305.6666666666667, 88.55255815364994 ], "wc_reply_reviewers_avg": [ 19.0, 15.937377450509228 ], "wc_reply_authors_avg": [ 928.3333333333334, 288.46875432570204 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 2.6666666666666665, 0.4714045207910317 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.5, "gs_citation": 14, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12102156348141143717&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 2, "openreview": "https://openreview.net/forum?id=8FHWkY0SwF", "pdf": "https://openreview.net/pdf?id=8FHWkY0SwF", "email": "polyu.edu.hk;cse.ust.hk;polyu.edu.hk;polyu.edu.hk", "author_num": 4, "aff_unique_index": "0;1;0;0", "aff_unique_norm": "Hong Kong Polytechnic University;Hong Kong University of Science and Technology", "aff_unique_dep": 
";Department of Computer Science and Engineering", "aff_unique_url": "https://www.polyu.edu.hk;https://www.ust.hk", "aff_unique_abbr": "PolyU;HKUST", "aff_campus_unique_index": "0;0;0;0", "aff_campus_unique": "Hong Kong SAR", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "China" }, { "id": "8FP6eJsVCv", "title": "Explanation Shift: How Did the Distribution Shift Impact the Model?", "track": "main", "status": "Reject", "tldr": "", "abstract": "The performance of machine learning models on new data is critical for their success in real-world applications. However, the model's performance may deteriorate if the new data is sampled from a different distribution than the training data. Current methods to detect shifts in the input or output data distributions have limitations in identifying model behavior changes. In this paper, we define \\emph{explanation shift} as the statistical comparison between how predictions from training data are explained and how predictions on new data are explained. We propose explanation shift as a key indicator to investigate the interaction between distribution shifts and learned models. We introduce an Explanation Shift Detector that operates on the explanation distributions, providing more sensitive and explainable changes in interactions between distribution shifts and learned models. We compare explanation shifts with other methods that are based on distribution shifts, showing that monitoring for explanation shifts results in more sensitive indicators for varying model behavior. We provide theoretical and experimental evidence and demonstrate the effectiveness of our approach on synthetic and real data. Additionally, we release an open-source Python package, \\texttt{skshift}, which implements our method and provides usage tutorials for further reproducibility.", "keywords": "Model Monitoring;Distribution Shift;Explainable AI", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "Carlos Mougan;Klaus Broelemann;David Masip;Gjergji Kasneci;Thanassis Tiropanis;Steffen Staab", "authorids": "~Carlos_Mougan1;~Klaus_Broelemann1;~David_Masip4;~Gjergji_Kasneci2;~Thanassis_Tiropanis1;~Steffen_Staab2", "gender": "M;;M;M;;M", "homepage": "https://cmougan.eu;;http://github.com/david26694/;https://www.gov.sot.tum.de/rds/prof-dr-gjergji-kasneci/;https://www.southampton.ac.uk/people/5x5rrv/professor-thanassis-tiropanis;https://www.ki.uni-stuttgart.de/de/institut/team/Staab-00004/", "dblp": "293/7915;00/7271.html;;69/3216;64/6175;s/SteffenStaab", "google_scholar": "dQ5WrokAAAAJ;;;Zbc8GK4AAAAJ;T0MK3pUAAAAJ;https://scholar.google.com/citations?hl=de", "orcid": ";;;0000-0002-3123-7268;0000-0002-6195-2852;0000-0002-0780-4154", "linkedin": "carlosmougan/;;;;tiropanis/;", "or_profile": "~Carlos_Mougan1;~Klaus_Broelemann1;~David_Masip4;~Gjergji_Kasneci2;~Thanassis_Tiropanis1;~Steffen_Staab2", "aff": "University of Southampton;SCHUFA;;University of Tuebingen;University of Southampton;University of Southampton", "aff_domain": "soton.ac.uk;schufa.de;;uni-tuebingen.de;ecs.soton.ac.uk;soton.ac.uk", "position": "PhD student;Principal Researcher;;Professor;Full Professor;Full Professor", "bibtex": "@misc{\nmougan2024explanation,\ntitle={Explanation Shift: How Did the Distribution Shift Impact the Model?},\nauthor={Carlos Mougan and Klaus Broelemann and David Masip and Gjergji Kasneci and Thanassis Tiropanis and Steffen Staab},\nyear={2024},\nurl={https://openreview.net/forum?id=8FP6eJsVCv}\n}", "github": 
"", "project": "", "reviewers": "QGE3;Kdfx;hRuz;3HUZ", "site": "https://openreview.net/forum?id=8FP6eJsVCv", "pdf_size": 1303631, "rating": "3;5;5;8", "confidence": "4;4;4;3", "soundness": "3;2;3;4", "contribution": "2;2;2;3", "presentation": "2;3;2;4", "wc_summary": "110;236;72;90", "wc_strengths": "40;51;66;99", "wc_weaknesses": "364;173;367;41", "wc_questions": "61;159;254;149", "wc_review": "575;619;759;379", "wc_reply_reviewers": "0;0;137;0", "wc_reply_authors": "770;787;732;320", "reply_reviewers": "0;0;1;0", "reply_authors": "1;1;1;1", "rating_avg": [ 5.25, 1.7853571071357126 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.82915619758885 ], "wc_summary_avg": [ 127.0, 64.35060217278468 ], "wc_strengths_avg": [ 64.0, 22.214859891523062 ], "wc_weaknesses_avg": [ 236.25, 137.42156854002212 ], "wc_questions_avg": [ 155.75, 68.34974396440707 ], "wc_review_avg": [ 583.0, 135.97058505426827 ], "wc_reply_reviewers_avg": [ 34.25, 59.322740159234044 ], "wc_reply_authors_avg": [ 652.25, 192.85535382768091 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.8892972917998875, "gs_citation": 4, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=9342819475098152131&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "aff_unique_index": "0;1;2;0;0", "aff_unique_norm": "University of Southampton;SCHUFA Holding AG;University of Tuebingen", "aff_unique_dep": ";;", "aff_unique_url": "https://www.southampton.ac.uk;https://www.schufa.de;https://www.uni-tuebingen.de/", "aff_unique_abbr": "Southampton;SCHUFA;Uni T\u00fcbingen", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;1;0;0", "aff_country_unique": "United Kingdom;Germany" }, { "id": "8FhwHJGUPZ", "title": "Dual-Balancing for Multi-Task Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "Multi-task learning (MTL), a learning paradigm to learn multiple related tasks simultaneously, has achieved great success in various fields. However, task balancing problem remains a significant challenge in MTL, with the disparity in loss/gradient scales often leading to performance compromises. In this paper, we propose a Dual-Balancing Multi-Task Learning (DB-MTL) method to alleviate the task balancing problem from both loss and gradient perspectives. Specifically, DB-MTL ensures loss-scale balancing by performing a logarithm transformation on each task loss, and guarantees gradient-magnitude balancing via normalizing all task gradients to the same magnitude as the maximum gradient norm. 
Extensive experiments conducted on several benchmark datasets consistently demonstrate the state-of-the-art performance of DB-MTL.", "keywords": "multi-task learning", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Baijiong Lin;Weisen Jiang;Feiyang Ye;Yu Zhang;Pengguang Chen;Ying-Cong Chen;Shu Liu;James Kwok", "authorids": "~Baijiong_Lin1;~Weisen_Jiang1;~Feiyang_Ye4;~Yu_Zhang3;~Pengguang_Chen1;~Ying-Cong_Chen1;~Shu_Liu4;~James_Kwok1", "gender": "M;M;M;M;M;M;M;", "homepage": "https://baijiong-lin.github.io/;https://wayson-ust.github.io/;https://feiyang-ye.github.io/;http://cse.sustech.edu.cn/faculty/~zhangy/;https://github.com/akuxcw;https://www.yingcong.me/;https://shuliu1993.github.io/;", "dblp": "279/2950;302/7625;285/4704;50/671-6;189/7442.html;137/6578;57/1180-5;", "google_scholar": "KVdbYTYAAAAJ;https://scholar.google.com/citations?hl=en;3EX25cAAAAAJ;https://scholar.google.com.hk/citations?user=jaRS5w4AAAAJ;https://scholar.google.com.hk/citations?user=lMnVrgIAAAAJ;https://scholar.google.com.hk/citations?user=n7j4bJUAAAAJ;BUEDUFkAAAAJ;", "orcid": "0000-0002-4257-0226;;;;;;;", "linkedin": ";;;;;;;", "or_profile": "~Baijiong_Lin1;~Weisen_Jiang1;~Feiyang_Ye4;~Yu_Zhang3;~Pengguang_Chen1;~Ying-Cong_Chen1;~Shu_Liu4;~James_Kwok1", "aff": "The Hong Kong University of Science and Technology (Guangzhou);Hong Kong University of Science and Technology;University of Technology Sydney;Southern University of Science and Technology;SmartMore;Hong Kong University of Science and Technology;SmartMore Ltd.;", "aff_domain": "connect.hkust-gz.edu.cn;ust.hk;uts.edu.au;sustc.edu.cn;smartmore.com;hkust-gz.edu.cn;smartmore.com;", "position": "PhD student;PhD student;PhD student;Associate Professor;Researcher;Assistant Professor;Principal Researcher;", "bibtex": "@misc{\nlin2024dualbalancing,\ntitle={Dual-Balancing for Multi-Task Learning},\nauthor={Baijiong Lin and Weisen Jiang and Feiyang Ye and Yu Zhang and Pengguang Chen and Ying-Cong Chen and Shu Liu and James Kwok},\nyear={2024},\nurl={https://openreview.net/forum?id=8FhwHJGUPZ}\n}", "github": "", "project": "", "reviewers": "gC4S;H1EY;PmP7;SooC;8dJR", "site": "https://openreview.net/forum?id=8FhwHJGUPZ", "pdf_size": 484187, "rating": "3;5;5;6;8", "confidence": "4;4;4;5;4", "soundness": "2;2;2;3;3", "contribution": "2;2;2;3;3", "presentation": "2;2;2;3;3", "wc_summary": "106;40;164;76;74", "wc_strengths": "54;49;42;46;75", "wc_weaknesses": "87;360;238;5;40", "wc_questions": "49;5;30;134;25", "wc_review": "296;454;474;261;214", "wc_reply_reviewers": "0;0;0;33;12", "wc_reply_authors": "1180;1356;994;300;251", "reply_reviewers": "0;0;0;1;1", "reply_authors": "3;3;3;2;2", "rating_avg": [ 5.4, 1.624807680927192 ], "confidence_avg": [ 4.2, 0.39999999999999997 ], "soundness_avg": [ 2.4, 0.4898979485566356 ], "contribution_avg": [ 2.4, 0.4898979485566356 ], "presentation_avg": [ 2.4, 0.4898979485566356 ], "wc_summary_avg": [ 92.0, 41.626914370392626 ], "wc_strengths_avg": [ 53.2, 11.582745788456206 ], "wc_weaknesses_avg": [ 146.0, 133.31016465371272 ], "wc_questions_avg": [ 48.6, 44.93817975841923 ], "wc_review_avg": [ 339.8, 104.88546133759436 ], "wc_reply_reviewers_avg": [ 9.0, 12.86856635371633 ], "wc_reply_authors_avg": [ 816.2, 456.3465349928714 ], "reply_reviewers_avg": [ 0.4, 0.48989794855663565 ], "reply_authors_avg": [ 2.6, 0.4898979485566356 ], "replies_avg": [ 24, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": 0.1846372364689991, "gs_citation": 15, "gs_cited_by_link": 
"https://scholar.google.com/scholar?cites=16214532746501801863&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "aff_unique_index": "0;0;1;2;3;0;3", "aff_unique_norm": "Hong Kong University of Science and Technology;University of Technology Sydney;Southern University of Science and Technology;SmartMore", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.ust.hk;https://www.uts.edu.au;https://www.sustech.edu.cn;", "aff_unique_abbr": "HKUST;UTS;SUSTech;", "aff_campus_unique_index": "0;1;1", "aff_campus_unique": "Guangzhou;Hong Kong SAR;", "aff_country_unique_index": "0;0;1;0;0;0", "aff_country_unique": "China;Australia;" }, { "id": "8GCcSXlkZN", "title": "Dense Representation Learning for a Joint-Embedding Predictive Architecture", "track": "main", "status": "Reject", "tldr": "", "abstract": "The joint-embedding predictive architecture (JEPA) recently has shown impressive results in extracting visual representations from unlabeled imagery under a masking strategy.\nHowever, we reveal its disadvantage lies in the inadequate grasp of local semantics for dense representations, a shortfall stemming from its \nmasked modeling on the embedding space and the consequent in less discriminative or even missing local semantics.\nTo bridge this gap, we introduce Dense-JEPA, a novel masked modeling objective rooted in JEPA, tailored for enhanced dense representation learning.\nOur key idea is simple: we consider a set of semantically similar neighboring patches as a target of a masked patch.\nTo be specific, the proposed Dense-JEPA (a) computes feature similarities between each masked patch and its corresponding neighboring patches to select patches having semantically meaningful relations, and (b) employs lightweight cross-attention heads to aggregate features of neighboring patches as the masked targets.\nConsequently, Dense-JEPA learns better dense representations, which can be beneficial to a wide range of downstream tasks.\nThrough extensive experiments, we demonstrate our effectiveness across various visual benchmarks, including ImageNet-1K image classification, ADE20K semantic segmentation, and COCO object detection tasks.", "keywords": "Self-supervised Learning;Joint-Embedding Predictive Architecture;Masked Image Modeling", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Shentong Mo;Sukmin Yun", "authorids": "~Shentong_Mo1;~Sukmin_Yun1", "gender": ";", "homepage": ";https://sites.google.com/view/sukmin-yun", "dblp": ";234/9078", "google_scholar": ";fQcZ_hQAAAAJ", "orcid": ";", "linkedin": ";sukmin-yun-975b67129/", "or_profile": "~Shentong_Mo1;~Sukmin_Yun1", "aff": ";Mohamed bin Zayed University of Artificial Intelligence", "aff_domain": ";mbzuai.ac.ae", "position": ";Postdoc", "bibtex": "@misc{\nmo2024dense,\ntitle={Dense Representation Learning for a Joint-Embedding Predictive Architecture},\nauthor={Shentong Mo and Sukmin Yun},\nyear={2024},\nurl={https://openreview.net/forum?id=8GCcSXlkZN}\n}", "github": "", "project": "", "reviewers": "wqKm;NVsT;KGbU;RoAg", "site": "https://openreview.net/forum?id=8GCcSXlkZN", "pdf_size": 40485812, "rating": "5;5;6;8", "confidence": "4;5;5;4", "soundness": "2;3;3;3", "contribution": "2;2;3;3", "presentation": "3;2;2;3", "wc_summary": "49;28;55;173", "wc_strengths": "61;9;34;61", "wc_weaknesses": "419;88;151;144", "wc_questions": "79;14;98;2", "wc_review": "608;139;338;380", "wc_reply_reviewers": "82;0;0;65", "wc_reply_authors": "1267;520;432;356", 
"reply_reviewers": "1;0;0;1", "reply_authors": "4;2;2;2", "rating_avg": [ 6.0, 1.224744871391589 ], "confidence_avg": [ 4.5, 0.5 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 76.25, 56.751101310899685 ], "wc_strengths_avg": [ 41.25, 21.637640814099857 ], "wc_weaknesses_avg": [ 200.5, 128.4922176631721 ], "wc_questions_avg": [ 48.25, 41.026668156212736 ], "wc_review_avg": [ 366.25, 166.637893349622 ], "wc_reply_reviewers_avg": [ 36.75, 37.238253181372514 ], "wc_reply_authors_avg": [ 643.75, 364.4834529851801 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 2.5, 0.8660254037844386 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.40824829046386296, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:wwgTT6p-FuIJ:scholar.google.com/&scioq=Dense+Representation+Learning+for+a+Joint-Embedding+Predictive+Architecture&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0", "aff_unique_norm": "Mohamed bin Zayed University of Artificial Intelligence", "aff_unique_dep": "", "aff_unique_url": "https://mbzuai.ac.ae", "aff_unique_abbr": "MBZUAI", "aff_country_unique_index": "0", "aff_country_unique": "United Arab Emirates" }, { "id": "8GmPLkO0oR", "title": "NeRFuser: Diffusion Guided Multi-Task 3D Policy Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "This paper presents NeRFuser, a language-conditioned multi-task policy framework that integrates neural rendering pre-training and diffusion training to enforce multi-modality learning in action sequence spaces. To learn a generalizable multi-task policy with few demonstrations, the pre-training phase of NeRFuser leverages neural rendering to distill 2D semantic features from foundation models such as Stable Diffusion to a 3D space, which provides a comprehensive semantic understanding regarding the scene. Consequently, it allows various applications to challenging robotic tasks requiring rich 3D semantics and accurate geometry. Furthermore, we introduce a novel approach utilizing diffusion training to learn a vision and language feature that encapsulates the inherent multi-modality in the multi-task demonstrations. By reconstructing the action sequences from different tasks via the diffusion process, the model is capable of distinguishing different modalities and thus improving the robustness and the generalizability of the learned representation. NeRFuser significantly surpasses SOTA NeRF-based multi-task manipulation approaches with over 30\\% improvement in success rate. 
Videos: https://nerfuser.github.io/.", "keywords": "Robotic Manipulation;Neural Radiance Field;Pre-Training;Diffusion", "primary_area": "applications to robotics, autonomy, planning", "supplementary_material": "/attachment/cfdcf956dff0183739f7a1634e3e9d52d7f4eec9.zip", "author": "Ge Yan;Yueh-Hua Wu;Xiaolong Wang", "authorids": "~Ge_Yan3;~Yueh-Hua_Wu1;~Xiaolong_Wang3", "gender": "Not Specified;;M", "homepage": "https://geyan21.github.io/;;https://xiaolonw.github.io/", "dblp": "169/8155-6;;91/952-4", "google_scholar": "ma7qW2kAAAAJ;;Y8O9N_0AAAAJ", "orcid": ";;", "linkedin": "ge-yan/;;", "or_profile": "~Ge_Yan3;~Yueh-Hua_Wu1;~Xiaolong_Wang3", "aff": "University of California, San Diego;;University of California, San Diego", "aff_domain": "ucsd.edu;;ucsd.edu", "position": "MS student;;Assistant Professor", "bibtex": "@misc{\nyan2024nerfuser,\ntitle={Ne{RF}user: Diffusion Guided Multi-Task 3D Policy Learning},\nauthor={Ge Yan and Yueh-Hua Wu and Xiaolong Wang},\nyear={2024},\nurl={https://openreview.net/forum?id=8GmPLkO0oR}\n}", "github": "", "project": "", "reviewers": "ui5H;bCxa;3vtu;Pcik", "site": "https://openreview.net/forum?id=8GmPLkO0oR", "pdf_size": 20086596, "rating": "3;5;6;8", "confidence": "4;3;4;4", "soundness": "3;3;3;4", "contribution": "2;2;3;3", "presentation": "2;3;2;4", "wc_summary": "127;72;69;142", "wc_strengths": "54;19;73;94", "wc_weaknesses": "191;102;162;276", "wc_questions": "91;95;57;152", "wc_review": "463;288;361;664", "wc_reply_reviewers": "465;0;262;50", "wc_reply_authors": "1948;1354;606;1279", "reply_reviewers": "1;0;2;1", "reply_authors": "6;5;5;3", "rating_avg": [ 5.5, 1.8027756377319946 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.75, 0.82915619758885 ], "wc_summary_avg": [ 102.5, 32.45381333526154 ], "wc_strengths_avg": [ 60.0, 27.577164466275352 ], "wc_weaknesses_avg": [ 182.75, 62.67924297564545 ], "wc_questions_avg": [ 98.75, 34.10553474144629 ], "wc_review_avg": [ 444.0, 141.40898132721273 ], "wc_reply_reviewers_avg": [ 194.25, 184.6867280017706 ], "wc_reply_authors_avg": [ 1296.75, 475.6192673767538 ], "reply_reviewers_avg": [ 1.0, 0.7071067811865476 ], "reply_authors_avg": [ 4.75, 1.0897247358851685 ], "replies_avg": [ 30, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.16012815380508713, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:39_eYI8LQSAJ:scholar.google.com/&scioq=NeRFuser:+Diffusion+Guided+Multi-Task+3D+Policy+Learning&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "University of California, San Diego", "aff_unique_dep": "", "aff_unique_url": "https://www.ucsd.edu", "aff_unique_abbr": "UCSD", "aff_campus_unique_index": "0;0", "aff_campus_unique": "San Diego", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "title": "Learning with a Mole: Transferable latent spatial representations for navigation without reconstruction", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19332", "id": "8HCARN2hhw", "author_site": "Guillaume Bono, Leonid Antsfeld, Assem Sadek, Gianluca Monaci, Christian Wolf", "tldr": "", "abstract": "Agents navigating in 3D environments require some form of memory, which should hold a compact and actionable representation of the history of observations useful for decision taking and planning. 
In most end-to-end learning approaches the representation is latent and usually does not have a clearly defined interpretation, whereas classical robotics addresses this with scene reconstruction resulting in some form of map, usually estimated with geometry and sensor models and/or learning. In this work we propose to learn an actionable representation of the scene independently of the targeted downstream task and without explicitly optimizing reconstruction. The learned representation is optimized by a blind auxiliary agent trained to navigate with it on multiple short sub episodes branching out from a waypoint and, most importantly, without any direct visual observation. We argue and show that the blindness property is important and forces the (trained) latent representation to be the only means for planning. With probing experiments we show that the learned representation optimizes navigability and not reconstruction. On downstream tasks we show that it is robust to changes in distribution, in particular the sim2real gap, which we evaluate with a real physical robot in a real office building, significantly improving performance.", "keywords": "Navigation;Embodied AI;Perception", "primary_area": "applications to robotics, autonomy, planning", "supplementary_material": "/attachment/f84a134b21d0b098ddf46d3a14fdee05504d4afc.zip", "author": "Guillaume Bono;Leonid Antsfeld;Assem Sadek;Gianluca Monaci;Christian Wolf", "authorids": "~Guillaume_Bono1;~Leonid_Antsfeld1;~Assem_Sadek1;~Gianluca_Monaci1;~Christian_Wolf5", "gender": "M;M;M;;M", "homepage": ";;https://www.assemsadek.com;;https://chriswolfvision.github.io/www/", "dblp": "225/4959;;;23/903;38/2606-1.html", "google_scholar": "MkNg3H0AAAAJ;;JC9TIAwAAAAJ;https://scholar.google.co.uk/citations?user=t7MzKqIAAAAJ;idYS1AIAAAAJ", "orcid": "0000-0003-3001-2857;;;;", "linkedin": ";leonid-antsfeld-8bb3615;assemsadek/;gmonaci;christian-wolf-522761249/", "or_profile": "~Guillaume_Bono1;~Leonid_Antsfeld1;~Assem_Sadek1;~Gianluca_Monaci1;~Christian_Wolf5", "aff": "Naver Labs Europe;Naver Labs Europe;;Naver Labs Europe;Naver Labs Europe", "aff_domain": "naverlabs.com;naverlabs.com;;naverlabs.com;naverlabs.com", "position": "Researcher;Researcher;;Researcher;Principal Researcher", "bibtex": "@inproceedings{\nbono2024learning,\ntitle={Learning with a Mole: Transferable latent spatial representations for navigation without reconstruction},\nauthor={Guillaume Bono and Leonid Antsfeld and Assem Sadek and Gianluca Monaci and Christian Wolf},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=8HCARN2hhw}\n}", "github": "", "project": "", "reviewers": "SbcL;sYMN;hBzC", "pdf_size": 1779340, "rating": "6;6;8", "confidence": "4;3;4", "soundness": "3;3;3", "contribution": "2;2;3", "presentation": "3;3;3", "wc_summary": "167;238;80", "wc_strengths": "112;43;161", "wc_weaknesses": "529;187;169", "wc_questions": "85;81;36", "wc_review": "893;549;446", "wc_reply_reviewers": "61;13;12", "wc_reply_authors": "802;714;748", "reply_reviewers": "1;1;1", "reply_authors": "1;2;1", "rating_avg": [ 6.666666666666667, 0.9428090415820634 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 161.66666666666666, 64.61338010728807 ], "wc_strengths_avg": [ 105.33333333333333, 48.40339749324306 ], "wc_weaknesses_avg": [ 295.0, 165.62608490210712 ], 
"wc_questions_avg": [ 67.33333333333333, 22.216110270602176 ], "wc_review_avg": [ 629.3333333333334, 191.12357840471233 ], "wc_reply_reviewers_avg": [ 28.666666666666668, 22.866763848189994 ], "wc_reply_authors_avg": [ 754.6666666666666, 36.23380864453651 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 1.3333333333333333, 0.4714045207910317 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.49999999999999983, "gs_citation": 5, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10585416350282073239&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=8HCARN2hhw", "pdf": "https://openreview.net/pdf?id=8HCARN2hhw", "email": "naverlabs.com;naverlabs.com;;naverlabs.com;naverlabs.com", "author_num": 5, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "NAVER LABS", "aff_unique_dep": "", "aff_unique_url": "https://labs.naver.com", "aff_unique_abbr": "NLE", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "Unknown" }, { "id": "8HG2QrtXXB", "title": "HelmSim: Learning Helmholtz Dynamics for Interpretable Fluid Simulation", "track": "main", "status": "Reject", "tldr": "", "abstract": "Fluid simulation is a long-standing challenge due to the intrinsic high-dimensional non-linear dynamics. Previous methods usually utilize the non-linear modeling capability of deep models to directly estimate velocity fields for future prediction. However, skipping over inherent physical properties but directly learning superficial velocity fields will overwhelm the model from generating precise or physics reliable results. In this paper, we propose the HelmSim toward an accurate and interpretable simulator for fluid. Inspired by Helmholtz theorem, we design a HelmDynamic block to learn the Helmholtz dynamics, which decomposes fluid dynamics into more solvable curl-free and divergence-free parts, physically corresponding to potential and stream functions of fluid. By embedding the HelmDynamic block into a Multiscale Intergation Network, HelmSim can integrate learned Helmholtz dynamics along temporal dimension in multiple spatial scales to yield future fluid. Comparing with previous velocity estimating methods, HelmSim is faithfully derived from Helmholtz theorem and ravels out complex fluid dynamics with physically interpretable evidence. 
Experimentally, our proposed HelmSim achieves the consistent state-of-the-art in both numerical simulated and real-world observed benchmarks, even for scenarios with complex boundaries.", "keywords": "Interpretable fluid simulation;Helmholtz decomposition", "primary_area": "neurosymbolic & hybrid AI systems (physics-informed, logic & formal reasoning, etc.)", "supplementary_material": "/attachment/e0cb9b76d4ec4e489adfb3588548f9b766677853.zip", "author": "Lanxiang Xing;Haixu Wu;Yuezhou Ma;Jianmin Wang;Mingsheng Long", "authorids": "~Lanxiang_Xing2;~Haixu_Wu1;~Yuezhou_Ma1;~Jianmin_Wang1;~Mingsheng_Long5", "gender": "M;M;M;M;M", "homepage": "https://github.com/BluesCrossing;;https://github.com/mayz20;https://www.thss.tsinghua.edu.cn/en/faculty/jianminwang.htm;http://ise.thss.tsinghua.edu.cn/~mlong", "dblp": ";286/8115;359/0553;06/3456-1.html;74/9023", "google_scholar": ";oLL_x0wAAAAJ;;https://scholar.google.com.tw/citations?user=MiovcboAAAAJ;_MjXpXkAAAAJ", "orcid": "0000-0001-5928-3242;;;0000-0001-6841-7943;0000-0002-5412-9120", "linkedin": ";;;;", "or_profile": "~Lanxiang_Xing2;~Haixu_Wu1;~Yuezhou_Ma1;~Jianmin_Wang1;~Mingsheng_Long2", "aff": "Tsinghua University;Tsinghua University;Tsinghua University;Tsinghua University;Tsinghua University", "aff_domain": "tsinghua.edu.cn;tsinghua.edu.cn;tsinghua.edu.cn;tsinghua.edu.cn;tsinghua.edu.cn", "position": "MS student;PhD student;Undergrad student;Full Professor;Associate Professor", "bibtex": "@misc{\nxing2024helmsim,\ntitle={HelmSim: Learning Helmholtz Dynamics for Interpretable Fluid Simulation},\nauthor={Lanxiang Xing and Haixu Wu and Yuezhou Ma and Jianmin Wang and Mingsheng Long},\nyear={2024},\nurl={https://openreview.net/forum?id=8HG2QrtXXB}\n}", "github": "", "project": "", "reviewers": "rfHe;2nz9;Mqos;eKS7", "site": "https://openreview.net/forum?id=8HG2QrtXXB", "pdf_size": 23713244, "rating": "3;5;6;6", "confidence": "4;3;3;5", "soundness": "2;2;2;3", "contribution": "1;2;2;2", "presentation": "2;3;2;2", "wc_summary": "80;46;67;52", "wc_strengths": "46;49;76;81", "wc_weaknesses": "379;244;377;17", "wc_questions": "375;141;75;199", "wc_review": "880;480;595;349", "wc_reply_reviewers": "0;309;39;7", "wc_reply_authors": "1206;901;1367;1122", "reply_reviewers": "0;1;1;1", "reply_authors": "5;3;4;4", "rating_avg": [ 5.0, 1.224744871391589 ], "confidence_avg": [ 3.75, 0.82915619758885 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 61.25, 13.254716141811564 ], "wc_strengths_avg": [ 63.0, 15.636495771111889 ], "wc_weaknesses_avg": [ 254.25, 147.49809320801404 ], "wc_questions_avg": [ 197.5, 111.4753335944773 ], "wc_review_avg": [ 576.0, 195.90941784406385 ], "wc_reply_reviewers_avg": [ 88.75, 128.0085446366765 ], "wc_reply_authors_avg": [ 1149.0, 168.08182531136436 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 4.0, 0.7071067811865476 ], "replies_avg": [ 27, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:HdqK5jlVER8J:scholar.google.com/&scioq=HelmSim:+Learning+Helmholtz+Dynamics+for+Interpretable+Fluid+Simulation&hl=en&as_sdt=0,14", "gs_version_total": 2, "aff_unique_index": "0;0;0;0;0", "aff_unique_norm": "Tsinghua University", "aff_unique_dep": "", "aff_unique_url": "https://www.tsinghua.edu.cn", "aff_unique_abbr": "THU", "aff_campus_unique_index": "", "aff_campus_unique": "", 
"aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "China" }, { "title": "CoBIT: A Contrastive Bi-directional Image-Text Generation Model", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19331", "id": "8ISRqgtjPc", "author_site": "Haoxuan You, Xiaoyue Guo, Zhecan Wang, Kai-Wei Chang, Jason Baldridge, Jiahui Yu", "tldr": "", "abstract": "The field of Vision-and-Language (VL) has witnessed a proliferation of pretrained foundation models. Current techniques typically employ only one type of training objective, whether it's (1) contrastive objectives (like CLIP), (2) image-to-text generative objectives (like PaLI), or (3) text-to-image generative objectives (like Parti). However, all these three objectives are mutually relevant and are all based on image-text pairs. Intuitively, the first two objectives can be considered as complementary projections between two modalities, and contrastive learning can preserve global alignment and generations facilitate fine-grained understanding. Inspired by this, we present a Contrastive Bi-directional Image-Text generation model (CoBIT) to first time unify the three pre-training objectives in one framework. Specifically, CoBIT employs a novel unicoder-decoder structure consisting of an image unicoder, a text unicoder, and a cross-modal decoder. The image/text unicoders can switch between encoding and decoding in different tasks, enabling flexibility and shared knowledge that benefits both image-to-text and text-to-image generations. CoBIT achieves superior performance in image understanding, image-text understanding (Retrieval, Captioning, VQA, SNLI-VE), and text-based content creation, particularly in zero-shot scenarios.", "keywords": "Contrastive Pre-training;Vision-Language;Text-to-Image Generation;Auto-regressive Model.", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Haoxuan You;Mandy Guo;Zhecan Wang;Kai-Wei Chang;Jason Michael Baldridge;Jiahui Yu", "authorids": "~Haoxuan_You1;~Mandy_Guo2;~Zhecan_Wang2;~Kai-Wei_Chang1;~Jason_Michael_Baldridge1;~Jiahui_Yu1", "gender": "M;M;M;M;M;F", "homepage": "https://hxyou.github.io/;https://www.zhecanwang.com/;http://kwchang.net;https://research.google/people/jasonbaldridge/?&type=google;http://jiahuiyu.com/;", "dblp": "210/2628;167/4251;18/2428;90/6617;185/1060;", "google_scholar": "BhysChMAAAAJ;uqHPnmgAAAAJ;fqDBtzYAAAAJ;TP_JZm8AAAAJ;-CLCMk4AAAAJ;qOiCKewAAAAJ", "orcid": ";0009-0003-7785-4637;0000-0001-5365-0072;;;", "linkedin": ";jameszhecanwang/;kai-wei-chang-41239040;jason-baldridge-9b26295/;jiahuiyuu/;", "or_profile": "~Haoxuan_You1;~Zhecan_Wang2;~Kai-Wei_Chang1;~Jason_Michael_Baldridge1;~Jiahui_Yu1;~Xiaoyue_Guo1", "aff": "Columbia University;Columbia University;Amazon;Google;Google Brain;", "aff_domain": "columbia.edu;columbia.edu;amazon.com;google.com;google.com;", "position": "PhD student;PhD student;Researcher;Research Scientist;Research Scientist;", "bibtex": "@inproceedings{\nyou2024cobit,\ntitle={Co{BIT}: A Contrastive Bi-directional Image-Text Generation Model},\nauthor={Haoxuan You and Mandy Guo and Zhecan Wang and Kai-Wei Chang and Jason Michael Baldridge and Jiahui Yu},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=8ISRqgtjPc}\n}", "github": "", "project": "", "reviewers": "GAkS;vaSs;PXu6;wSdD;Ui8A", "pdf_size": 3360100, "rating": "5;6;6;8;8", "confidence": "4;4;5;5;4", 
"soundness": "3;3;2;4;4", "contribution": "2;3;3;2;3", "presentation": "3;3;3;4;2", "wc_summary": "70;140;47;68;123", "wc_strengths": "18;111;72;66;148", "wc_weaknesses": "192;150;476;107;198", "wc_questions": "51;82;19;20;1", "wc_review": "331;483;614;261;470", "wc_reply_reviewers": "0;0;15;0;248", "wc_reply_authors": "1132;683;845;571;874", "reply_reviewers": "0;0;1;0;1", "reply_authors": "3;2;3;2;2", "rating_avg": [ 6.6, 1.2 ], "confidence_avg": [ 4.4, 0.48989794855663565 ], "soundness_avg": [ 3.2, 0.7483314773547882 ], "contribution_avg": [ 2.6, 0.4898979485566356 ], "presentation_avg": [ 3.0, 0.6324555320336759 ], "wc_summary_avg": [ 89.6, 35.556152772762125 ], "wc_strengths_avg": [ 83.0, 43.91810560577494 ], "wc_weaknesses_avg": [ 224.6, 129.89780598609045 ], "wc_questions_avg": [ 34.6, 28.639832401744254 ], "wc_review_avg": [ 431.8, 123.7827128479579 ], "wc_reply_reviewers_avg": [ 52.6, 97.87257021249621 ], "wc_reply_authors_avg": [ 821.0, 190.60430215501432 ], "reply_reviewers_avg": [ 0.4, 0.48989794855663565 ], "reply_authors_avg": [ 2.4, 0.4898979485566356 ], "replies_avg": [ 22, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.2721655269759087, "gs_citation": 22, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14505239298930891113&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=8ISRqgtjPc", "pdf": "https://openreview.net/pdf?id=8ISRqgtjPc", "email": "columbia.edu;columbia.edu;amazon.com;google.com;google.com;", "author_num": 6, "aff_unique_index": "0;0;1;2;2", "aff_unique_norm": "Columbia University;Amazon;Google", "aff_unique_dep": ";Amazon.com, Inc.;Google", "aff_unique_url": "https://www.columbia.edu;https://www.amazon.com;https://www.google.com", "aff_unique_abbr": "Columbia;Amazon;Google", "aff_campus_unique_index": "1;1", "aff_campus_unique": ";Mountain View", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "8Itp6Axs9Z", "title": "SelfDreamer: Dual-Prototypical Regularization for Frame-masked Model-based Reinforcement Learning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "In the realm of reinforcement learning (RL), the conventional approach involves\ntraining agents in unknown environments using extensive experiences comprising\nhigh-dimensional state representations (typically images), actions, and rewards.\nHowever, this standard setup imposes substantial data transmission overhead in\nscenarios where edge devices are employed for data collection, and cloud servers\nare utilized for model training. This paper introduces a novel paradigm termed\n\u201dframe-masked RL,\u201d which is devised to enhance data efficiency while examining the impact on existing methods. Concurrently, we introduce a model-based\nalgorithm, \u201dSelfDreamer,\u201d tailored to mitigate the information loss incurred due\nto frame masking. SelfDreamer leverages action-transition dual prototypes to embed action information within the world model and align the hidden states in the\nrepresentation space. 
Empirical evaluations reveal that SelfDreamer consistently\noutperforms state-of-the-art methods across six continuous control tasks sourced\nfrom the DeepMind Control Suite, demonstrating superior or comparable performance while utilizing only half of the observations from the environment.", "keywords": "reinforcement learning;prototypical learning;deep learning", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/d3a5594c17942719049a62ab3dcc99bd2be9bbb2.zip", "author": "Wei Ding;Ming-Syan Chen", "authorids": "~Wei_Ding6;~Ming-Syan_Chen2", "gender": "M;M", "homepage": ";https://arbor.ee.ntu.edu.tw/~mschen", "dblp": ";c/MingSyanChen", "google_scholar": "https://scholar.google.com.tw/citations?user=DS7DBXgAAAAJ;KTmCrFkAAAAJ", "orcid": ";0000-0002-0711-8197", "linkedin": "wei-ding-7b0829260/;", "or_profile": "~Wei_Ding6;~Ming-Syan_Chen2", "aff": "National Taiwan University;National Taiwan University", "aff_domain": "ntu.edu.tw;ntu.edu", "position": "PhD student;Full Professor", "bibtex": "@misc{\nding2024selfdreamer,\ntitle={SelfDreamer: Dual-Prototypical Regularization for Frame-masked Model-based Reinforcement Learning},\nauthor={Wei Ding and Ming-Syan Chen},\nyear={2024},\nurl={https://openreview.net/forum?id=8Itp6Axs9Z}\n}", "github": "", "project": "", "reviewers": "Ngz6;GHX9;Euds;CGK5", "site": "https://openreview.net/forum?id=8Itp6Axs9Z", "pdf_size": 411206, "rating": "3;3;5;5", "confidence": "5;4;4;5", "soundness": "2;2;2;3", "contribution": "2;2;2;2", "presentation": "2;1;3;3", "wc_summary": "105;143;47;70", "wc_strengths": "46;78;48;110", "wc_weaknesses": "196;518;465;271", "wc_questions": "258;347;78;95", "wc_review": "605;1086;638;546", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 4.5, 0.5 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.25, 0.82915619758885 ], "wc_summary_avg": [ 91.25, 36.32062086473743 ], "wc_strengths_avg": [ 70.5, 26.091186251299497 ], "wc_weaknesses_avg": [ 362.5, 133.02349416550447 ], "wc_questions_avg": [ 194.5, 112.65100976023251 ], "wc_review_avg": [ 718.75, 214.57792873452757 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:DgXQSSOGPG8J:scholar.google.com/&scioq=SelfDreamer:+Dual-Prototypical+Regularization+for+Frame-masked+Model-based+Reinforcement+Learning&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "National Taiwan University", "aff_unique_dep": "", "aff_unique_url": "https://www.ntu.edu.tw", "aff_unique_abbr": "NTU", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Taiwan", "aff_country_unique_index": "0;0", "aff_country_unique": "China" }, { "id": "8JCn0kmS8W", "title": "WavJourney: Compositional Audio Creation with Large Language Models", "track": "main", "status": "Reject", "tldr": "", "abstract": "Despite breakthroughs in audio generation models, their capabilities are often confined to domain-specific conditions such as speech transcriptions and audio captions. 
However, real-world audio creation aims to generate harmonious audio containing various elements such as speech, music, and sound effects with controllable conditions, which is challenging to address using existing audio generation systems. We present WavJourney, a novel framework that leverages Large Language Models (LLMs) to connect various audio models for audio creation. WavJourney allows users to create storytelling audio content with diverse audio elements simply from textual descriptions. Specifically, given a text instruction, WavJourney first prompts LLMs to generate an audio script that serves as a structured semantic representation of audio elements. The audio script is then converted into a computer program, where each line of the program calls a task-specific audio generation model or computational operation function. The computer program is then executed to obtain a compositional and interpretable solution for audio creation. Experimental results suggest that WavJourney is capable of synthesizing realistic audio aligned with textually-described semantic, spatial and temporal conditions, achieving state-of-the-art results on text-to-audio generation benchmarks. Additionally, we introduce a new multi-genre story benchmark. Subjective evaluations demonstrate the potential of WavJourney in crafting engaging storytelling audio content from text. We further demonstrate that WavJourney can facilitate human-machine co-creation in multi-round dialogues. To foster future research, the code and synthesized audio are available at: https://anonymous.4open.science/w/WavJourney_Anonymous/.", "keywords": "Audio Generation;Audio Synthesis;Large Language Models (LLMs);AIGC;Computational Creativity", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Xubo Liu;Zhongkai Zhu;Haohe Liu;Yi Yuan;Meng Cui;Qiushi Huang;Jinhua Liang;Yin Cao;Qiuqiang Kong;Mark D Plumbley;Wenwu Wang", "authorids": "~Xubo_Liu1;~Zhongkai_Zhu1;~Haohe_Liu2;~Yi_Yuan2;~Meng_Cui1;~Qiushi_Huang1;~Jinhua_Liang1;~Yin_Cao1;~Qiuqiang_Kong1;~Mark_D_Plumbley1;~Wenwu_Wang1", "gender": "M;M;M;M;M;M;M;M;M;;M", "homepage": "https://liuxubo717.github.io/;;https://haoheliu.github.io/;https://www.surrey.ac.uk/people/yi-yuan;https://www.surrey.ac.uk/people/meng-cui;;https://jinhualiang.github.io/;;https://qiuqiangkong.github.io/;https://www.surrey.ac.uk/people/mark-plumbley;http://personal.ee.surrey.ac.uk/Personal/W.Wang/", "dblp": "235/1970/;;272/5570;;35/4727;204/2933;;;;84/1168;https://dblp.org/pers/hd/w/Wang:Wenwu", "google_scholar": "-OlNYSgAAAAJ;CcqM9L4AAAAJ;g3O4lJMAAAAJ;;https://scholar.google.com/citations?view_op=list_works;F_yGB9sAAAAJ;mDVXe7sAAAAJ;J9edRm4AAAAJ;;28TCymYAAAAJ;https://scholar.google.co.uk/citations?user=JQFnV5IAAAAJ", "orcid": ";;0000-0003-1036-7888;;;;0000-0002-4570-0735;;;0000-0002-9708-1075;", "linkedin": ";;haohe-liu-4483a71a4/;;;;jinhua-l1ang/;;;;https://uk.linkedin.com/in/wenwu", "or_profile": "~Xubo_Liu1;~Zhongkai_Zhu1;~Haohe_Liu2;~Yi_Yuan2;~Meng_Cui1;~Qiushi_Huang1;~Jinhua_Liang1;~Yin_Cao1;~Qiuqiang_Kong1;~Mark_D_Plumbley1;~Wenwu_Wang1", "aff": "University of Surrey;;Meta Facebook;University of Surrey;University of Surrey;University of Surrey;Queen Mary University of London;;;University of Surrey;University of Surrey", "aff_domain": "surrey.ac.uk;;meta.com;surrey.ac.uk;surrey.ac.uk;surrey.ac.uk;qmul.ac.uk;;;surrey.ac.uk;surrey.ac.uk", "position": "PhD student;;Intern;PhD student;PhD student;PhD student;PhD student;;;Full Professor;Full Professor", 
"bibtex": "@misc{\nliu2024wavjourney,\ntitle={WavJourney: Compositional Audio Creation with Large Language Models},\nauthor={Xubo Liu and Zhongkai Zhu and Haohe Liu and Yi Yuan and Meng Cui and Qiushi Huang and Jinhua Liang and Yin Cao and Qiuqiang Kong and Mark D Plumbley and Wenwu Wang},\nyear={2024},\nurl={https://openreview.net/forum?id=8JCn0kmS8W}\n}", "github": "", "project": "", "reviewers": "xGho;HBpU;koFK;jF76;iM1V", "site": "https://openreview.net/forum?id=8JCn0kmS8W", "pdf_size": 13661954, "rating": "3;5;5;6;6", "confidence": "3;3;4;3;3", "soundness": "2;2;3;2;2", "contribution": "2;2;2;2;3", "presentation": "3;3;3;3;2", "wc_summary": "86;225;83;163;226", "wc_strengths": "4;107;33;61;76", "wc_weaknesses": "185;337;149;125;157", "wc_questions": "100;29;30;2;114", "wc_review": "375;698;295;351;573", "wc_reply_reviewers": "0;0;0;0;0", "wc_reply_authors": "679;718;514;538;436", "reply_reviewers": "0;0;0;0;0", "reply_authors": "1;1;1;1;1", "rating_avg": [ 5.0, 1.0954451150103321 ], "confidence_avg": [ 3.2, 0.39999999999999997 ], "soundness_avg": [ 2.2, 0.39999999999999997 ], "contribution_avg": [ 2.2, 0.39999999999999997 ], "presentation_avg": [ 2.8, 0.39999999999999997 ], "wc_summary_avg": [ 156.6, 63.14617961523879 ], "wc_strengths_avg": [ 56.2, 35.38022046285184 ], "wc_weaknesses_avg": [ 190.6, 75.66663729808535 ], "wc_questions_avg": [ 55.0, 43.85430423573039 ], "wc_review_avg": [ 458.4, 152.13888391860905 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 577.0, 105.50450227359968 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 11, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 19, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=3696469140543305659&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 6, "aff_unique_index": "0;1;0;0;0;2;0;0", "aff_unique_norm": "University of Surrey;Meta;Queen Mary University of London", "aff_unique_dep": ";Meta Platforms, Inc.;", "aff_unique_url": "https://www.surrey.ac.uk;https://meta.com;https://www.qmul.ac.uk", "aff_unique_abbr": "Surrey;Meta;QMUL", "aff_campus_unique_index": "1", "aff_campus_unique": ";London", "aff_country_unique_index": "0;1;0;0;0;0;0;0", "aff_country_unique": "United Kingdom;United States" }, { "id": "8JKZZxJAZ3", "title": "Nonnegative Matrix Factorization through Canonical Edges", "track": "main", "status": "Reject", "tldr": "", "abstract": "In this paper we present a novel approach to nonnegative matrix factorization (NMF) by introducing the concept of nonnegative canonical edges (NCEs). These NCEs are intersections of the principal subspace containing the data to be factored with canonical faces of the nonnegative orthant. Through this lens, our approach yields a closed-form solution to the special NMF case where (at least one of) the factors are required to be orthogonal. In the general NMF case, NCEs provide a deterministic optimal solution whenever the data resides within or in proximity to the cone formed by the NCEs. Furthermore, NCEs provide an improved initialization for classical NMF methods in general. 
Despite these advancements, numerous fundamental questions regarding NCEs in the context of NMF remain unexplored, offering exciting avenues for future research.", "keywords": "nonnegative matrix factorization;orthogonal", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/741f884deb358c33aa8f1fdfa8cd4d5edf39c9c8.zip", "author": "Daniel L. Pimentel-Alarc\u00f3n", "authorids": "~Daniel_L._Pimentel-Alarc\u00f3n1", "gender": "", "homepage": "https://danielpimentel.github.io/", "dblp": "150/6256", "google_scholar": "", "orcid": "", "linkedin": "", "or_profile": "~Daniel_L._Pimentel-Alarc\u00f3n1", "aff": "University of Wisconsin, Madison", "aff_domain": "wisc.edu", "position": "Assistant Professor", "bibtex": "@misc{\npimentel-alarc{\\'o}n2024nonnegative,\ntitle={Nonnegative Matrix Factorization through Canonical Edges},\nauthor={Daniel L. Pimentel-Alarc{\\'o}n},\nyear={2024},\nurl={https://openreview.net/forum?id=8JKZZxJAZ3}\n}", "github": "", "project": "", "reviewers": "qZPt;bRYi;VKXr", "site": "https://openreview.net/forum?id=8JKZZxJAZ3", "pdf_size": 3373057, "rating": "3;5;5", "confidence": "4;3;3", "soundness": "2;2;2", "contribution": "1;2;2", "presentation": "1;2;1", "wc_summary": "78;106;33", "wc_strengths": "13;51;15", "wc_weaknesses": "331;121;127", "wc_questions": "3;26;54", "wc_review": "425;304;229", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 4.333333333333333, 0.9428090415820634 ], "confidence_avg": [ 3.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 1.6666666666666667, 0.4714045207910317 ], "presentation_avg": [ 1.3333333333333333, 0.4714045207910317 ], "wc_summary_avg": [ 72.33333333333333, 30.070288030250428 ], "wc_strengths_avg": [ 26.333333333333332, 17.46106780494506 ], "wc_weaknesses_avg": [ 193.0, 97.61147473529944 ], "wc_questions_avg": [ 27.666666666666668, 20.8539897594894 ], "wc_review_avg": [ 319.3333333333333, 80.74789298936675 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 1, 0 ], "corr_rating_confidence": -0.9999999999999998, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:BR1mSqziwU8J:scholar.google.com/&scioq=Nonnegative+Matrix+Factorization+through+Canonical+Edges&hl=en&as_sdt=0,44", "gs_version_total": 0, "aff_unique_index": "0", "aff_unique_norm": "University of Wisconsin", "aff_unique_dep": "", "aff_unique_url": "https://www.wisc.edu", "aff_unique_abbr": "UW", "aff_campus_unique_index": "0", "aff_campus_unique": "Madison", "aff_country_unique_index": "0", "aff_country_unique": "United States" }, { "title": "lpNTK: Better Generalisation with Less Data via Sample Interaction During Learning", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19330", "id": "8Ju0VmvMCW", "author_site": "Shangmin Guo, YI REN, Stefano Albrecht, Kenny Smith", "tldr": "", "abstract": "Although much research has been done on proposing new models or loss functions to improve the generalisation of artificial neural networks (ANNs), less attention has been directed to the impact of the training data on generalisation. In this work, we start from approximating the interaction between samples, i.e. 
how learning one sample would modify the model's prediction on other samples. Through analysing the terms involved in weight updates in supervised learning, we find that labels influence the interaction between samples. Therefore, we propose the labelled pseudo Neural Tangent Kernel (lpNTK) which takes label information into consideration when measuring the interactions between samples. We first prove that lpNTK asymptotically converges to the empirical neural tangent kernel in terms of the Frobenius norm under certain assumptions. Secondly, we illustrate how lpNTK helps to understand learning phenomena identified in previous work, specifically the learning difficulty of samples and forgetting events during learning. Moreover, we also show that using lpNTK to identify and remove poisoning training samples does not hurt the generalisation performance of ANNs.", "keywords": "generalisation;data selection;neural tangent kernel;sample interaction;learning dynamics", "primary_area": "learning theory", "supplementary_material": "", "author": "Shangmin Guo;Yi Ren;Stefano V Albrecht;Kenny Smith", "authorids": "~Shangmin_Guo1;~Yi_Ren6;~Stefano_V_Albrecht1;~Kenny_Smith1", "gender": "M;M;;M", "homepage": ";https://joshua-ren.github.io/;https://agents-lab.org/stefano-albrecht/;http://www.ling.ed.ac.uk/~kenny", "dblp": "183/0949;;118/3975;58/6224", "google_scholar": "cpOrbSoAAAAJ;5QNce38AAAAJ;https://scholar.google.co.uk/citations?user=ceSFqCcAAAAJ;", "orcid": "0000-0003-1716-0994;;0000-0002-8735-1465;0000-0002-4530-6914", "linkedin": ";;;", "or_profile": "~Shangmin_Guo1;~Yi_Ren6;~Stefano_V_Albrecht1;~Kenny_Smith1", "aff": "University of Edinburgh;University of British Columbia;University of Edinburgh;University of Edinburgh", "aff_domain": "ed.ac.uk;ubc.ca;ed.ac.uk;ed.ac.uk", "position": "PhD student;PhD student;Associate Professor;Professor", "bibtex": "@inproceedings{\nguo2024lpntk,\ntitle={lp{NTK}: Better Generalisation with Less Data via Sample Interaction During Learning},\nauthor={Shangmin Guo and Yi Ren and Stefano V Albrecht and Kenny Smith},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=8Ju0VmvMCW}\n}", "github": "", "project": "", "reviewers": "4TQg;3vgc;9biR", "pdf_size": 3163503, "rating": "6;6;8", "confidence": "4;2;3", "soundness": "2;3;3", "contribution": "2;3;3", "presentation": "2;2;3", "wc_summary": "73;93;106", "wc_strengths": "58;139;80", "wc_weaknesses": "254;172;202", "wc_questions": "4;55;87", "wc_review": "389;459;475", "wc_reply_reviewers": "31;0;55", "wc_reply_authors": "938;907;957", "reply_reviewers": "1;0;1", "reply_authors": "3;2;2", "rating_avg": [ 6.666666666666667, 0.9428090415820634 ], "confidence_avg": [ 3.0, 0.816496580927726 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 90.66666666666667, 13.572848714334887 ], "wc_strengths_avg": [ 92.33333333333333, 34.198765409814946 ], "wc_weaknesses_avg": [ 209.33333333333334, 33.875589375766666 ], "wc_questions_avg": [ 48.666666666666664, 34.179265969622904 ], "wc_review_avg": [ 441.0, 37.345236197762446 ], "wc_reply_reviewers_avg": [ 28.666666666666668, 22.51419305435771 ], "wc_reply_authors_avg": [ 934.0, 20.607442021431645 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 2.3333333333333335, 0.4714045207910317 ], "replies_avg": [ 20, 0 
], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11154955795369655285&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 2, "openreview": "https://openreview.net/forum?id=8Ju0VmvMCW", "pdf": "https://openreview.net/pdf?id=8Ju0VmvMCW", "email": "ed.ac.uk;ubc.ca;ed.ac.uk;ed.ac.uk", "author_num": 4, "aff_unique_index": "0;1;0;0", "aff_unique_norm": "University of Edinburgh;University of British Columbia", "aff_unique_dep": ";", "aff_unique_url": "https://www.ed.ac.uk;https://www.ubc.ca", "aff_unique_abbr": "Edinburgh;UBC", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;0;0", "aff_country_unique": "United Kingdom;Canada" }, { "id": "8LBS1nixTJ", "title": "HashOrder: Accelerating Graph Processing Through Hashing-based Reordering", "track": "main", "status": "Reject", "tldr": "", "abstract": "Graph processing systems are a fundamental tool across various domains such as machine learning, and their efficiency has become increasingly crucial due to the rapid growth in data volume. A major bottleneck in graph processing systems is poor cache utilization. Graph reordering techniques can mitigate this bottleneck and significantly speed up graph workloads by improving the data locality of the graph memory layout. However, since existing approaches use greedy algorithms or simple heuristics to find good orderings, they suffer from either high computational overhead or suboptimal ordering quality. To this end, we propose HashOrder, a probabilistic algorithm for graph reordering based on randomized hashing. We theoretically show that hashing-based orderings have quality guarantees under reasonable assumptions. HashOrder produces high-quality orderings while being lightweight and parallelizable. We empirically show that HashOrder beats the efficiency-quality tradeoff curve of existing algorithms. 
Evaluations on various graph processing workloads and GNN data loaders reveal that HashOrder is competitive with or outperforms the existing best method while being 592$\\times$ more efficient in reordering, speeding up PageRank by up to 2.49$\\times$ and GNN data loaders by up to 2.33$\\times$.", "keywords": "graph processing;graph reordering;efficiency;hashing", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Tianyi Zhang;Aditya Desai;Gaurav Gupta;Anshumali Shrivastava", "authorids": "~Tianyi_Zhang6;~Aditya_Desai1;~Gaurav_Gupta6;~Anshumali_Shrivastava1", "gender": "M;M;M;M", "homepage": "https://github.com/tonyzhang617;https://gaurav16gupta.github.io/;https://www.cs.rice.edu/~as143/;https://apd10.github.io/", "dblp": "17/322-11.html;;63/9828;18/8339", "google_scholar": "ekRl428AAAAJ;;https://scholar.google.com.tw/citations?user=SGT23RAAAAAJ;ymdbDZwAAAAJ", "orcid": ";;;0009-0002-9111-9391", "linkedin": ";;;aditya-desai-ai/", "or_profile": "~Tianyi_Zhang6;~Gaurav_Gupta6;~Anshumali_Shrivastava1;~Adity_Desai1", "aff": "Rice University;;ThirdAI Corp.;Rice University", "aff_domain": "rice.edu;;thirdai.com;rice.edu", "position": "PhD student;;CEO;PhD student", "bibtex": "@misc{\nzhang2024hashorder,\ntitle={HashOrder: Accelerating Graph Processing Through Hashing-based Reordering},\nauthor={Tianyi Zhang and Aditya Desai and Gaurav Gupta and Anshumali Shrivastava},\nyear={2024},\nurl={https://openreview.net/forum?id=8LBS1nixTJ}\n}", "github": "", "project": "", "reviewers": "EBBV;KkKE;3s87;L3q7;M1A7;n1d2", "site": "https://openreview.net/forum?id=8LBS1nixTJ", "pdf_size": 2025142, "rating": "3;5;5;6;6;8", "confidence": "4;3;4;3;3;4", "soundness": "2;3;2;3;2;3", "contribution": "1;2;3;3;2;3", "presentation": "3;3;3;3;2;3", "wc_summary": "133;50;58;75;40;80", "wc_strengths": "65;90;77;26;28;62", "wc_weaknesses": "147;58;352;103;188;46", "wc_questions": "79;20;13;29;18;41", "wc_review": "424;218;500;233;274;229", "wc_reply_reviewers": "297;198;0;0;65;29", "wc_reply_authors": "505;437;538;476;1055;381", "reply_reviewers": "1;2;0;0;1;1", "reply_authors": "2;3;1;1;2;2", "rating_avg": [ 5.5, 1.5 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.3333333333333335, 0.7453559924999298 ], "presentation_avg": [ 2.8333333333333335, 0.3726779962499649 ], "wc_summary_avg": [ 72.66666666666667, 30.263656237951302 ], "wc_strengths_avg": [ 58.0, 23.713568549109883 ], "wc_weaknesses_avg": [ 149.0, 103.06955580254207 ], "wc_questions_avg": [ 33.333333333333336, 22.320892057044276 ], "wc_review_avg": [ 313.0, 109.00458705944443 ], "wc_reply_reviewers_avg": [ 98.16666666666667, 111.54881841099389 ], "wc_reply_authors_avg": [ 565.3333333333334, 224.5697120173501 ], "reply_reviewers_avg": [ 0.8333333333333334, 0.6871842709362768 ], "reply_authors_avg": [ 1.8333333333333333, 0.6871842709362768 ], "replies_avg": [ 25, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.11111111111111109, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6449314624127255120&as_sdt=40005&sciodt=0,10&hl=en", "gs_version_total": 0, "aff_unique_index": "0;1;0", "aff_unique_norm": "Rice University;ThirdAI Corp.", "aff_unique_dep": ";", "aff_unique_url": "https://www.rice.edu;", "aff_unique_abbr": "Rice;", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "title": "Fast-ELECTRA for Efficient Pre-training", "status": 
"Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19329", "id": "8OBuqbLb8h", "author_site": "Chengyu Dong, Liyuan Liu, Hao Cheng, Jingbo Shang, Jianfeng Gao, Xiaodong Liu", "tldr": "", "abstract": "ELECTRA pre-trains language models by detecting tokens in a sequence that have been replaced by an auxiliary model. Although ELECTRA offers a significant boost in efficiency, its potential is constrained by the training cost brought by the auxiliary model. Notably, this model, which is jointly trained with the main model, only serves to assist the training of the main model and is discarded post-training. This results in a substantial amount of training cost being expended in vain. To mitigate this issue, we propose Fast-ELECTRA, which leverages an existing language model as the auxiliary model. To construct a learning curriculum for the main model, we smooth its output distribution via temperature scaling following a descending schedule. Our approach rivals the performance of state-of-the-art ELECTRA-style pre-training methods, while significantly eliminating the computation and memory cost brought by the joint training of the auxiliary model. Our method also reduces the sensitivity to hyper-parameters and enhances the pre-training stability.", "keywords": "Language model Pre-training;ELECTRA;Efficiency", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Chengyu Dong;Liyuan Liu;Hao Cheng;Jingbo Shang;Jianfeng Gao;Xiaodong Liu", "authorids": "~Chengyu_Dong1;~Liyuan_Liu3;~Hao_Cheng4;~Jingbo_Shang2;~Jianfeng_Gao1;~Xiaodong_Liu1", "gender": ";M;M;M;;M", "homepage": "https://www.chengyu-dong.me/;https://sites.google.com/site/hcheng2site/Home;https://shangjingbo1226.github.io/;https://www.microsoft.com/en-us/research/people/jfgao/;;https://liyuanlucasliu.github.io/", "dblp": "14/3155;09/5158-2;151/3145.html;92/5339;65/622;06/1624", "google_scholar": "Ppfi7j0AAAAJ;https://scholar.google.com/citations?hl=en;0SkFI4MAAAAJ;https://scholar.google.com/citations?hl=en;NIewcxMAAAAJ;RmvbkzYAAAAJ", "orcid": ";0000-0001-7988-3149;;;;", "linkedin": ";;;;;", "or_profile": "~Chengyu_Dong1;~Hao_Cheng4;~Jingbo_Shang2;~Jianfeng_Gao1;~Xiaodong_Liu1;~Liyuan_Liu1", "aff": "University of California, San Diego;Microsoft Research;University of California, San Diego;Microsoft Research;Microsoft Research;University of Illinois, Urbana Champaign", "aff_domain": "ucsd.edu;microsoft.com;ucsd.edu;microsoft.com;microsoft.com;illinois.edu", "position": "PhD student;Researcher;Assistant Professor;Principal Researcher;Researcher;PhD student", "bibtex": "@inproceedings{\ndong2024fastelectra,\ntitle={Fast-{ELECTRA} for Efficient Pre-training},\nauthor={Chengyu Dong and Liyuan Liu and Hao Cheng and Jingbo Shang and Jianfeng Gao and Xiaodong Liu},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=8OBuqbLb8h}\n}", "github": "", "project": "", "reviewers": "QMNg;rs11;dT26", "pdf_size": 418386, "rating": "6;6;6", "confidence": "3;4;4", "soundness": "2;3;3", "contribution": "2;3;3", "presentation": "2;4;3", "wc_summary": "30;47;209", "wc_strengths": "16;12;85", "wc_weaknesses": "46;19;235", "wc_questions": "2;2;76", "wc_review": "94;80;605", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "322;125;1156", "reply_reviewers": "0;0;0", "reply_authors": "1;1;2", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], 
"soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 3.0, 0.816496580927726 ], "wc_summary_avg": [ 95.33333333333333, 80.67355342503652 ], "wc_strengths_avg": [ 37.666666666666664, 33.50953429829918 ], "wc_weaknesses_avg": [ 100.0, 96.0937042682818 ], "wc_questions_avg": [ 26.666666666666668, 34.883934538536344 ], "wc_review_avg": [ 259.6666666666667, 244.2544210904323 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 534.3333333333334, 446.88129171950004 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.3333333333333333, 0.4714045207910317 ], "replies_avg": [ 9, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6732446403804894749&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=8OBuqbLb8h", "pdf": "https://openreview.net/pdf?id=8OBuqbLb8h", "email": "ucsd.edu;microsoft.com;ucsd.edu;microsoft.com;microsoft.com;illinois.edu", "author_num": 6, "aff_unique_index": "0;1;0;1;1;2", "aff_unique_norm": "University of California, San Diego;Microsoft;University of Illinois Urbana-Champaign", "aff_unique_dep": ";Microsoft Research;", "aff_unique_url": "https://www.ucsd.edu;https://www.microsoft.com/en-us/research;https://illinois.edu", "aff_unique_abbr": "UCSD;MSR;UIUC", "aff_campus_unique_index": "0;0;2", "aff_campus_unique": "San Diego;;Urbana-Champaign", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "United States" }, { "title": "MgNO: Efficient Parameterization of Linear Operators via Multigrid", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19328", "id": "8OxL034uEr", "author_site": "Juncai He, Xinliang Liu, Jinchao Xu", "tldr": "", "abstract": "In this work, we propose a concise neural operator architecture for operator learning. Drawing an analogy with a conventional fully connected neural network, we define the neural operator as follows: the output of the $i$-th neuron in a nonlinear operator layer is defined by $\\mathcal O_i(u) = \\sigma\\left( \\sum_j \\mathcal W_{ij} u + \\mathcal B_{ij}\\right)$. Here, $\\mathcal W_{ij}$ denotes the bounded linear operator connecting $j$-th input neuron to $i$-th output neuron, and the bias $\\mathcal B_{ij}$ takes the form of a function rather than a scalar. Given its new universal approximation property, the efficient parameterization of the bounded linear operators between two neurons (Banach spaces) plays a critical role. As a result, we introduce MgNO, utilizing multigrid structures to parameterize these linear operators between neurons. This approach offers both mathematical rigor and practical expressivity. Additionally, MgNO obviates the need for conventional lifting and projecting operators typically required in previous neural operators. Moreover, it seamlessly accommodates diverse boundary conditions. Our empirical observations reveal that MgNO exhibits superior ease of training compared to CNN-based models, while also displaying a reduced susceptibility to overfitting when contrasted with spectral-type neural operators. 
We demonstrate the efficiency and accuracy of our method with consistently state-of-the-art performance on different types of partial differential equations (PDEs).", "keywords": "neural operator; multigrid; universal approximation; boundary condition", "primary_area": "applications to physical sciences (physics, chemistry, biology, etc.)", "supplementary_material": "/attachment/a7015fd3efce1ca846b507d9c03a7562ff5a1fce.zip", "author": "Juncai He;Xinliang Liu;Jinchao Xu", "authorids": "~Juncai_He1;~Xinliang_Liu1;~Jinchao_Xu1", "gender": "M;M;M", "homepage": "https://juncaihe.github.io;https://cemse.kaust.edu.sa/scml/people/person/xinliang-liu;https://www.personal.psu.edu/jxx1/", "dblp": "223/4286;67/10364;", "google_scholar": "CG5GBW0AAAAJ;9AsSTc4AAAAJ;pBHiYxcAAAAJ", "orcid": ";;", "linkedin": ";;", "or_profile": "~Juncai_He1;~Xinliang_Liu1;~Jinchao_Xu1", "aff": "King Abdullah University of Science and Technology;King Abdullah University of Science and Technology;Pennsylvania State University", "aff_domain": "kaust.edu.sa;kaust.edu.sa;psu.edu", "position": "Researcher;Postdoc;Full Professor", "bibtex": "@inproceedings{\nhe2024mgno,\ntitle={Mg{NO}: Efficient Parameterization of Linear Operators via Multigrid},\nauthor={Juncai He and Xinliang Liu and Jinchao Xu},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=8OxL034uEr}\n}", "github": "", "project": "", "reviewers": "4o6c;RPM7;H6UK;5jaY", "pdf_size": 3022526, "rating": "6;6;6;8", "confidence": "3;2;2;4", "soundness": "3;3;3;4", "contribution": "3;3;3;3", "presentation": "3;3;3;3", "wc_summary": "75;52;120;73", "wc_strengths": "24;57;92;91", "wc_weaknesses": "14;91;12;100", "wc_questions": "57;56;38;36", "wc_review": "170;256;262;300", "wc_reply_reviewers": "0;12;0;0", "wc_reply_authors": "321;1095;650;954", "reply_reviewers": "0;1;0;0", "reply_authors": "1;2;1;2", "rating_avg": [ 6.5, 0.8660254037844386 ], "confidence_avg": [ 2.75, 0.82915619758885 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 80.0, 24.78911051248108 ], "wc_strengths_avg": [ 66.0, 28.044607324760317 ], "wc_weaknesses_avg": [ 54.25, 41.37858745776612 ], "wc_questions_avg": [ 46.75, 9.781998773256925 ], "wc_review_avg": [ 247.0, 47.54997371187496 ], "wc_reply_reviewers_avg": [ 3.0, 5.196152422706632 ], "wc_reply_authors_avg": [ 755.0, 297.73394163245814 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.8703882797784891, "gs_citation": 22, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=4854488223594303538&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 9, "openreview": "https://openreview.net/forum?id=8OxL034uEr", "pdf": "https://openreview.net/pdf?id=8OxL034uEr", "email": "kaust.edu.sa;kaust.edu.sa;psu.edu", "author_num": 3, "aff_unique_index": "0;0;1", "aff_unique_norm": "King Abdullah University of Science and Technology;Pennsylvania State University", "aff_unique_dep": ";", "aff_unique_url": "https://www.kast.kau.edu.sa;https://www.psu.edu", "aff_unique_abbr": "KAUST;PSU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;1", "aff_country_unique": "Saudi Arabia;United States" }, { "title": "R&B: Region and Boundary Aware Zero-shot Grounded Text-to-image Generation", "status": "Poster", "track": "main", "site": 
"https://iclr.cc/virtual/2024/poster/19327", "id": "8Q4uVOJ5bX", "author_site": "Jiayu Xiao, Henglei Lv, Liang Li, Shuhui Wang, Qingming Huang", "tldr": "", "abstract": "Recent text-to-image (T2I) diffusion models have achieved remarkable progress in generating high-quality images given text-prompts as input. However, these models fail to convey appropriate spatial composition specified by a layout instruction. In this work, we probe into zero-shot grounded T2I generation with diffusion models, that is, generating images corresponding to the input layout information without training auxiliary modules or finetuning diffusion models. We propose a **R**egion and **B**oundary (R&B) aware cross-attention guidance approach that gradually modulates the attention maps of diffusion model during generative process, and assists the model to synthesize images (1) with high fidelity, (2) highly compatible with textual input, and (3) interpreting layout instructions accurately. Specifically, we leverage the discrete sampling to bridge the gap between consecutive attention maps and discrete layout constraints, and design a region-aware loss to refine the generative layout during diffusion process. We further propose a boundary-aware loss to strengthen object discriminability within the corresponding regions. Experimental results show that our method outperforms existing state-of-the-art zero-shot grounded T2I generation methods by a large margin both qualitatively and quantitatively on several benchmarks. \nProject page: https://sagileo.github.io/Region-and-Boundary.", "keywords": "Stable Diffusion;training-free;grounded text-to-image generation;controllable generation", "primary_area": "generative models", "supplementary_material": "/attachment/c8db5295ecda49880047fa64f1d9cfd900352249.zip", "author": "Jiayu Xiao;Henglei Lv;Liang Li;Shuhui Wang;Qingming Huang", "authorids": "~Jiayu_Xiao1;~Henglei_Lv1;~Liang_Li3;~Shuhui_Wang1;~Qingming_Huang1", "gender": "M;M;M;M;", "homepage": ";https://github.com/sagileo;http://www.ict.cas.cn/sourcedb_2018_ict_cas/cn/jssrck/201711/t20171114_4894220.html;https://vipl.ict.ac.cn/people/shwang/;https://qmhuang-ucas.github.io/", "dblp": ";;14/1395-3.html;37/2537;68/4388", "google_scholar": "8P4k11gAAAAJ;;Q-4mZnQAAAAJ;h-JxBSYAAAAJ;https://scholar.google.com.hk/citations?user=J1vMnRgAAAAJ", "orcid": ";;;0000-0002-5931-0527;", "linkedin": ";;;;", "or_profile": "~Jiayu_Xiao1;~Henglei_Lv1;~Liang_Li3;~Shuhui_Wang1;~Qingming_Huang2", "aff": "Institute of Computing Technology, University of Chinese Academy of Sciences;Institute of Computing Technology, Chinese Academy of Sciences;Institute of Computing Technology, Chinese Academy of Sciences;Institute of Computing Technology, Chinese Academy of Sciences;University of Chinese Academy of Sciences", "aff_domain": "ict.ac.cn;ict.ac.cn;ict.ac.cn;ict.ac.cn;ucas.ac.cn", "position": "PhD student;MS student;Full Professor;Full Professor;Full Professor", "bibtex": "@inproceedings{\nxiao2024rb,\ntitle={R\\&B: Region and Boundary Aware Zero-shot Grounded Text-to-image Generation},\nauthor={Jiayu Xiao and Henglei Lv and Liang Li and Shuhui Wang and Qingming Huang},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=8Q4uVOJ5bX}\n}", "github": "", "project": "", "reviewers": "F2Yp;cFE6;KFuf;Nptk", "pdf_size": 16579484, "rating": "6;6;6;6", "confidence": "3;4;4;4", "soundness": "3;3;3;3", "contribution": "3;3;2;3", "presentation": "3;3;2;3", "wc_summary": 
"116;78;78;113", "wc_strengths": "19;84;71;142", "wc_weaknesses": "110;214;280;109", "wc_questions": "67;64;21;124", "wc_review": "312;440;450;488", "wc_reply_reviewers": "57;0;101;30", "wc_reply_authors": "449;1113;1392;1379", "reply_reviewers": "1;0;1;1", "reply_authors": "2;2;3;3", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 96.25, 18.280795934531955 ], "wc_strengths_avg": [ 79.0, 43.754999714318366 ], "wc_weaknesses_avg": [ 178.25, 72.60294415517872 ], "wc_questions_avg": [ 69.0, 36.5991803186902 ], "wc_review_avg": [ 422.5, 66.26273462512697 ], "wc_reply_reviewers_avg": [ 47.0, 37.12815643147395 ], "wc_reply_authors_avg": [ 1083.25, 382.73775290660836 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 2.5, 0.5 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 24, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6353490822039373341&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=8Q4uVOJ5bX", "pdf": "https://openreview.net/pdf?id=8Q4uVOJ5bX", "email": "ict.ac.cn;ict.ac.cn;ict.ac.cn;ict.ac.cn;ucas.ac.cn", "author_num": 5, "aff_unique_index": "0;1;1;1;0", "aff_unique_norm": "University of Chinese Academy of Sciences;Chinese Academy of Sciences", "aff_unique_dep": "Institute of Computing Technology;Institute of Computing Technology", "aff_unique_url": "http://www.ict.ac.cn;http://www.ict.ac.cn", "aff_unique_abbr": "UCAS;CAS", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "China" }, { "id": "8Q6UmFhhQS", "title": "Neural Network Diffusion", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Diffusion models have achieved remarkable success in image and video generation. In this work, we demonstrate that diffusion models can also generate high-performing neural network parameters. Our approach is simple, utilizing an autoencoder and a standard latent diffusion model. The autoencoder extracts the latent representation of trained model parameters. A diffusion model is then trained to synthesize these latent parameter representations from random noise. It then generates new representations that are passed through the autoencoder\u2019s decoder, whose outputs are ready to use as new sets of network parameters. Across various tasks and datasets, our diffusion process consistently generates models of comparable or improved performance over SGD-trained models, with minimal additional cost. 
Our results encourage more exploration on the versatile use of diffusion models.", "keywords": "Parameter Generation;Diffusion Model", "primary_area": "generative models", "supplementary_material": "/attachment/3f160407ba5c0438d03f45552e75133ba90740b8.zip", "author": "Kai Wang;xu Zhao Pan;Zhuang Liu;Zelin Zang;Trevor Darrell;Yang You", "authorids": "~Kai_Wang8;~xu_Zhao_Pan1;~Zhuang_Liu1;~Zelin_Zang2;~Trevor_Darrell2;~Yang_You1", "gender": "M;M;M;M;M;M", "homepage": "https://kaiwang960112.github.io/;;;https://www.comp.nus.edu.sg/~youy/;https://people.eecs.berkeley.edu/~trevor/;https://liuzhuang13.github.io/", "dblp": "78/2022-36;278/2033.html;226/7615;33/8167-1.html;d/TrevorDarrell;56/11346-3", "google_scholar": "i2II0XIAAAAJ;;foERjnQAAAAJ;jF4dPZwAAAAJ;https://scholar.google.com.tw/citations?user=bh-uRFMAAAAJ;7OTD-LEAAAAJ", "orcid": "0000-0002-1154-5175;;;;;", "linkedin": ";;;yang-you-0b92914b/;;zhuang-liu-19306b1b1/", "or_profile": "~Kai_Wang8;~xu_Zhao_Pan1;~Zelin_Zang2;~Yang_You1;~trevor_darrell1;~Zhuang_Liu2", "aff": "National University of Singapore;Harbin Institute of Technology;National University of Singapore;National University of Singapore;Electrical Engineering & Computer Science Department;FAIR, Meta", "aff_domain": "u.nus.edu;hit.edu.cn;nus.edu.sg;nus.edu.sg;eecs.berkeley.edu;meta.com", "position": "PhD student;PhD student;Intern;Professor;Professor;Research Scientist", "bibtex": "@misc{\nwang2024neural,\ntitle={Neural Network Diffusion},\nauthor={Kai Wang and xu Zhao Pan and Zhuang Liu and Zelin Zang and Trevor Darrell and Yang You},\nyear={2024},\nurl={https://openreview.net/forum?id=8Q6UmFhhQS}\n}", "github": "", "project": "", "reviewers": "jEgU;GLkA;aG24", "site": "https://openreview.net/forum?id=8Q6UmFhhQS", "pdf_size": 6427964, "rating": "3;3;6", "confidence": "3;4;3", "soundness": "2;3;3", "contribution": "2;2;3", "presentation": "1;3;3", "wc_summary": "48;111;62", "wc_strengths": "33;60;43", "wc_weaknesses": "55;243;100", "wc_questions": "180;160;5", "wc_review": "316;574;210", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 4.0, 1.4142135623730951 ], "confidence_avg": [ 3.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.3333333333333335, 0.9428090415820634 ], "wc_summary_avg": [ 73.66666666666667, 27.010286106510527 ], "wc_strengths_avg": [ 45.333333333333336, 11.145502331533658 ], "wc_weaknesses_avg": [ 132.66666666666666, 80.15124591809051 ], "wc_questions_avg": [ 115.0, 78.20912137766712 ], "wc_review_avg": [ 366.6666666666667, 152.86013941581442 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 3, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.5, "gs_citation": 69, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10519989663900027339&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 5, "aff_unique_index": "0;1;0;0;2;3", "aff_unique_norm": "National University of Singapore;Harbin Institute of Technology;Electrical Engineering & Computer Science Department;Meta", "aff_unique_dep": ";;Electrical Engineering & Computer Science;Facebook AI Research (FAIR)", "aff_unique_url": "https://www.nus.edu.sg;http://www.hit.edu.cn/;;https://meta.com", "aff_unique_abbr": "NUS;HIT;;Meta", "aff_campus_unique_index": "1", 
"aff_campus_unique": ";Harbin", "aff_country_unique_index": "0;1;0;0;3", "aff_country_unique": "Singapore;China;;United States" }, { "title": "Class Incremental Learning via Likelihood Ratio Based Task Prediction", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19326", "id": "8QfK9Dq4q0", "author_site": "Haowei Lin, Yijia Shao, Weinan Qian, Ningxin Pan, Yiduo Guo, Bing Liu", "tldr": "", "abstract": "Class incremental learning (CIL) is a challenging setting of continual learning, which learns a series of tasks sequentially. Each task consists of a set of unique classes. The key feature of CIL is that no task identifier (or task-id) is provided at test time. Predicting the task-id for each test sample is a challenging problem. An emerging theory-guided approach (called TIL+OOD) is to train a task-specific model for each task in a shared network for all tasks based on a task-incremental learning (TIL) method to deal with catastrophic forgetting. The model for each task is an out-of-distribution (OOD) detector rather than a conventional classifier. The OOD detector can perform both within-task (in-distribution (IND)) class prediction and OOD detection. The OOD detection capability is the key to task-id prediction during inference. However, this paper argues that using a traditional OOD detector for task-id prediction is sub-optimal because additional information (e.g., the replay data and the learned tasks) available in CIL can be exploited to design a better and principled method for task-id prediction. We call the new method TPL (Task-id Prediction based on Likelihood Ratio). TPL markedly outperforms strong CIL baselines and has negligible catastrophic forgetting. The code of TPL is publicly available at https://github.com/linhaowei1/TPL.", "keywords": "Class Incremental Learning;Continual Learning", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "", "author": "Haowei Lin;Yijia Shao;Weinan Qian;Ningxin Pan;Yiduo Guo;Bing Liu", "authorids": "~Haowei_Lin1;~Yijia_Shao1;~Weinan_Qian1;~Ningxin_Pan1;~Yiduo_Guo2;~Bing_Liu1", "gender": "M;F;M;F;M;M", "homepage": "https://linhaowei1.github.io/;https://cs.stanford.edu/~shaoyj/;https://github.com/SouthwestWindQ;https://github.com/pnx2003;https://www.cs.uic.edu/~liub/;https://github.com/gydpku", "dblp": "235/2798;329/4063;;;l/BingLiu1.html;196/5954.html", "google_scholar": "Ng-DmJgAAAAJ;H0zcQh4AAAAJ;;;Kt1bjZoAAAAJ;https://scholar.google.com/citations?hl=zh-CN", "orcid": "0009-0006-9809-4835;;;;;", "linkedin": ";;;;;", "or_profile": "~Haowei_Lin1;~Yijia_Shao1;~Weinan_Qian1;~Ningxin_Pan1;~Bing_Liu1;~Yiduo_GUO1", "aff": "Peking University;Computer Science Department, Stanford University;Peking University;Peking University;University of Illinois at Chicago;Peking University", "aff_domain": "pku.edu.cn;cs.stanford.edu;pku.edu.cn;pku.edu.cn;uic.edu;pku.edu.cn", "position": "PhD student;PhD student;Undergrad student;Undergrad student;Full Professor;PhD student", "bibtex": "@inproceedings{\nlin2024class,\ntitle={Class Incremental Learning via Likelihood Ratio Based Task Prediction},\nauthor={Haowei Lin and Yijia Shao and Weinan Qian and Ningxin Pan and Yiduo Guo and Bing Liu},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=8QfK9Dq4q0}\n}", "github": "", "project": "", "reviewers": "aMSi;SU84;fLUE;h9ds", "pdf_size": 2115954, "rating": "5;5;6;8", "confidence": "4;4;4;3", "soundness": 
"3;3;3;4", "contribution": "2;3;2;3", "presentation": "1;3;3;3", "wc_summary": "67;99;71;185", "wc_strengths": "71;52;58;165", "wc_weaknesses": "359;103;80;40", "wc_questions": "4;6;371;92", "wc_review": "501;260;580;482", "wc_reply_reviewers": "297;0;201;0", "wc_reply_authors": "1802;1052;2042;353", "reply_reviewers": "1;0;1;0", "reply_authors": "3;3;4;1", "rating_avg": [ 6.0, 1.224744871391589 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.5, 0.8660254037844386 ], "wc_summary_avg": [ 105.5, 47.52630850381713 ], "wc_strengths_avg": [ 86.5, 45.83939353874569 ], "wc_weaknesses_avg": [ 145.5, 125.30861901720887 ], "wc_questions_avg": [ 118.25, 150.18717488520784 ], "wc_review_avg": [ 455.75, 118.84101775060662 ], "wc_reply_reviewers_avg": [ 124.5, 129.04359728401872 ], "wc_reply_authors_avg": [ 1312.25, 663.3778617801471 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 2.75, 1.0897247358851685 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.9428090415820632, "gs_citation": 16, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6922209428065594215&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=8QfK9Dq4q0", "pdf": "https://openreview.net/pdf?id=8QfK9Dq4q0", "email": "pku.edu.cn;cs.stanford.edu;pku.edu.cn;pku.edu.cn;uic.edu;pku.edu.cn", "author_num": 6, "aff_unique_index": "0;1;0;0;2;0", "aff_unique_norm": "Peking University;Stanford University;University of Illinois at Chicago", "aff_unique_dep": ";Computer Science Department;", "aff_unique_url": "http://www.pku.edu.cn;https://www.stanford.edu;https://www.uic.edu", "aff_unique_abbr": "Peking U;Stanford;UIC", "aff_campus_unique_index": "1;2", "aff_campus_unique": ";Stanford;Chicago", "aff_country_unique_index": "0;1;0;0;1;0", "aff_country_unique": "China;United States" }, { "id": "8S14xeFQAY", "title": "Segmenting the Unknown: Discrete Diffusion Models for Non-Deterministic Segmentation", "track": "main", "status": "Reject", "tldr": "", "abstract": "Safety critical applications of deep-learning require models able to handle ambiguity and uncertainty.\nWe introduce discrete diffusion models to capture uncertainty in semantic segmentation, with application in both oncology and autonomous driving.\nUnlike prior approaches that tackle these tasks in distinct ways, we formulate both as estimating a complex posterior distribution over images, and present a unified solution that leverages the discrete diffusion framework.\nOur contributions include the adaptation of discrete diffusion for semantic segmentation to model uncertainty and the introduction of an auto-regressive diffusion framework for future forecasting.\nExperimental evaluation on medical imaging data and real-world future prediction tasks demonstrates the superiority of our generative framework over deterministic models and its competitive performance compared to methods specific to these domains separately.", "keywords": "segmentation;diffusion;future-prediction", "primary_area": "generative models", "supplementary_material": "", "author": "Evann COURDIER;Angelos Katharopoulos;Fran\u00e7ois Fleuret", "authorids": "~Evann_COURDIER1;~Angelos_Katharopoulos1;~Fran\u00e7ois_Fleuret2", "gender": "M;;M", "homepage": "https://evannc.notion.site/Evann-Courdier-70ea6da3f1fb43c6add377ffb5ec9e1c?pvs=4;https://angeloskath.github.io;https://fleuret.org/francois/", "dblp": 
";188/1159;90/5265", "google_scholar": "q4Bfz-4AAAAJ;CNSO4uIAAAAJ;https://scholar.google.ch/citations?user=Bj1tRlsAAAAJ", "orcid": ";;0000-0001-9457-7393", "linkedin": "evann-courdier/;;francois-fleuret/", "or_profile": "~Evann_COURDIER1;~Angelos_Katharopoulos1;~Francois_Fleuret1", "aff": "EPFL - EPF Lausanne;Apple;University of Geneva", "aff_domain": "epfl.ch;apple.com;unige.ch", "position": "PhD student;Researcher;Full Professor", "bibtex": "@misc{\ncourdier2024segmenting,\ntitle={Segmenting the Unknown: Discrete Diffusion Models for Non-Deterministic Segmentation},\nauthor={Evann COURDIER and Angelos Katharopoulos and Fran{\\c{c}}ois Fleuret},\nyear={2024},\nurl={https://openreview.net/forum?id=8S14xeFQAY}\n}", "github": "", "project": "", "reviewers": "ofDT;27GV;qH1j", "site": "https://openreview.net/forum?id=8S14xeFQAY", "pdf_size": 13811735, "rating": "3;5;6", "confidence": "5;4;3", "soundness": "2;3;3", "contribution": "2;2;2", "presentation": "2;2;3", "wc_summary": "85;117;38", "wc_strengths": "60;51;62", "wc_weaknesses": "115;209;200", "wc_questions": "140;1;278", "wc_review": "400;378;578", "wc_reply_reviewers": "41;49;182", "wc_reply_authors": "527;466;808", "reply_reviewers": "1;1;1", "reply_authors": "1;1;1", "rating_avg": [ 4.666666666666667, 1.247219128924647 ], "confidence_avg": [ 4.0, 0.816496580927726 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 80.0, 32.44482495971687 ], "wc_strengths_avg": [ 57.666666666666664, 4.784233364802441 ], "wc_weaknesses_avg": [ 174.66666666666666, 42.35039026450117 ], "wc_questions_avg": [ 139.66666666666666, 113.08502209498047 ], "wc_review_avg": [ 452.0, 89.54700813911465 ], "wc_reply_reviewers_avg": [ 90.66666666666667, 64.66494843078092 ], "wc_reply_authors_avg": [ 600.3333333333334, 148.9392120594469 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.9819805060619659, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:txilMNL7L0UJ:scholar.google.com/&scioq=Segmenting+the+Unknown:+Discrete+Diffusion+Models+for+Non-Deterministic+Segmentation&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1;2", "aff_unique_norm": "EPFL;Apple;University of Geneva", "aff_unique_dep": ";Apple Inc.;", "aff_unique_url": "https://www.epfl.ch;https://www.apple.com;https://www.unige.ch", "aff_unique_abbr": "EPFL;Apple;UNIGE", "aff_campus_unique_index": "0", "aff_campus_unique": "Lausanne;", "aff_country_unique_index": "0;1;0", "aff_country_unique": "Switzerland;United States" }, { "id": "8S7eGD15b6", "title": "Subspace Grid-sweep: ML Defense Evaluation via Constrained Brute-force Search", "track": "main", "status": "Reject", "tldr": "", "abstract": "It is becoming increasingly imperative to design robust ML defenses. However, recent work has found that many defenses that initially resist state-of-the-art attacks can be broken by an adaptive adversary. Attacks can initially make defenses look strong by not finding potential adversarial examples due to obfuscated gradients, limited compute, unlucky initialization, etc. In this work, we make steps towards more reliable defense evaluation by introducing a new defense evaluation tool, Subspace Grid-sweep, that leverages deterministic inference to more simply evaluate adversarial robustness. 
We use Subspace Grid-sweep to show that a previously published, but now broken, defense could have been known to be broken without performing a fully adaptive attack. In order to make Subspace Grid-sweep applicable to random defenses, we show how to make deterministic variants of random defenses while retaining similar empirical effectiveness. As a result, we show that randomness may not be necessary for these defense\u2019s robustness.", "keywords": "artificial intelligence;machine learning;robustness;adversarial machine learning", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/b49118d34683604988200ad7d1b37406792df7d3.zip", "author": "Keane Lucas;Matthew Jagielski;Florian Tram\u00e8r;Lujo Bauer;Nicholas Carlini", "authorids": "~Keane_Lucas1;~Matthew_Jagielski1;~Florian_Tram\u00e8r1;~Lujo_Bauer1;~Nicholas_Carlini1", "gender": "M;M;;;", "homepage": "https://keanelucas.com;https://jagielski.github.io/;;;http://nicholas.carlini.com", "dblp": "250/5769;218/5156;;;145/1806", "google_scholar": "vJEa5voAAAAJ;_8rw_GMAAAAJ;;;", "orcid": "0000-0002-4705-3412;;;;", "linkedin": "keane-lucas/;;;;", "or_profile": "~Keane_Lucas1;~Matthew_Jagielski1;~Florian_Tram\u00e8r1;~Lujo_Bauer1;~Nicholas_Carlini1", "aff": "Carnegie Mellon University;Google;;;Google", "aff_domain": "cmu.edu;google.com;;;google.com", "position": "PhD student;Researcher;;;Researcher", "bibtex": "@misc{\nlucas2024subspace,\ntitle={Subspace Grid-sweep: {ML} Defense Evaluation via Constrained Brute-force Search},\nauthor={Keane Lucas and Matthew Jagielski and Florian Tram{\\`e}r and Lujo Bauer and Nicholas Carlini},\nyear={2024},\nurl={https://openreview.net/forum?id=8S7eGD15b6}\n}", "github": "", "project": "", "reviewers": "2Hxt;LfCf;EJoi;YZ44", "site": "https://openreview.net/forum?id=8S7eGD15b6", "pdf_size": 1990390, "rating": "5;5;5;6", "confidence": "3;4;4;3", "soundness": "3;2;2;3", "contribution": "3;3;2;3", "presentation": "3;2;3;3", "wc_summary": "42;47;75;153", "wc_strengths": "56;108;35;48", "wc_weaknesses": "55;218;277;74", "wc_questions": "12;25;32;6", "wc_review": "165;398;419;281", "wc_reply_reviewers": "9;219;45;12", "wc_reply_authors": "450;1971;1165;377", "reply_reviewers": "1;2;2;1", "reply_authors": "1;3;4;1", "rating_avg": [ 5.25, 0.4330127018922193 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 79.25, 44.39805738993543 ], "wc_strengths_avg": [ 61.75, 27.73422975314079 ], "wc_weaknesses_avg": [ 156.0, 94.08772502298055 ], "wc_questions_avg": [ 18.75, 10.280442597476044 ], "wc_review_avg": [ 315.75, 101.68425394327285 ], "wc_reply_reviewers_avg": [ 71.25, 86.46494954604438 ], "wc_reply_authors_avg": [ 990.75, 644.2733794748934 ], "reply_reviewers_avg": [ 1.5, 0.5 ], "reply_authors_avg": [ 2.25, 1.299038105676658 ], "replies_avg": [ 21, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:BLd-hQcysvYJ:scholar.google.com/&scioq=Subspace+Grid-sweep:+ML+Defense+Evaluation+via+Constrained+Brute-force+Search&hl=en&as_sdt=0,44", "gs_version_total": 0, "aff_unique_index": "0;1;1", "aff_unique_norm": "Carnegie Mellon University;Google", "aff_unique_dep": ";Google", "aff_unique_url": "https://www.cmu.edu;https://www.google.com", "aff_unique_abbr": "CMU;Google", "aff_campus_unique_index": "1;1", "aff_campus_unique": 
";Mountain View", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "8SPSIfR2e0", "title": "Dissecting Language Models: Machine Unlearning via Selective Pruning", "track": "main", "status": "Reject", "tldr": "", "abstract": "Understanding and shaping the behaviour of Large Language Models (LLMs) is increasingly important as applications become more powerful and more frequently adopted.\nThis paper introduces a machine unlearning method specifically designed for LLMs. \nWe introduce a selective pruning method for LLMs that removes neurons based on their relative importance on a targeted capability compared to overall network performance. \nThis approach is a compute- and data-efficient method for identifying and removing neurons that enable specific behaviours.\nOur findings reveal that both feed-forward and attention neurons in LLMs are specialized; \nthat is, for specific tasks, certain neurons are more crucial than others.", "keywords": "language models;pruning;machine unlearning;capability removal;intepretability;modularity", "primary_area": "visualization or interpretation of learned representations", "supplementary_material": "", "author": "Nicky Pochinkov;Nandi Schoots", "authorids": "~Nicky_Pochinkov1;~Nandi_Schoots1", "gender": "M;F", "homepage": "https://nicky.pro;https://safeandtrustedai.org/person/nandi-schoots/", "dblp": ";", "google_scholar": ";", "orcid": ";", "linkedin": "https://linkedin.com/in/nicky-pochinkov;", "or_profile": "~Nicky_Pochinkov1;~Nandi_Schoots1", "aff": "Independant;Imperial College London", "aff_domain": "nicky.pro;ic.ac.uk", "position": "Researcher;PhD student", "bibtex": "@misc{\npochinkov2024dissecting,\ntitle={Dissecting Language Models: Machine Unlearning via Selective Pruning},\nauthor={Nicky Pochinkov and Nandi Schoots},\nyear={2024},\nurl={https://openreview.net/forum?id=8SPSIfR2e0}\n}", "github": "", "project": "", "reviewers": "sDUD;Q3q4;9FMg;q42J", "site": "https://openreview.net/forum?id=8SPSIfR2e0", "pdf_size": 4096323, "rating": "5;6;6;6", "confidence": "4;4;3;4", "soundness": "2;3;3;3", "contribution": "2;3;3;3", "presentation": "3;2;3;3", "wc_summary": "238;71;84;118", "wc_strengths": "45;88;45;90", "wc_weaknesses": "817;353;229;91", "wc_questions": "209;114;192;10", "wc_review": "1309;626;550;309", "wc_reply_reviewers": "367;12;0;0", "wc_reply_authors": "1379;755;600;294", "reply_reviewers": "1;1;0;0", "reply_authors": "2;1;1;1", "rating_avg": [ 5.75, 0.4330127018922193 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 127.75, 65.9256209678756 ], "wc_strengths_avg": [ 67.0, 22.01136070305514 ], "wc_weaknesses_avg": [ 372.5, 272.8529823916169 ], "wc_questions_avg": [ 131.25, 78.63642603781024 ], "wc_review_avg": [ 698.5, 371.39231279066615 ], "wc_reply_reviewers_avg": [ 94.75, 157.25993609308125 ], "wc_reply_authors_avg": [ 757.0, 395.5711061237916 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.3333333333333333, "gs_citation": 14, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=2293050757298981416&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 3, "aff_unique_index": "0;1", "aff_unique_norm": "Independent;Imperial College London", "aff_unique_dep": ";", "aff_unique_url": 
";https://www.imperial.ac.uk", "aff_unique_abbr": ";ICL", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "1", "aff_country_unique": ";United Kingdom" }, { "id": "8T7m27VC3S", "title": "3D Dense Captioning beyond Nouns: A Middleware for Autonomous Driving", "track": "main", "status": "Reject", "tldr": "", "abstract": "Recently, language foundation models have revolutionized many fields and how they could enable smarter and safer autonomous vehicles remains elusive. We believe one major obstacle is the lack of a comprehensive and standard middleware representation that links perception and planning. We rethink the limitations of existing middleware (e.g., 3D boxes or occupancy) and propose 3\\textbf{D} d\\textbf{e}n\\textbf{s}e capt\\textbf{i}onin\\textbf{g} beyond \\textbf{n}ouns (or abbreviated as DESIGN). For each input scenario, DESIGN refers to a set of 3D bounding boxes with a language description for each. Notably, the \\textbf{comprehensive} description involves not only what the box is (noun) but also its attribute (adjective), location (preposition) and moving status (adverb). We design a scalable rule-based auto-labelling methodology to generate DESIGN ground truth, guaranteeing that the middleware is \\textbf{standard}. Using this methodology, we construct a large-scale dataset nuDesign based upon nuScenes, which consists of an unprecedented number of 2300k sentences. We also present an extensive benchmarking on nuDesign, featuring a model named DESIGN-former that takes multi-modal inputs and predicts reliable DESIGN outputs. Through qualitative visualizations, we demonstrate that DEISGN, as a novel 3D scene understanding middleware, has good interpretability. We release our code, data and models, hoping this middleware could trigger better autonomous driving algorithms and systems that benefit from the power of language foundation models.", "keywords": "Autonomous Driving;Dense Captioning;Foundation model", "primary_area": "datasets and benchmarks", "supplementary_material": "", "author": "Bu Jin;Yupeng Zheng;Pengfei Li;Sujie Hu;Zhijie Yan;Xinyu Liu;Yuhang Zheng;Jingjing Huang;Jinwei Zhu;Guyue Zhou;Yilun Chen;Hao Zhao", "authorids": "~Bu_Jin1;~Yupeng_Zheng1;~Pengfei_Li6;~Sujie_Hu1;~Zhijie_Yan3;~Xinyu_Liu9;~Yuhang_Zheng2;~Jingjing_Huang2;~Jinwei_Zhu1;~Guyue_Zhou2;~Yilun_Chen3;~Hao_Zhao1", "gender": ";;M;F;M;F;M;F;M;M;M;M", "homepage": ";;https://github.com/Philipflyg;https://husujie.github.io/;;https://liuxinyv.github.io/;;https://github.com//JJingH;http://hao.360.com/?a1004;https://air.tsinghua.edu.cn/en/info/1046/1196.htm;https://air.tsinghua.edu.cn/info/1046/1769.htm;https://sites.google.com/view/fromandto", "dblp": ";;;;;;;;;133/4199;;08/3737-2.html", "google_scholar": ";;https://scholar.google.com/citations?view_op=list_works;;4PXGeaYAAAAJ;kgRjFN8AAAAJ;;;;;XGnsL5MAAAAJ;ygQznUQAAAAJ", "orcid": ";;;;;;0000-0001-8215-6962;;;;;", "linkedin": ";;;;;%E6%98%95%E7%85%9C-%E5%88%98-847812247/;;;;;;", "or_profile": "~Bu_Jin1;~Yupeng_Zheng1;~Pengfei_Li6;~Sujie_Hu1;~Zhijie_Yan3;~Xinyu_Liu9;~Yuhang_Zheng2;~Jingjing_Huang2;~Jinwei_Zhu1;~Guyue_Zhou2;~Yilun_Chen3;~Hao_Zhao1", "aff": ";;Tsinghua University;Minzu University of China;Beihang University;Hong Kong University of Science and Technology;Beihang University;Shanghai University;Beijing Jiaotong University;Tsinghua University;;Peking University", "aff_domain": ";;tsinghua.edu.cn;muc.edu.cn;buaa.edu.cn;connect.ust.hk;buaa.edu.cn;shu.edu.cn;bjtu.edu.cn;tsinghua.edu.cn;;pku.edu.cn", "position": ";;PhD 
student;Undergrad student;MS student;PhD student;MS student;Undergrad student;Undergrad student;Associate Professor;;Postdoc", "bibtex": "@misc{\njin2024d,\ntitle={3D Dense Captioning beyond Nouns: A Middleware for Autonomous Driving},\nauthor={Bu Jin and Yupeng Zheng and Pengfei Li and Sujie Hu and Zhijie Yan and Xinyu Liu and Yuhang Zheng and Jingjing Huang and Jinwei Zhu and Guyue Zhou and Yilun Chen and Hao Zhao},\nyear={2024},\nurl={https://openreview.net/forum?id=8T7m27VC3S}\n}", "github": "", "project": "", "reviewers": "rzAd;a5o2;R3EY", "site": "https://openreview.net/forum?id=8T7m27VC3S", "pdf_size": 11612601, "rating": "3;3;6", "confidence": "4;5;5", "soundness": "2;2;2", "contribution": "2;2;3", "presentation": "2;2;2", "wc_summary": "106;142;73", "wc_strengths": "66;267;43", "wc_weaknesses": "358;357;169", "wc_questions": "32;42;3", "wc_review": "562;808;288", "wc_reply_reviewers": "264;203;0", "wc_reply_authors": "1712;762;340", "reply_reviewers": "1;1;0", "reply_authors": "3;1;1", "rating_avg": [ 4.0, 1.4142135623730951 ], "confidence_avg": [ 4.666666666666667, 0.4714045207910317 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.0, 0.0 ], "wc_summary_avg": [ 107.0, 28.178005607210743 ], "wc_strengths_avg": [ 125.33333333333333, 100.6125682451695 ], "wc_weaknesses_avg": [ 294.6666666666667, 88.86068997156292 ], "wc_questions_avg": [ 25.666666666666668, 16.539514973407037 ], "wc_review_avg": [ 552.6666666666666, 212.39167173460973 ], "wc_reply_reviewers_avg": [ 155.66666666666666, 112.85487239026158 ], "wc_reply_authors_avg": [ 938.0, 573.7757982580537 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 1.6666666666666667, 0.9428090415820634 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 12, 0 ], "corr_rating_confidence": 0.5, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:jFZz7htIdqEJ:scholar.google.com/&scioq=3D+Dense+Captioning+beyond+Nouns:+A+Middleware+for+Autonomous+Driving&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1;2;3;2;4;5;0;6", "aff_unique_norm": "Tsinghua University;Minzu University of China;Beihang University;Hong Kong University of Science and Technology;Shanghai University;Beijing Jiao Tong University;Peking University", "aff_unique_dep": ";;;;;;", "aff_unique_url": "https://www.tsinghua.edu.cn;http://www.muc.edu.cn/;http://www.buaa.edu.cn/;https://www.ust.hk;https://www.shu.edu.cn;http://www.njtu.edu.cn/en;http://www.pku.edu.cn", "aff_unique_abbr": "THU;MUC;BUAA;HKUST;SHU;BJTU;Peking U", "aff_campus_unique_index": "1", "aff_campus_unique": ";Hong Kong SAR", "aff_country_unique_index": "0;0;0;0;0;0;0;0;0", "aff_country_unique": "China" }, { "id": "8TAGx549Ns", "title": "REX: Rapid Exploration and eXploitation for AI agents", "track": "main", "status": "Reject", "tldr": "", "abstract": "AI agents leveraging the capabilities of Large Language Models (LLMs) and Reinforcement Learning (RL) techniques have garnered growing attention due to their commendable performance in autonomously executing real-world tasks. Effective exploration of the action space is paramount for the successful accomplishment of diverse tasks by these AI agents. In this paper, we propose an enhanced approach for $\\textbf{R}$apid $\\textbf{E}$xploration and e$\\textbf{X}$ploitation of action space for LLM-based AI agents, called $\\textbf{REX}$. 
Existing LLM-driven agents have inherent limitations, such as a heavy reliance on precise descriptions for decision-making, and the lack of a systematic approach to leverage try-and-fail procedures akin to traditional RL. REX introduces an additional layer of rewards and integrates concepts similar to Upper Confidence Bound (UCB) scores, leading to more robust and efficient AI agent performance. This approach has the advantage of enabling the utilization of offline behaviors from logs and allowing seamless integration with existing foundation models while it does not require any model fine-tuning. Through comparative analysis with existing methods such as Chain-of-Thought(CoT) and Reflexion, REX-based methods demonstrate comparable performance and, in certain cases, even surpass the results achieved by these existing techniques. Notably, REX-based methods exhibit remarkable reductions in execution time while systematically exploring the action space of AI agents, enhancing their practical applicability across a diverse set of scenarios.", "keywords": "AI agent;Large Language Models;Upper Confidence Bound", "primary_area": "generative models", "supplementary_material": "/attachment/3976967bb4823484c0b7b2480d8a7c08e6e43a11.zip", "author": "Rithesh R N;Shelby Heinecke;Juan Carlos Niebles;Zhiwei Liu;Le Xue;Weiran Yao;Yihao Feng;Zeyuan Chen;Akash Gokul;Devansh Arpit;Ran Xu;Phil L Mui;Huan Wang;Caiming Xiong;Silvio Savarese", "authorids": "~Rithesh_R_N1;~Shelby_Heinecke1;~Juan_Carlos_Niebles1;~Zhiwei_Liu3;~Le_Xue1;~Weiran_Yao1;~Yihao_Feng1;~Zeyuan_Chen1;~Akash_Gokul1;~Devansh_Arpit2;~Ran_Xu1;~Phil_L_Mui1;~Huan_Wang1;~Caiming_Xiong1;~Silvio_Savarese1", "gender": "M;F;M;;M;M;M;M;;M;M;;M;M;M", "homepage": "https://ritheshrn.github.io/;http://www.shelbyh.ai;http://www.niebles.net/;https://sites.google.com/view/zhiwei-jim;;;;https://www.linkedin.com/in/zeyuan-chen-0253b6141/;;;;;http://www.cs.yale.edu/homes/wang-huan/;http://cmxiong.com/;", "dblp": "352/4275;;26/647;90/9499-1.html;304/2195;192/3295;204/3696;191/1578-1.html;;120/8494;;;70/6155-16.html;80/7282;50/3578", "google_scholar": "https://scholar.google.ca/citations?user=Y1XpJucAAAAJ;tS937l8AAAAJ;hqNhUCYAAAAJ;https://scholar.google.com/citations?;https://scholar.google.com/citations?view_op=list_works;rr_leUAAAAAJ;uqnNle0AAAAJ;znf-4mgAAAAJ;;https://scholar.google.ca/citations?hl=en;sgBB2sUAAAAJ;;7NpTttkAAAAJ;vaSdahkAAAAJ;ImpbxLsAAAAJ", "orcid": ";;;0000-0003-1525-1067;0000-0003-2810-770X;;;0009-0003-2471-5449;;;;;;;", "linkedin": "rithesh-r-n/;shelbyheinecke;;;le-tycho-xue-5abbb9157/;;;zeyuan-chen-/;;;;;huanwangyale/;caiming-xiong-150a1417;", "or_profile": "~Rithesh_R_N1;~Shelby_Heinecke1;~Juan_Carlos_Niebles1;~Zhiwei_Liu3;~Le_Xue1;~Weiran_Yao1;~Yihao_Feng1;~Zeyuan_Chen1;~Akash_Gokul1;~Devansh_Arpit2;~Ran_Xu1;~Phil_L_Mui1;~Huan_Wang1;~Caiming_Xiong1;~Silvio_Savarese1", "aff": "SalesForce.com;Salesforce Research;Stanford University;Salesforce AI Research;Salesforce;SalesForce.com;Salesforce AI Research;Salesforce Inc;;VaniLabs;SalesForce.com;;Salesforce.com;Salesforce Research;Stanford University", "aff_domain": "salesforce.com;salesforce.com;stanford.edu;salesforce.com;salesforce.com;salesforce.com;salesforce.com;salesforce.com;;vanilabs.com;salesforce.com;;salesforce.com;salesforce.com;stanford.edu", "position": "Researcher;Researcher;Adjunct Professor;Researcher;Researcher;Researcher;Researcher;Researcher;;Principal Researcher;senior manager;;Researcher;Research Scientist;Adjunct Professor", "bibtex": "@misc{\nn2024rex,\ntitle={{REX}: Rapid 
Exploration and eXploitation for {AI} agents},\nauthor={Rithesh R N and Shelby Heinecke and Juan Carlos Niebles and Zhiwei Liu and Le Xue and Weiran Yao and Yihao Feng and Zeyuan Chen and Akash Gokul and Devansh Arpit and Ran Xu and Phil L Mui and Huan Wang and Caiming Xiong and Silvio Savarese},\nyear={2024},\nurl={https://openreview.net/forum?id=8TAGx549Ns}\n}", "github": "", "project": "", "reviewers": "b79r;3Nop;1Dq3;up34", "site": "https://openreview.net/forum?id=8TAGx549Ns", "pdf_size": 642008, "rating": "3;3;5;5", "confidence": "4;4;2;4", "soundness": "2;2;2;3", "contribution": "2;2;2;2", "presentation": "2;2;3;2", "wc_summary": "186;62;50;49", "wc_strengths": "134;40;51;21", "wc_weaknesses": "244;284;73;26", "wc_questions": "355;119;127;219", "wc_review": "919;505;301;315", "wc_reply_reviewers": "71;17;12;13", "wc_reply_authors": "894;916;768;745", "reply_reviewers": "1;1;1;1", "reply_authors": "2;2;1;1", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 3.5, 0.8660254037844386 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 86.75, 57.52988353890524 ], "wc_strengths_avg": [ 61.5, 43.21168823362494 ], "wc_weaknesses_avg": [ 156.75, 109.4471904618844 ], "wc_questions_avg": [ 205.0, 95.09994742374992 ], "wc_review_avg": [ 510.0, 249.505510961181 ], "wc_reply_reviewers_avg": [ 28.25, 24.752525123712125 ], "wc_reply_authors_avg": [ 830.75, 75.09785283215493 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 15, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 9, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=15336770226670021155&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "aff_unique_index": "0;0;1;0;0;0;0;0;2;0;0;0;1", "aff_unique_norm": "Salesforce;Stanford University;VaniLabs", "aff_unique_dep": ";;", "aff_unique_url": "https://www.salesforce.com;https://www.stanford.edu;", "aff_unique_abbr": "Salesforce;Stanford;", "aff_campus_unique_index": "1;1", "aff_campus_unique": ";Stanford", "aff_country_unique_index": "0;0;0;0;0;0;0;0;0;0;0;0", "aff_country_unique": "United States;" }, { "id": "8TyGCAuCGd", "title": "Look Ma, No Training! Observation Space Design for Reinforcement Learning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Many scientific communities agree on the potential of reinforcement learning (RL) agents to solve real-world problems, yet such consensus does not extend to how these agents should be designed. In some practical applications, the increasing literature on RL does not shed light on which RL components work better for a particular problem, they are usually treated just as configuration elements to be reported. One of these components is the choice of observation space, which in some cases entails dealing with tens of thousands of observable features. Choosing a rich yet efficient observation space is key to encoding useful information while limiting the tangible implications of adding extra features. Gaining understanding of feature relevance has already been studied for RL. In comparison to supervised learning, the effect of dependencies across states adds a layer of complexity to the structure of the problem. Many of the proposed methods require training RL agents from scratch several times, which is costly in real-world applications. 
In this paper, we propose a simple and cost-efficient way to find good observation spaces that does not require training. Specifically, we propose leveraging multiple random policies when comparing candidate spaces for the same problem. By conducting rollouts with different random policies for each candidate space, we are able to identify statistically-significant signals that indicate which features are better suited for the application considered. We demonstrate the usefulness of our approach in different RL problems, including Traffic Signal Control. By combining random policy sampling with the Hill Climbing search algorithm, we find observation spaces that use fewer features and achieve comparable or greater return. Overall, this work suggests a straightforward and inexpensive approach to an important aspect of RL design that is often overlooked and is crucial for applied problems.", "keywords": "observation space design;real-world reinforcement learning", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/bc80203cac72704cc955fd8185b5448ce4560428.zip", "author": "Juan Jose Garau-Luis;Ram Krishna Goel;Edward Crawley;Cathy Wu", "authorids": "~Juan_Jose_Garau-Luis1;~Ram_Krishna_Goel1;~Edward_Crawley1;~Cathy_Wu1", "gender": "M;M;;F", "homepage": ";;https://aeroastro.mit.edu/people/edward-f-crawley/;http://wucathy.com", "dblp": ";;;155/3740", "google_scholar": "FpaKuysAAAAJ;;;https://scholar.google.com/citations?hl=en", "orcid": ";;;0000-0001-8594-303X", "linkedin": "juanjosegarau/;ram-krishna-goel-5a662320a/;;cathywu/", "or_profile": "~Juan_Jose_Garau-Luis1;~Ram_Krishna_Goel1;~Edward_Crawley1;~Cathy_Wu1", "aff": ";Massachusetts Institute of Technology;;Massachusetts Institute of Technology", "aff_domain": ";mit.edu;;mit.edu", "position": ";Undergrad student;;Assistant Professor", "bibtex": "@misc{\ngarau-luis2024look,\ntitle={Look Ma, No Training! 
Observation Space Design for Reinforcement Learning},\nauthor={Juan Jose Garau-Luis and Ram Krishna Goel and Edward Crawley and Cathy Wu},\nyear={2024},\nurl={https://openreview.net/forum?id=8TyGCAuCGd}\n}", "github": "", "project": "", "reviewers": "NkaL;CJ7V;N2rj;fGnS", "site": "https://openreview.net/forum?id=8TyGCAuCGd", "pdf_size": 1037059, "rating": "1;3;5;5", "confidence": "4;4;4;5", "soundness": "1;1;2;2", "contribution": "2;2;3;1", "presentation": "3;3;3;3", "wc_summary": "169;38;107;34", "wc_strengths": "51;134;51;31", "wc_weaknesses": "395;500;271;257", "wc_questions": "34;56;52;18", "wc_review": "649;728;481;340", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 3.5, 1.6583123951777 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 1.5, 0.5 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 87.0, 55.52927156014204 ], "wc_strengths_avg": [ 66.75, 39.67603180762915 ], "wc_weaknesses_avg": [ 355.75, 99.09938193550957 ], "wc_questions_avg": [ 40.0, 15.165750888103101 ], "wc_review_avg": [ 549.5, 150.28722500598644 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.5222329678670935, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:RErkHn1mq6sJ:scholar.google.com/&scioq=Look+Ma,+No+Training!+Observation+Space+Design+for+Reinforcement+Learning&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "Massachusetts Institute of Technology", "aff_unique_dep": "", "aff_unique_url": "https://web.mit.edu", "aff_unique_abbr": "MIT", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "title": "Revisiting Link Prediction: a data perspective", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19325", "id": "8Ur2xmuw7w", "author_site": "Haitao Mao, Juanhui Li, Harry Shomer, Bingheng Li, Wenqi Fan, Yao Ma, Tong Zhao, Neil Shah, Jiliang Tang", "tldr": "", "abstract": "Link prediction, a fundamental task on graphs, has proven indispensable in various applications, e.g., friend recommendation, protein analysis, and drug interaction prediction. However, since datasets span a multitude of domains, they could have distinct underlying mechanisms of link formation. Evidence in existing literature underscores the absence of a universally best algorithm suitable for all datasets. In this paper, we endeavor to explore principles of link prediction across diverse datasets from a data-centric perspective. We recognize three fundamental factors critical to link prediction: local structural proximity, global structural proximity, and feature proximity. We then unearth relationships among those factors where (i) global structural proximity only shows effectiveness when local structural proximity is deficient. (ii) The incompatibility can be found between feature and structural proximity. Such incompatibility leads to GNNs for Link Prediction (GNN4LP) consistently underperforming on edges where the feature proximity factor dominates. 
Inspired by these new insights from a data perspective, we offer practical instruction for GNN4LP model design and guidelines for selecting appropriate benchmark datasets for more comprehensive evaluations.", "keywords": "Link Prediction;Graph Neural Network", "primary_area": "learning on graphs and other geometries & topologies", "supplementary_material": "/attachment/7f292b427499ef2c6a3ca14529b1b63f683de205.zip", "author": "Haitao Mao;Juanhui Li;Harry Shomer;Bingheng Li;Wenqi Fan;Yao Ma;Tong Zhao;Neil Shah;Jiliang Tang", "authorids": "~Haitao_Mao1;~Juanhui_Li1;~Harry_Shomer1;~Bingheng_Li1;~Wenqi_Fan1;~Yao_Ma3;~Tong_Zhao3;~Neil_Shah2;~Jiliang_Tang1", "gender": "F;;M;M;M;M;M;M;M", "homepage": "https://juanhui28.github.io/;https://www.cse.msu.edu/~shomerha/;https://github.com/uestclbh;https://wenqifan03.github.io;https://yaoma24.github.io/;https://tzhao.io/;http://nshah.net;https://www.cse.msu.edu/~tangjili/;", "dblp": "313/9527.html;;;218/7410;212/7871.html;94/6503-3;71/7771;64/10812;", "google_scholar": "5J0dd-sAAAAJ;_6eE2vsAAAAJ;;https://scholar.google.com/citations?hl=en;wf9TTOIAAAAJ;05cRc-MAAAAJ;Qut69OgAAAAJ;WtzKMWAAAAAJ;3GmlKM4AAAAJ", "orcid": "0000-0003-4909-1778;0000-0001-5081-1870;0009-0000-0950-9012;0000-0002-4049-1233;;0000-0001-7660-1732;0000-0003-3261-8430;0000-0001-7125-3898;", "linkedin": ";;;wenqi-fan-a425a7196/;;;;;", "or_profile": "~Juanhui_Li1;~Harry_Shomer1;~Bingheng_Li1;~Wenqi_Fan1;~Yao_Ma3;~Tong_Zhao3;~Neil_Shah2;~Jiliang_Tang1;~Mao_Haitao1", "aff": "Amazon;Michigan State University;University of Electronic Science and Technology of China;The Hong Kong Polytechnic University;Rensselaer Polytechnic Institute;Snap Inc.;Snap Inc.;Michigan State University;Michigan State University", "aff_domain": "amazon.com;msu.edu;uestc.edu.cn;polyu.edu.hk;rpi.edu;snap.com;snap.com;msu.edu;msu.edu", "position": "Intern;PhD student;Undergrad student;Assistant Professor;Assistant Professor;Researcher;Research Scientist;Full Professor;PhD student", "bibtex": "@inproceedings{\nmao2024revisiting,\ntitle={Revisiting Link Prediction: a data perspective},\nauthor={Haitao Mao and Juanhui Li and Harry Shomer and Bingheng Li and Wenqi Fan and Yao Ma and Tong Zhao and Neil Shah and Jiliang Tang},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=8Ur2xmuw7w}\n}", "github": "", "project": "", "reviewers": "zuoh;cwp2;wtEd;Rht2", "pdf_size": 842601, "rating": "5;6;6;8", "confidence": "3;4;5;5", "soundness": "3;3;3;4", "contribution": "1;3;2;4", "presentation": "3;1;3;3", "wc_summary": "114;128;98;83", "wc_strengths": "83;120;30;146", "wc_weaknesses": "87;246;11;80", "wc_questions": "14;18;73;3", "wc_review": "298;512;212;312", "wc_reply_reviewers": "0;0;0;42", "wc_reply_authors": "1118;1808;887;959", "reply_reviewers": "0;0;0;1", "reply_authors": "4;5;3;4", "rating_avg": [ 6.25, 1.0897247358851685 ], "confidence_avg": [ 4.25, 0.82915619758885 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 2.5, 1.118033988749895 ], "presentation_avg": [ 2.5, 0.8660254037844386 ], "wc_summary_avg": [ 105.75, 16.887495373796554 ], "wc_strengths_avg": [ 94.75, 43.573931426943794 ], "wc_weaknesses_avg": [ 106.0, 86.1132974632838 ], "wc_questions_avg": [ 27.0, 27.120103244641236 ], "wc_review_avg": [ 333.5, 109.93975623040102 ], "wc_reply_reviewers_avg": [ 10.5, 18.186533479473212 ], "wc_reply_authors_avg": [ 1193.0, 364.7745879306836 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 4.0, 
0.7071067811865476 ], "replies_avg": [ 23, 0 ], "authors#_avg": [ 9, 0 ], "corr_rating_confidence": 0.7608859102526822, "gs_citation": 25, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=2697033961358863084&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=8Ur2xmuw7w", "pdf": "https://openreview.net/pdf?id=8Ur2xmuw7w", "email": "amazon.com;msu.edu;uestc.edu.cn;polyu.edu.hk;rpi.edu;snap.com;snap.com;msu.edu;msu.edu", "author_num": 9, "aff_unique_index": "0;1;2;3;4;5;5;1;1", "aff_unique_norm": "Amazon;Michigan State University;University of Electronic Science and Technology of China;Hong Kong Polytechnic University;Rensselaer Polytechnic Institute;Snap Inc.", "aff_unique_dep": "Amazon.com, Inc.;;;;;", "aff_unique_url": "https://www.amazon.com;https://www.msu.edu;https://www.uestc.edu.cn;https://www.polyu.edu.hk;https://www.rpi.edu;https://www.snapinc.com", "aff_unique_abbr": "Amazon;MSU;UESTC;PolyU;RPI;Snap", "aff_campus_unique_index": "1", "aff_campus_unique": ";Hong Kong SAR", "aff_country_unique_index": "0;0;1;1;0;0;0;0;0", "aff_country_unique": "United States;China" }, { "id": "8V3C2ijJ33", "title": "Lightweight In-Context Tuning for Multimodal Unified Models", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "In-context learning (ICL) involves reasoning from given contextual examples. As more modalities come, this procedure is becoming more challenging as the interleaved input modalities convolute the understanding process. This is exemplified by the observation that multimodal models often struggle to effectively extrapolate from contextual examples to perform ICL. To address these challenges, we introduce Multimodal In-context Tuning (M$^{2}$IXT), a lightweight module to enhance the ICL capabilities of multimodal unified models. The proposed M$^{2}$IXT module perceives an expandable context window to incorporate various labeled examples of multiple modalities (e.g., text, image, and coordinates). It can be prepended to various multimodal unified models (e.g., OFA, Unival, LLaVA) of different architectures and trained via a mixed-tasks strategy to enable rapid few-shot adaptation on multiple tasks and datasets. 
When tuned on as little as 50K multimodal data, M$^{2}$IXT can boost the few-shot ICL performance significantly (e.g., 18% relative increase for OFA), and obtained state-of-the-art results across an array of tasks including visual question answering, image captioning, visual grounding, and visual entailment, while being considerably small in terms of model parameters (e.g., ~20x smaller than Flamingo or MMICL), highlighting the flexibility and effectiveness of M$^{2}$IXT as a multimodal in-context learner.", "keywords": "Multi-modality;Unified Autoregressive Model;Multi-tasking;In-Context Tuning;Few-shot Adaptation", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Yixin Chen;Shuai Zhang;Boran Han;Jiaya Jia", "authorids": "~Yixin_Chen4;~Shuai_Zhang7;~Boran_Han1;~Jiaya_Jia1", "gender": "M;;;M", "homepage": "https://yix-chen.github.io/;;;https://jiaya.me", "dblp": "59/983;;;31/5649", "google_scholar": "tEWGP3sAAAAJ;;;https://scholar.google.com.tw/citations?user=XPAkzTEAAAAJ", "orcid": ";;;", "linkedin": ";;;", "or_profile": "~Yixin_Chen4;~Shuai_Zhang7;~Boran_Han1;~Jiaya_Jia1", "aff": "Department of Computer Science and Engineering, The Chinese University of Hong Kong;;;Department of Computer Science and Engineering, Hong Kong University of Science and Technology", "aff_domain": "cse.cuhk.edu.hk;;;cse.ust.hk", "position": "PhD student;;;Full Professor", "bibtex": "@misc{\nchen2024lightweight,\ntitle={Lightweight In-Context Tuning for Multimodal Unified Models},\nauthor={Yixin Chen and Shuai Zhang and Boran Han and Jiaya Jia},\nyear={2024},\nurl={https://openreview.net/forum?id=8V3C2ijJ33}\n}", "github": "", "project": "", "reviewers": "rfnh;1Zj1;kbgq;bTML", "site": "https://openreview.net/forum?id=8V3C2ijJ33", "pdf_size": 3375440, "rating": "3;5;5;6", "confidence": "4;4;4;3", "soundness": "2;2;3;3", "contribution": "2;2;3;3", "presentation": "3;3;2;3", "wc_summary": "19;129;78;49", "wc_strengths": "33;200;94;37", "wc_weaknesses": "378;437;120;6", "wc_questions": "21;4;35;119", "wc_review": "451;770;327;211", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.75, 1.0897247358851685 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 68.75, 40.56091098582476 ], "wc_strengths_avg": [ 91.0, 67.39807118901845 ], "wc_weaknesses_avg": [ 235.25, 178.12828944331105 ], "wc_questions_avg": [ 44.75, 44.25141240683737 ], "wc_review_avg": [ 439.75, 208.70478552251743 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.6622661785325219, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=2956087388086531757&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 3, "aff_unique_index": "0;1", "aff_unique_norm": "Chinese University of Hong Kong;Hong Kong University of Science and Technology", "aff_unique_dep": "Department of Computer Science and Engineering;Department of Computer Science and Engineering", "aff_unique_url": "https://www.cuhk.edu.hk;https://www.ust.hk", "aff_unique_abbr": "CUHK;HKUST", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Hong Kong SAR", "aff_country_unique_index": "0;0", 
"aff_country_unique": "China" }, { "id": "8VHCeoBGxB", "title": "Revisiting the Temporal Modeling in Spatio-Temporal Predictive Learning under A Unified View", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Spatio-temporal predictive learning plays a crucial role in self-supervised learning, with wide-ranging applications across a diverse range of fields. Previous approaches for temporal modeling fall into two categories: recurrent-based and recurrent-free methods. The former, while meticulously processing frames one by one, neglect short-term spatio-temporal information redundancies, leading to inefficiencies. The latter naively stack frames sequentially, overlooking the inherent temporal dependencies. In this paper, we re-examine the two dominant temporal modeling approaches within the realm of spatio-temporal predictive learning, offering a unified perspective. Building upon this analysis, we introduce USTEP (Unified Spatio-TEmporal Predictive learning), an innovative framework that reconciles the recurrent-based and recurrent-free methods by integrating both micro-temporal and macro-temporal scales. Extensive experiments on a wide range of spatio-temporal predictive learning demonstrate that USTEP achieves significant improvements over existing temporal modeling approaches, thereby establishing it as a robust solution for a wide range of spatio-temporal applications.", "keywords": "self-supervised learning", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/65f8f7dbbb41ca55d8a80cd4687076b81425c700.zip", "author": "Cheng Tan;Jue Wang;Zhangyang Gao;Siyuan Li;Lirong Wu;Jun Xia;Stan Z. Li", "authorids": "~Cheng_Tan1;~Jue_Wang9;~Zhangyang_Gao1;~Siyuan_Li6;~Lirong_Wu1;~Jun_Xia1;~Stan_Z._Li2", "gender": "M;;M;M;;M;M", "homepage": "https://chengtan9907.github.io/;https://scholar.google.com.hk/citations?hl=zh-CN&pli=1&user=NjYyuQQAAAAJ;;https://lupin1998.github.io/;;http://junxia97.github.io/;https://en.westlake.edu.cn/academics/School_of_Engineering/About/Our_People/Faculty/201912/t20191206_2497.shtml", "dblp": "70/1533-12.html;;275/3266;63/9705-2;15/10330;;l/StanZLi", "google_scholar": "6kTV6aMAAAAJ;https://scholar.google.com.hk/citations?hl=zh-CN;4SclT-QAAAAJ;https://scholar.google.com/citations?hl=zh-CN;Tk7TrCoAAAAJ;aPKKpSYAAAAJ;https://scholar.google.com/citations?hl=zh-CN", "orcid": ";;0000-0003-1026-6083;0000-0001-6806-2468;;;", "linkedin": ";;;https://www.linkedin.cn/incareer/in/siyuan-li-lupin1998/;;;stan-z-li-%E6%9D%8E%E5%AD%90%E9%9D%92-55753224/", "or_profile": "~Cheng_Tan1;~Jue_Wang9;~Zhangyang_Gao1;~Siyuan_Li6;~Lirong_Wu1;~Jun_Xia1;~Stan_Z._Li1", "aff": "Zhejiang University & Westlake University;Zhongnan University of Economics and Law;Westlake University, China;Alibaba Group;Westlake University;Westlake University, China;Westlake University", "aff_domain": "westlake.edu.cn;zuel.edu.cn;westlake.edu.cn;alibaba-inc.com;westlake.edu.cn;westlake.edu.cn;westlake.edu.cn", "position": "PhD student;Undergrad student;PhD student;Intern;PhD student;PhD student;Chair Professor", "bibtex": "@misc{\ntan2024revisiting,\ntitle={Revisiting the Temporal Modeling in Spatio-Temporal Predictive Learning under A Unified View},\nauthor={Cheng Tan and Jue Wang and Zhangyang Gao and Siyuan Li and Lirong Wu and Jun Xia and Stan Z. 
Li},\nyear={2024},\nurl={https://openreview.net/forum?id=8VHCeoBGxB}\n}", "github": "", "project": "", "reviewers": "ygZp;nrq1;sHRf;8Yx7", "site": "https://openreview.net/forum?id=8VHCeoBGxB", "pdf_size": 942443, "rating": "3;3;5;6", "confidence": "4;3;3;3", "soundness": "3;3;2;2", "contribution": "3;2;2;2", "presentation": "3;2;3;3", "wc_summary": "91;60;62;89", "wc_strengths": "20;80;28;175", "wc_weaknesses": "276;295;141;110", "wc_questions": "2;62;152;5", "wc_review": "389;497;383;379", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.25, 1.299038105676658 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 75.5, 14.534441853748634 ], "wc_strengths_avg": [ 75.75, 61.75910863994071 ], "wc_weaknesses_avg": [ 205.5, 81.02623032080415 ], "wc_questions_avg": [ 55.25, 60.75925855373813 ], "wc_review_avg": [ 412.0, 49.20365840057018 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.5555555555555555, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=3352675855393393460&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "aff_unique_index": "0;1;2;3;2;2;2", "aff_unique_norm": "Zhejiang University;Zhongnan University of Economics and Law;Westlake University;Alibaba Group", "aff_unique_dep": ";;;", "aff_unique_url": "http://www.zju.edu.cn;http://www.zuel.edu.cn/;https://www.westlake.edu.cn;https://www.alibaba.com", "aff_unique_abbr": "ZJU;ZUEL;WU;Alibaba", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0;0", "aff_country_unique": "China" }, { "title": "Context is Environment", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19324", "id": "8VPWfqtQMX", "author_site": "Sharut Gupta, Stefanie Jegelka, David Lopez-Paz, Kartik Ahuja", "tldr": "", "abstract": "Two lines of work are taking the central stage in AI research. On the one hand, the community is making increasing efforts to build models that discard spurious correlations and generalize better in novel test environments. Unfortunately, the hard lesson so far is that no proposal convincingly outperforms a simple empirical risk minimization baseline. On the other hand, large language models (LLMs) have erupted as algorithms able to learn in-context, generalizing on-the-fly to eclectic contextual circumstances that users enforce by means of prompting. In this paper, we argue that context is environment, and posit that in-context learning holds the key to better domain generalization. Via extensive theory and experiments, we show that paying attention to context$\\unicode{x2013}\\unicode{x2013}$unlabeled examples as they arrive$\\unicode{x2013}\\unicode{x2013}$allows our proposed In-Context Risk Minimization (ICRM) algorithm to zoom-in on the test environment risk minimizer, leading to significant out-of-distribution performance improvements. Furthermore, training with context helps the model learn a better featurizer. From all of this, two messages are worth taking home. Researchers in domain generalization should consider environment as context, and harness the adaptive power of in-context learning. 
Researchers in LLMs should consider context as environment, to better structure data towards generalization. Code is available at https://github.com/facebookresearch/ICRM.", "keywords": "Domain Generalization; In-Context Learning", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Sharut Gupta;Stefanie Jegelka;David Lopez-Paz;Kartik Ahuja", "authorids": "~Sharut_Gupta1;~Stefanie_Jegelka3;~David_Lopez-Paz2;~Kartik_Ahuja1", "gender": "F;F;;", "homepage": "https://www.mit.edu/~sharut/;http://people.csail.mit.edu/stefje/;http://lopezpaz.org;", "dblp": ";38/7003;74/10481;", "google_scholar": "https://scholar.google.com/citations?hl=en;gTWUZlsAAAAJ;;", "orcid": ";;;", "linkedin": "sharut-gupta/;;;", "or_profile": "~Sharut_Gupta1;~Stefanie_Jegelka3;~David_Lopez-Paz2;~Kartik_Ahuja1", "aff": "Google;Massachusetts Institute of Technology;Meta Facebook;", "aff_domain": "google.com;mit.edu;fb.com;", "position": "Student Researcher;Associate Professor;Research Scientist;", "bibtex": "@inproceedings{\ngupta2024context,\ntitle={Context is Environment},\nauthor={Sharut Gupta and Stefanie Jegelka and David Lopez-Paz and Kartik Ahuja},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=8VPWfqtQMX}\n}", "github": "", "project": "", "reviewers": "cBZm;NswY;1GJP;7Bph", "pdf_size": 3283081, "rating": "6;6;6;8", "confidence": "4;3;2;3", "soundness": "2;3;2;3", "contribution": "2;4;2;4", "presentation": "3;3;3;4", "wc_summary": "177;85;25;123", "wc_strengths": "54;120;16;237", "wc_weaknesses": "1496;519;192;443", "wc_questions": "100;84;289;710", "wc_review": "1827;808;522;1513", "wc_reply_reviewers": "1819;174;0;61", "wc_reply_authors": "4824;1304;2420;1488", "reply_reviewers": "4;1;0;1", "reply_authors": "9;3;5;3", "rating_avg": [ 6.5, 0.8660254037844386 ], "confidence_avg": [ 3.0, 0.7071067811865476 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 3.0, 1.0 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 102.5, 55.414348322433604 ], "wc_strengths_avg": [ 106.75, 83.9028456013263 ], "wc_weaknesses_avg": [ 662.5, 496.20182385799427 ], "wc_questions_avg": [ 295.75, 252.390941794669 ], "wc_review_avg": [ 1167.5, 524.4571002474845 ], "wc_reply_reviewers_avg": [ 513.5, 756.3116090607099 ], "wc_reply_authors_avg": [ 2509.0, 1401.928314857789 ], "reply_reviewers_avg": [ 1.5, 1.5 ], "reply_authors_avg": [ 5.0, 2.449489742783178 ], "replies_avg": [ 33, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": -1, "gs_cited_by_link": "", "gs_version_total": -1, "openreview": "https://openreview.net/forum?id=8VPWfqtQMX", "pdf": "https://openreview.net/pdf?id=8VPWfqtQMX", "email": "google.com;mit.edu;fb.com;", "author_num": 4, "aff_unique_index": "0;1;2", "aff_unique_norm": "Google;Massachusetts Institute of Technology;Meta", "aff_unique_dep": "Google;;Meta Platforms, Inc.", "aff_unique_url": "https://www.google.com;https://web.mit.edu;https://meta.com", "aff_unique_abbr": "Google;MIT;Meta", "aff_campus_unique_index": "0", "aff_campus_unique": "Mountain View;", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "8WH6ZlDad6", "title": "EWoK: Tackling Robust Markov Decision Processes via Estimating Worst Kernel", "track": "main", "status": "Reject", "tldr": "", "abstract": "Robust Markov Decision Processes (RMDPs) provide a framework for sequential decision-making that is robust to perturbations on the 
transition kernel. However, current RMDP methods are often limited to small-scale problems, hindering their use in realistic high-dimensional domains. To bridge this gap, we present **EWoK**, a novel approach for the online RMDP setting that **E**stimates the **Wo**rst transition **K**ernel to learn robust policies. Unlike previous works that regularize the policy or value updates, EWoK achieves robustness by simulating the worst scenarios for the agent while retaining complete flexibility in the learning process. Notably, EWoK can be applied on top of any off-the-shelf *non-robust* RL algorithm, enabling easy scaling to high-dimensional domains. Our experiments, spanning from simple Cartpole to high-dimensional MinAtar and DeepMind Control Suite environments, demonstrate the effectiveness and applicability of the EWoK paradigm as a practical method for learning robust policies.", "keywords": "robust Markov decision process;reinforcement learning", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Kaixin Wang;Uri Gadot;Navdeep Kumar;Kfir Yehuda Levy;Shie Mannor", "authorids": "~Kaixin_Wang1;~Uri_Gadot1;~Navdeep_Kumar1;~Kfir_Yehuda_Levy1;~Shie_Mannor2", "gender": "M;M;M;M;M", "homepage": "https://kaixin96.github.io;;;http://kfiryehud.wixsite.com/kfir-y-levy;https://shie.net.technion.ac.il", "dblp": ";349/0367;;83/11388;20/1669", "google_scholar": "https://scholar.google.com.sg/citations?hl=en;XXolX3MAAAAJ;;;https://scholar.google.com.tw/citations?user=q1HlbIUAAAAJ", "orcid": "0000-0001-8237-9285;;;;", "linkedin": ";;navdeepsjb/;;", "or_profile": "~Kaixin_Wang1;~Uri_Gadot1;~Navdeep_Kumar1;~Kfir_Yehuda_Levy1;~Shie_Mannor2", "aff": "Technion - Israel Institute of Technology, Technion - Israel Institute of Technology;Technion - Israel Institute of Technology, Technion - Israel Institute of Technology;Technion - Israel Institute of Technology, Technion - Israel Institute of Technology;Technion - Israel Institute of Technology, Technion;Technion - Israel Institute of Technology, Technion", "aff_domain": "campus.technion.ac.il;campus.technion.ac.il;campus.technion.ac.il;technion.ac.il;technion.il", "position": "Postdoc;PhD student;PhD student;Assistant Professor;Full Professor", "bibtex": "@misc{\nwang2024ewok,\ntitle={{EW}oK: Tackling Robust Markov Decision Processes via Estimating Worst Kernel},\nauthor={Kaixin Wang and Uri Gadot and Navdeep Kumar and Kfir Yehuda Levy and Shie Mannor},\nyear={2024},\nurl={https://openreview.net/forum?id=8WH6ZlDad6}\n}", "github": "", "project": "", "reviewers": "rzcF;QAuy;qiNv;vpVH", "site": "https://openreview.net/forum?id=8WH6ZlDad6", "pdf_size": 7772774, "rating": "3;6;6;6", "confidence": "4;2;4;3", "soundness": "2;3;3;3", "contribution": "1;3;2;3", "presentation": "2;2;3;2", "wc_summary": "34;86;59;96", "wc_strengths": "25;79;62;113", "wc_weaknesses": "118;80;137;310", "wc_questions": "178;97;148;31", "wc_review": "355;342;406;550", "wc_reply_reviewers": "609;23;0;106", "wc_reply_authors": "1235;259;630;423", "reply_reviewers": "2;1;0;1", "reply_authors": "4;2;2;3", "rating_avg": [ 5.25, 1.299038105676658 ], "confidence_avg": [ 3.25, 0.82915619758885 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.82915619758885 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 68.75, 24.200981385059574 ], "wc_strengths_avg": [ 69.75, 31.696805832764916 ], "wc_weaknesses_avg": [ 161.25, 88.29885333343803 ], "wc_questions_avg": [ 113.5, 55.74271252818614 ], "wc_review_avg": [ 413.25, 
82.49659083865224 ], "wc_reply_reviewers_avg": [ 184.5, 248.23627857345912 ], "wc_reply_authors_avg": [ 636.75, 369.57162702242175 ], "reply_reviewers_avg": [ 1.0, 0.7071067811865476 ], "reply_authors_avg": [ 2.75, 0.82915619758885 ], "replies_avg": [ 21, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.5222329678670935, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=1383827578533557120&as_sdt=80005&sciodt=0,11&hl=en", "gs_version_total": 0, "aff_unique_index": "0;0;0;0;0", "aff_unique_norm": "Technion - Israel Institute of Technology", "aff_unique_dep": "", "aff_unique_url": "https://www.technion.ac.il/en/", "aff_unique_abbr": "Technion", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "Israel" }, { "title": "OmniQuant: Omnidirectionally Calibrated Quantization for Large Language Models", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19323", "id": "8Wuvhh0LYW", "author_site": "Wenqi Shao, Mengzhao Chen, Zhaoyang Zhang, Peng Xu, Lirui Zhao, Zhiqian Li, Kaipeng Zhang, Gao Peng, Yu Qiao, Ping Luo", "tldr": "", "abstract": "Large language models (LLMs) have revolutionized natural language processing tasks. However, their practical deployment is hindered by their immense memory and computation requirements. Although recent post-training quantization (PTQ) methods are effective in reducing memory footprint and improving the computational efficiency of LLM, they hand-craft quantization parameters, leading to low performance, especially in extremely low-bit quantization. To tackle this issue, we introduce an Omnidirectionally calibrated Quantization ($\\textbf{OmniQuant}$) technique for LLMs, which achieves good performance in diverse quantization settings while maintaining the computational efficiency of PTQ by efficiently optimizing various quantization parameters. OmniQuant comprises two innovative components including Learnable Weight Clipping (LWC) and Learnable Equivalent Transformation (LET). LWC modulates the extreme values of weights by optimizing the clipping threshold. Meanwhile, LET tackles activation outliers by shifting the challenge of quantization from activations to weights. Operating within a differentiable framework using block-wise error minimization, OmniQuant can optimize the quantization process efficiently for both weight-only and weight-activation quantization. For instance, the LLaMA-2 model family size 7-70B can be processed with OmniQuant on a single A100-40G GPU within 1-16 hours using 128 samples. Extensive experiments validate OmniQuant's superior performance across diverse quantization configurations such as W4A4 (4-bit weight, 4-bit activation), W6A6, W4A16, W3A16, and W2A16. Additionally, OmniQuant demonstrates effectiveness in instruction-tuned models and delivers notable improvements in inference speed and memory reduction on real devices. 
Codes are available at \n\\url{https://github.com/OpenGVLab/OmniQuant}.", "keywords": "Large Language Model Compression;Differentiable Quantization", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/0974848a3a6e6d9966e1d4d1ac74e251b28c3d0c.zip", "author": "Wenqi Shao;Mengzhao Chen;Zhaoyang Zhang;Peng Xu;Lirui Zhao;Zhiqian Li;Kaipeng Zhang;Peng Gao;Yu Qiao;Ping Luo", "authorids": "~Wenqi_Shao2;~Mengzhao_Chen1;~Zhaoyang_Zhang1;~Peng_Xu11;~Lirui_Zhao1;~Zhiqian_Li1;~Kaipeng_Zhang1;~Peng_Gao3;~Yu_Qiao1;~Ping_Luo2", "gender": "M;M;M;M;M;F;M;;;", "homepage": "https://wqshao126.github.io/;https://chenmnz.github.io/;https://zzyfd.github.io/#/;;https://github.com/Lirui-Zhao;;http://kpzhang93.github.io/;;;", "dblp": "227/3122;301/9459;;;;;179/2126;;;", "google_scholar": "Bs9mrwwAAAAJ;https://scholar.google.com.hk/citations?user=dN7UtFkAAAAJ;Pf6o7uAAAAAJ;;;;4OqZBmYAAAAJ;;;", "orcid": ";;;;;;;;;", "linkedin": ";;;https://www.linkedin.cn/incareer/in/peng-xu-250466206;;zhiqian-li-a19727205/;;;;", "or_profile": "~Wenqi_Shao2;~Mengzhao_Chen1;~Zhaoyang_Zhang1;~Peng_Xu11;~Lirui_Zhao1;~Zhiqian_Li1;~Kaipeng_Zhang1;~Peng_Gao3;~Yu_Qiao1;~Ping_Luo2", "aff": "Shanghai AI Laboratory;Xiamen University;The Chinese University of Hong Kong;University of Hong Kong;Xiamen University;University of Hong Kong;Shanghai AI Laboratory;;;", "aff_domain": "pjlab.org.cn;xmu.edu.cn;cuhk.edu.hk;hku.hk;xmu.edu.cn;hku.hk;pjlab.org.cn;;;", "position": "Researcher;MS student;PhD student;PhD student;MS student;Undergrad student;Researcher;;;", "bibtex": "@inproceedings{\nshao2024omniquant,\ntitle={OmniQuant: Omnidirectionally Calibrated Quantization for Large Language Models},\nauthor={Wenqi Shao and Mengzhao Chen and Zhaoyang Zhang and Peng Xu and Lirui Zhao and Zhiqian Li and Kaipeng Zhang and Peng Gao and Yu Qiao and Ping Luo},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=8Wuvhh0LYW}\n}", "github": "", "project": "", "reviewers": "PTbL;WDuc;ZyAK;FuSa;ngyH", "pdf_size": 884767, "rating": "6;6;6;6;8", "confidence": "5;4;5;4;5", "soundness": "3;2;3;3;3", "contribution": "3;2;3;3;3", "presentation": "3;3;3;3;2", "wc_summary": "92;71;47;64;210", "wc_strengths": "53;66;50;69;115", "wc_weaknesses": "67;453;41;191;91", "wc_questions": "394;5;81;6;22", "wc_review": "606;595;219;330;438", "wc_reply_reviewers": "27;229;42;36;23", "wc_reply_authors": "1590;2841;922;513;889", "reply_reviewers": "1;2;1;1;1", "reply_authors": "5;6;3;3;3", "rating_avg": [ 6.4, 0.7999999999999999 ], "confidence_avg": [ 4.6, 0.48989794855663565 ], "soundness_avg": [ 2.8, 0.39999999999999997 ], "contribution_avg": [ 2.8, 0.39999999999999997 ], "presentation_avg": [ 2.8, 0.39999999999999997 ], "wc_summary_avg": [ 96.8, 58.410273069041544 ], "wc_strengths_avg": [ 70.6, 23.36321895629966 ], "wc_weaknesses_avg": [ 168.6, 151.00410590444218 ], "wc_questions_avg": [ 101.6, 148.81478421178454 ], "wc_review_avg": [ 437.6, 149.99813332171837 ], "wc_reply_reviewers_avg": [ 71.4, 79.08122406741059 ], "wc_reply_authors_avg": [ 1351.0, 821.8211484258603 ], "reply_reviewers_avg": [ 1.2, 0.4000000000000001 ], "reply_authors_avg": [ 4.0, 1.2649110640673518 ], "replies_avg": [ 35, 0 ], "authors#_avg": [ 10, 0 ], "corr_rating_confidence": 0.408248290463863, "gs_citation": 246, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=17294293173749479580&as_sdt=40005&sciodt=0,10&hl=en", "gs_version_total": 4, "openreview": 
"https://openreview.net/forum?id=8Wuvhh0LYW", "pdf": "https://openreview.net/pdf?id=8Wuvhh0LYW", "email": "pjlab.org.cn;xmu.edu.cn;cuhk.edu.hk;hku.hk;xmu.edu.cn;hku.hk;pjlab.org.cn;;;", "author_num": 10, "aff_unique_index": "0;1;2;3;1;3;0", "aff_unique_norm": "Shanghai AI Laboratory;Xiamen University;Chinese University of Hong Kong;University of Hong Kong", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.shanghai-ai-lab.com;https://www.xmu.edu.cn;https://www.cuhk.edu.hk;https://www.hku.hk", "aff_unique_abbr": "SAIL;XMU;CUHK;HKU", "aff_campus_unique_index": "1;1;1", "aff_campus_unique": ";Hong Kong SAR", "aff_country_unique_index": "0;0;0;0;0;0;0", "aff_country_unique": "China" }, { "id": "8XgCH9y1Bs", "title": "3D Object Representation Learning for Robust Classification and Pose estimation", "track": "main", "status": "Reject", "tldr": "", "abstract": "In this work, we pioneer a framework for 3D object representation learning that achieves exceptionally robust classification and pose estimation results. In particular, we introduce a 3D representation of object categories using a 3D template mesh composed of feature vectors at each mesh vertex. Our model predicts, for each pixel in a 2D image, a feature vector of the corresponding vertex in each category template mesh, hence establishing dense correspondences between image pixels and the 3D template geometry of all target object categories. The feature vectors on the mesh vertices are trained to be viewpoint invariant by leveraging associated camera poses. During inference, we efficiently estimate the object class and pose by matching the class-specific templates to a target feature map in a two-step process: First, we classify the image by matching the vertex features of each template to an input feature map. Interestingly, we found that image classification can be performed using the vertex features only and without requiring the 3D mesh geometry, hence making the class label inference very efficient. In a second step, the object pose can be inferred using a render-and-compare matching process that ensures spatial consistency between the detected vertices. Our experiments on image classification demonstrate that our proposed 3D object representation has a number of profound advantages over classical image-based representations. First, it is exceptionally robust on a range of real-world and synthetic out-of-distribution shifts while performing on par with state-of-the-art architectures on in-distribution data in terms of accuracy and speed. Second, the estimated object pose is competitive with baseline models that were explicitly designed for pose estimation, but that cannot classify images. 
Finally, we show that our model has an enhanced interpretability by visualizing the individual vertex matches and the ability to perform classification and pose estimation jointly and consistently.", "keywords": "classification;3D-pose estimation;analysis-by-synthesis;render-and-compare", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/d5fb8bce79d4790099daf4e95353a2977d370d9d.zip", "author": "Artur Jesslen;Guofeng Zhang;Angtian Wang;Alan Yuille;Adam Kortylewski", "authorids": "~Artur_Jesslen1;~Guofeng_Zhang4;~Angtian_Wang2;~Alan_Yuille1;~Adam_Kortylewski1", "gender": "M;M;M;M;", "homepage": "https://arturjssln.github.io;https://richard-guofeng-zhang.github.io/;https://angtianwang.github.io/;;https://gvrl.mpi-inf.mpg.de/", "dblp": "345/3057;;;y/AlanLYuille;161/0772", "google_scholar": ";vl0mzhEAAAAJ;YR7re-cAAAAJ;;https://scholar.google.ch/citations?user=tRLUOBIAAAAJ", "orcid": "0000-0002-4837-8163;;;;0000-0002-9146-4403", "linkedin": "artur-jesslen/;;;;", "or_profile": "~Artur_Jesslen1;~Guofeng_Zhang4;~Angtian_Wang2;~Alan_Yuille1;~Adam_Kortylewski1", "aff": "University of Freiburg, Albert-Ludwigs-Universit\u00e4t Freiburg;Johns Hopkins University;Johns Hopkins University;Johns Hopkins University;Albert-Ludwigs-Universit\u00e4t Freiburg", "aff_domain": "cs.uni-freiburg.de;jhu.edu;jhu.edu;johnshopkins.edu;uni-freiburg.de", "position": "PhD student;PhD student;PhD student;Full Professor;Research Group Leader", "bibtex": "@misc{\njesslen2024d,\ntitle={3D Object Representation Learning for Robust Classification and Pose estimation},\nauthor={Artur Jesslen and Guofeng Zhang and Angtian Wang and Alan Yuille and Adam Kortylewski},\nyear={2024},\nurl={https://openreview.net/forum?id=8XgCH9y1Bs}\n}", "github": "", "project": "", "reviewers": "LehM;35dn;Yc1n;wnbh", "site": "https://openreview.net/forum?id=8XgCH9y1Bs", "pdf_size": 10851286, "rating": "3;5;6;6", "confidence": "3;4;4;3", "soundness": "2;2;3;3", "contribution": "1;2;3;2", "presentation": "3;2;3;3", "wc_summary": "244;81;80;94", "wc_strengths": "83;46;71;54", "wc_weaknesses": "228;181;81;98", "wc_questions": "46;5;7;200", "wc_review": "601;313;239;446", "wc_reply_reviewers": "190;49;63;204", "wc_reply_authors": "876;734;313;1458", "reply_reviewers": "1;1;1;1", "reply_authors": "2;2;2;3", "rating_avg": [ 5.0, 1.224744871391589 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 124.75, 69.07016360194899 ], "wc_strengths_avg": [ 63.5, 14.430869689661812 ], "wc_weaknesses_avg": [ 147.0, 60.153969112603036 ], "wc_questions_avg": [ 64.5, 79.92027277230727 ], "wc_review_avg": [ 399.75, 137.84660859085363 ], "wc_reply_reviewers_avg": [ 126.5, 70.84666541200087 ], "wc_reply_authors_avg": [ 845.25, 409.9008264202452 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 2.25, 0.4330127018922193 ], "replies_avg": [ 21, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.40824829046386296, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:xO1UbHRLSTMJ:scholar.google.com/&scioq=3D+Object+Representation+Learning+for+Robust+Classification+and+Pose+estimation&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1;1;1;2", "aff_unique_norm": "University of Freiburg;Johns Hopkins University;Albert-Ludwigs-Universit\u00e4t Freiburg", "aff_unique_dep": ";;", "aff_unique_url": 
"https://www.uni-freiburg.de;https://www.jhu.edu;https://www.uni-freiburg.de", "aff_unique_abbr": "UoF;JHU;Albert-Ludwigs-Universit\u00e4t", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Freiburg;", "aff_country_unique_index": "0;1;1;1;0", "aff_country_unique": "Germany;United States" }, { "id": "8Xx0mKoCMd", "title": "ExoViP: Step-by-step Verification and Exploration with Exoskeleton Modules for Compositional Visual Reasoning", "track": "main", "status": "Reject", "tldr": "", "abstract": "Compositional visual reasoning methods, which translate a complex query into a structured composition of feasible visual tasks, have exhibited a strong potential in complicated multimodal tasks like visual question answering, language-guided image editing, etc. Empowered by recent advances in large language models (LLMs), this multimodal challenge has been brought to a new stage by treating LLMs as few-shot/zero-shot planners, i.e., visual-language programming.\nSuch methods, despite their numerous merits, suffer from challenges due to LLM planning mistakes or inaccuracy of visual execution modules, lagging behind the non-compositional models.\nIn this work, we devise a \"plug-and-play\" method, ExoViP, to correct the errors at both the planning and execution stages through introspective verification. We employ verification modules as \"exoskeletons\" to enhance current vision-language programming schemes. Specifically, our proposed verification module utilizes a mixture of three sub-verifiers to validate predictions after each reasoning step, subsequently calibrating the visual module predictions and refining the reasoning trace planned by LLMs. \nExperimental results on two representative vision-language programming methods showcase consistent improvements on five compositional reasoning tasks on standard benchmarks. 
In light of this, we believe ExoViP can foster better performance and generalization on open-domain multimodal challenges.", "keywords": "Compositional Reasoning;Multimodality", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/35577ec20819897a1094f0e7aaddda3b59f3bc9f.pdf", "author": "Yuxuan Wang;Alan Yuille;Zhuowan Li;Zilong Zheng", "authorids": "~Yuxuan_Wang4;~Alan_Yuille1;~Zhuowan_Li1;~Zilong_Zheng1", "gender": "M;M;F;M", "homepage": "https://github.com/patrick-tssn;;https://lizw14.github.io;http://zilongzheng.github.io", "dblp": ";y/AlanLYuille;228/6963;218/5234", "google_scholar": "jNCX2g0AAAAJ;;Fft1WvwAAAAJ;9sDx70IAAAAJ", "orcid": ";;;", "linkedin": ";;;", "or_profile": "~Yuxuan_Wang4;~Alan_Yuille1;~Zhuowan_Li1;~Zilong_Zheng1", "aff": "Beijing Institute for General Artificial Intelligence;Johns Hopkins University;Johns Hopkins University;Beijing Institute for General Artificial Intelligence", "aff_domain": "bigai.ai;johnshopkins.edu;jhu.edu;bigai.ai", "position": "Researcher;Full Professor;PhD student;Researcher", "bibtex": "@misc{\nwang2024exovip,\ntitle={ExoViP: Step-by-step Verification and Exploration with Exoskeleton Modules for Compositional Visual Reasoning},\nauthor={Yuxuan Wang and Alan Yuille and Zhuowan Li and Zilong Zheng},\nyear={2024},\nurl={https://openreview.net/forum?id=8Xx0mKoCMd}\n}", "github": "", "project": "", "reviewers": "atdm;2ndj;rVcU;Tiuv", "site": "https://openreview.net/forum?id=8Xx0mKoCMd", "pdf_size": 1944140, "rating": "5;5;6;6", "confidence": "3;5;2;3", "soundness": "2;4;4;3", "contribution": "2;2;4;3", "presentation": "2;3;3;3", "wc_summary": "81;90;74;113", "wc_strengths": "58;149;86;65", "wc_weaknesses": "299;202;30;134", "wc_questions": "133;162;2;202", "wc_review": "571;603;192;514", "wc_reply_reviewers": "0;66;0;48", "wc_reply_authors": "2112;1350;505;978", "reply_reviewers": "0;1;0;1", "reply_authors": "4;4;2;4", "rating_avg": [ 5.5, 0.5 ], "confidence_avg": [ 3.25, 1.0897247358851685 ], "soundness_avg": [ 3.25, 0.82915619758885 ], "contribution_avg": [ 2.75, 0.82915619758885 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 89.5, 14.705441169852742 ], "wc_strengths_avg": [ 89.5, 35.864327680858594 ], "wc_weaknesses_avg": [ 166.25, 98.11313622548207 ], "wc_questions_avg": [ 124.75, 74.9845817485168 ], "wc_review_avg": [ 470.0, 163.6383206953677 ], "wc_reply_reviewers_avg": [ 28.5, 29.201883500897676 ], "wc_reply_authors_avg": [ 1236.25, 587.64290815086 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 3.5, 0.8660254037844386 ], "replies_avg": [ 23, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.6882472016116854, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5136323398738501800&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 4, "aff_unique_index": "0;1;1;0", "aff_unique_norm": "Beijing Institute for General Artificial Intelligence;Johns Hopkins University", "aff_unique_dep": ";", "aff_unique_url": "http://www.bigaiai.org/;https://www.jhu.edu", "aff_unique_abbr": "BIGAI;JHU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;1;0", "aff_country_unique": "China;United States" }, { "id": "8ZW3oLNE0c", "title": "SEArch: A Self-Evolving Framework for Network Architecture Optimization", "track": "main", "status": "Reject", "tldr": "", "abstract": "This paper studies a fundamental network optimization problem that finds a network 
architecture with optimal performance (low losses) under given resource budgets (small parameter size and/or fast inference). Different from existing network optimization approaches such as network pruning, knowledge distillation (KD), and network architecture search (NAS), in this work we introduce a novel self-evolving pipeline to perform network optimization. In this framework, a simple network iteratively and adaptively modifies its structures by using the guidance from the teacher network, until it reaches the resource budget. An attention module is introduced to transfer the knowledge from teacher network to student network. The splitting edge scheme helps the student model find an optimal macro architecture. The proposed framework combines the advantages of pruning, KD, and NAS, and hence, can efficiently generate networks with flexible structure and desirable performance. Extensive experiments on CIFAR-10, CIFAR-100 and ImageNet demonstrated that our framework achieves state-of-the-art performance in this network architecture optimization task.", "keywords": "network architecture optimization;network pruning;knowledge distillation", "primary_area": "optimization", "supplementary_material": "", "author": "Yongqing Liang;Dawei Xiang;Xin Li", "authorids": "~Yongqing_Liang1;xiangdw@tamu.edu;~Xin_Li52", "gender": "M;;M", "homepage": "https://lyq.me/scholar;;https://people.tamu.edu/~xinli/", "dblp": ";;09/1365-3", "google_scholar": "bDo9RPwAAAAJ;;Begpk8wAAAAJ", "orcid": "0000-0002-7282-0476;;0000-0002-0144-9489", "linkedin": ";;xin-shane-li-31427443", "or_profile": "~Yongqing_Liang1;xiangdw@tamu.edu;~Xin_Li52", "aff": "Texas A&M University - College Station;;Texas A&M University - College Station", "aff_domain": "tamu.edu;;tamu.edu", "position": "PhD student;;Full Professor", "bibtex": "@misc{\nliang2024search,\ntitle={{SEA}rch: A Self-Evolving Framework for Network Architecture Optimization},\nauthor={Yongqing Liang and Dawei Xiang and Xin Li},\nyear={2024},\nurl={https://openreview.net/forum?id=8ZW3oLNE0c}\n}", "github": "", "project": "", "reviewers": "rdLr;6dDt;xUVA", "site": "https://openreview.net/forum?id=8ZW3oLNE0c", "pdf_size": 580495, "rating": "3;5;5", "confidence": "3;4;4", "soundness": "3;2;3", "contribution": "1;2;2", "presentation": "3;3;2", "wc_summary": "44;58;96", "wc_strengths": "31;48;29", "wc_weaknesses": "117;81;200", "wc_questions": "65;4;4", "wc_review": "257;191;329", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 4.333333333333333, 0.9428090415820634 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 1.6666666666666667, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 66.0, 21.96967607104544 ], "wc_strengths_avg": [ 36.0, 8.524474568362947 ], "wc_weaknesses_avg": [ 132.66666666666666, 49.828595092465626 ], "wc_questions_avg": [ 24.333333333333332, 28.755675768252935 ], "wc_review_avg": [ 259.0, 56.356011214421486 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.9999999999999998, "gs_citation": 0, "gs_cited_by_link": 
"https://scholar.google.com/scholar?q=related:bTBy1m-mvH8J:scholar.google.com/&scioq=SEArch:+A+Self-Evolving+Framework+for+Network+Architecture+Optimization&hl=en&as_sdt=0,33", "gs_version_total": 3, "aff_unique_index": "0;0", "aff_unique_norm": "Texas A&M University", "aff_unique_dep": "", "aff_unique_url": "https://www.tamu.edu", "aff_unique_abbr": "TAMU", "aff_campus_unique_index": "0;0", "aff_campus_unique": "College Station", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "id": "8ayoKVFmxp", "title": "QualEval: Qualitative Evaluation for Model Improvement", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Quantitative evaluation metrics have played a central role in measuring the progress of natural language systems (NLP) systems like large language models (LLMs) thus far, but they come with their own weaknesses. Given the complex and intricate nature of real-world tasks, a simple scalar to quantify and compare models is a gross trivialization of model behavior that ignores its idiosyncrasies. As a result, scalar evaluation metrics like accuracy make the actual model improvement process an arduous one. It currently involves a lot of manual effort which includes analyzing a large number of data points and making hit-or-miss changes to the training data or setup. This process is even more excruciating when this analysis needs to be performed on a cross-product of multiple models and datasets. In this work, we address the shortcomings of quantitative metrics by proposing our method QualEval, which enables automated qualitative evaluation as a vehicle for model improvement. QualEval provides a comprehensive dashboard with fine-grained analysis and human-readable insights to improve the model. We show that utilizing the dashboard generated by QualEval improves performance by up to 12% relatively on a variety of datasets, thus leading to agile model development cycles both on open-source and closed-source models and on a variety of setups like fine-tuning and in-context learning. In essence, QualEval serves as an automated data-scientist-in-a-box. 
Given the focus on critiquing and improving current evaluation metrics, our method serves as a refreshingly new technique towards both model evaluation and improvement.", "keywords": "qualitative evaluation;evaluation;framework", "primary_area": "visualization or interpretation of learned representations", "supplementary_material": "", "author": "Vishvak Murahari;Ameet Deshpande;Peter Clark;Tanmay Rajpurohit;Ashish Sabharwal;Karthik R Narasimhan;Ashwin Kalyan", "authorids": "~Vishvak_Murahari1;~Ameet_Deshpande1;~Peter_Clark1;~Tanmay_Rajpurohit1;~Ashish_Sabharwal1;~Karthik_R_Narasimhan1;~Ashwin_Kalyan6", "gender": "M;M;M;M;M;M;M", "homepage": "https://vishvakmurahari.com/;https://allenai.org/team/peterc;;;http://www.karthiknarasimhan.com;https://ameet-1997.github.io;http://ashwinkalyan.com/", "dblp": "249/5621;34/1184;;13/154;147/0322;220/4337;173/5217", "google_scholar": "Y_NYX7MAAAAJ;o-5vyEsAAAAJ;B4NztA8AAAAJ;7VspfeAAAAAJ;euc0GX4AAAAJ;332L1coAAAAJ;KYHL9aIAAAAJ", "orcid": ";;;;;;", "linkedin": ";peter-clark-a8b556/;tanmay-rajpurohit-b13942125/;ashish-sabharwal-82a2b661;;;", "or_profile": "~Vishvak_Murahari1;~Peter_Clark1;~Tanmay_Rajpurohit1;~Ashish_Sabharwal1;~Karthik_R_Narasimhan1;~Ameet_S_Deshpande1;~Ashwin_Kalyan_Vijayakumar1", "aff": "Princeton University;Allen Institute for Artificial Intelligence;Independent Researcher;Allen Institute for AI;Princeton University;Princeton University;Allen Institute for Artificial Intelligence", "aff_domain": "princeton.edu;allenai.org;tanmay.one;allenai.org;princeton.edu;princeton.edu;allenai.org", "position": "PhD student;Senior Research Manager;Researcher;Principal Researcher;Assistant Professor;PhD student;Research Scientist", "bibtex": "@misc{\nmurahari2024qualeval,\ntitle={QualEval: Qualitative Evaluation for Model Improvement},\nauthor={Vishvak Murahari and Ameet Deshpande and Peter Clark and Tanmay Rajpurohit and Ashish Sabharwal and Karthik R Narasimhan and Ashwin Kalyan},\nyear={2024},\nurl={https://openreview.net/forum?id=8ayoKVFmxp}\n}", "github": "", "project": "", "reviewers": "BTXw;hZVP;2Tzm", "site": "https://openreview.net/forum?id=8ayoKVFmxp", "pdf_size": 36036938, "rating": "1;3;3", "confidence": "4;2;4", "soundness": "1;3;3", "contribution": "2;3;2", "presentation": "2;2;3", "wc_summary": "46;53;89", "wc_strengths": "35;53;51", "wc_weaknesses": "298;139;151", "wc_questions": "6;30;38", "wc_review": "385;275;329", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 2.3333333333333335, 0.9428090415820634 ], "confidence_avg": [ 3.3333333333333335, 0.9428090415820634 ], "soundness_avg": [ 2.3333333333333335, 0.9428090415820634 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 62.666666666666664, 18.83849486792639 ], "wc_strengths_avg": [ 46.333333333333336, 8.055363982396383 ], "wc_weaknesses_avg": [ 196.0, 72.29107828771127 ], "wc_questions_avg": [ 24.666666666666668, 13.59738536958076 ], "wc_review_avg": [ 329.6666666666667, 44.90978611493144 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.5000000000000001, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=16924907597993779907&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "aff_unique_index": 
"0;1;2;3;0;0;1", "aff_unique_norm": "Princeton University;Allen Institute for Artificial Intelligence;Independent Researcher;Allen Institute for AI", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.princeton.edu;https://allenai.org;;https://allenai.org", "aff_unique_abbr": "Princeton;AI2;;AI2", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "United States;" }, { "id": "8cNMMrWRbZ", "title": "LMRL Gym: Benchmarks for Multi-Turn Reinforcement Learning with Language Models", "track": "main", "status": "Reject", "tldr": "", "abstract": "Large language models (LLMs) provide excellent text-generation capabilities, but standard prompting and generation methods generally do not lead to intentional or goal-directed agents and might necessitate considerable prompt tuning. This becomes particularly apparent in multi-turn conversations: even the best current LLMs rarely ask clarifying questions, engage in explicit information gathering, or take actions now that lead to better decisions after multiple turns. Reinforcement learning has the potential to leverage the powerful modeling capabilities of LLMs, as well as their internal representation of textual interactions, to create capable goal-directed language agents. This can enable intentional and temporally extended interactions, such as with humans, through coordinated persuasion and carefully crafted questions, or in goal-directed play through text games to bring about desired final outcomes. However, enabling this requires the community to develop stable and reliable reinforcement learning algorithms that can effectively train LLMs. Developing such algorithms requires tasks that can gauge progress on algorithm design, provide accessible and reproducible evaluations for multi-turn interactions, and cover a range of task properties and challenges in improving reinforcement learning algorithms. Our paper introduces the LMRL-Gym benchmark for evaluating multi-turn RL for LLMs, together with an open-source research framework containing a basic toolkit for getting started on multi-turn RL with offline value-based and policy-based RL methods. 
Our benchmark consists of 8 different language tasks, which require multiple rounds of language interaction and cover a range of tasks in open-ended dialogue and text games", "keywords": "benchmarks;RL;LLMs;offline reinforcement learning", "primary_area": "datasets and benchmarks", "supplementary_material": "/attachment/e4ee6cd1641958842d9b76d430bd3ef903f69b0b.zip", "author": "Marwa Abdulhai;Isadora White;Charlie Victor Snell;Charles Sun;Joey Hong;Yuexiang Zhai;Kelvin Xu;Sergey Levine", "authorids": "~Marwa_Abdulhai1;~Isadora_White1;~Charlie_Victor_Snell1;~Charles_Sun1;~Joey_Hong2;~Yuexiang_Zhai1;~Kelvin_Xu2;~Sergey_Levine1", "gender": ";Non-Binary;M;M;M;;Unspecified;M", "homepage": "https://abdulhaim.github.io/;https://icwhite.github.io/website/;https://sea-snell.github.io;https://charlesjsun.github.io/;;;http://kelvinxu.github.io/;https://people.eecs.berkeley.edu/~svlevine/", "dblp": "277/9482;;;;188/6056.html;241/6124.html;159/1894;80/7594", "google_scholar": ";https://scholar.google.com/citations?view_op=list_works;dD7EpwQAAAAJ;;SiBVfPUAAAAJ;78WTKm4AAAAJ;GyoKzFwAAAAJ;8R35rCwAAAAJ", "orcid": ";;;;;;;", "linkedin": ";isadora-c-white/;;;;;;", "or_profile": "~Marwa_Abdulhai1;~Isadora_White1;~Charlie_Victor_Snell1;~Charles_Sun1;~Joey_Hong2;~Yuexiang_Zhai1;~Kelvin_Xu2;~Sergey_Levine1", "aff": "University of California, Berkeley;University of California, Berkeley;University of California, Berkeley;University of California, Berkeley;University of California, Berkeley;University of California, Berkeley;University of California, Berkeley;Google", "aff_domain": "berkeley.edu;berkeley.edu;berkeley.edu;berkeley.edu;berkeley.edu;berkeley.edu;berkeley.edu;google.com", "position": "PhD student;Undergrad student;PhD student;Undergrad student;PhD student;PhD student;PhD student;Research Scientist", "bibtex": "@misc{\nabdulhai2024lmrl,\ntitle={{LMRL} Gym: Benchmarks for Multi-Turn Reinforcement Learning with Language Models},\nauthor={Marwa Abdulhai and Isadora White and Charlie Victor Snell and Charles Sun and Joey Hong and Yuexiang Zhai and Kelvin Xu and Sergey Levine},\nyear={2024},\nurl={https://openreview.net/forum?id=8cNMMrWRbZ}\n}", "github": "", "project": "", "reviewers": "6Fq6;2ASy;fFLM;BtsG", "site": "https://openreview.net/forum?id=8cNMMrWRbZ", "pdf_size": 1601889, "rating": "5;5;6;6", "confidence": "4;4;4;4", "soundness": "2;2;3;2", "contribution": "3;3;2;2", "presentation": "3;2;3;2", "wc_summary": "158;77;108;96", "wc_strengths": "32;129;116;54", "wc_weaknesses": "181;360;99;300", "wc_questions": "79;10;67;230", "wc_review": "450;576;390;680", "wc_reply_reviewers": "36;89;11;105", "wc_reply_authors": "1435;1235;581;925", "reply_reviewers": "1;1;1;1", "reply_authors": "4;4;3;4", "rating_avg": [ 5.5, 0.5 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 109.75, 29.969776442275975 ], "wc_strengths_avg": [ 82.75, 40.76380134383936 ], "wc_weaknesses_avg": [ 235.0, 101.56524996277024 ], "wc_questions_avg": [ 96.5, 81.36491873037176 ], "wc_review_avg": [ 524.0, 112.32987136109433 ], "wc_reply_reviewers_avg": [ 60.25, 38.21894163893082 ], "wc_reply_authors_avg": [ 1044.0, 323.2228333518534 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 3.75, 0.4330127018922193 ], "replies_avg": [ 25, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 34, "gs_cited_by_link": 
"https://scholar.google.com/scholar?cites=14634267088299559076&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 6, "aff_unique_index": "0;0;0;0;0;0;0;1", "aff_unique_norm": "University of California, Berkeley;Google", "aff_unique_dep": ";Google", "aff_unique_url": "https://www.berkeley.edu;https://www.google.com", "aff_unique_abbr": "UC Berkeley;Google", "aff_campus_unique_index": "0;0;0;0;0;0;0;1", "aff_campus_unique": "Berkeley;Mountain View", "aff_country_unique_index": "0;0;0;0;0;0;0;0", "aff_country_unique": "United States" }, { "title": "Uncertainty-aware Graph-based Hyperspectral Image Classification", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19322", "id": "8dN7gApKm3", "author_site": "Linlin Yu, Yifei Lou, Feng Chen", "tldr": "", "abstract": "Hyperspectral imaging (HSI) technology captures spectral information across a broad wavelength range, providing richer pixel features compared to traditional color images with only three channels. Although pixel classification in HSI has been extensively studied, especially using graph convolution neural networks (GCNs), quantifying epistemic and aleatoric uncertainties associated with the HSI classification (HSIC) results remains an unexplored area. These two uncertainties are effective for out-of-distribution (OOD) and misclassification detection, respectively. In this paper, we adapt two advanced uncertainty quantification models, evidential GCNs (EGCN) and graph posterior networks (GPN), designed for node classifications in graphs, into the realm of HSIC. We first reveal theoretically that a popular uncertainty cross-entropy (UCE) loss function is insufficient to produce good epistemic uncertainty when learning EGCNs. To mitigate the limitations, we propose two regularization terms. One leverages the inherent property of HSI data where each feature vector is a linear combination of the spectra signatures of the confounding materials, while the other is the total variation (TV) regularization to enforce the spatial smoothness of the evidence with edge-preserving. We demonstrate the effectiveness of the proposed regularization terms on both EGCN and GPN on three real-world HSIC datasets for OOD and misclassification detection tasks. 
The code is available at GitHub.", "keywords": "Uncertainty Quantification;Graph;Hyperspectral Image Classification", "primary_area": "probabilistic methods (Bayesian methods, variational inference, sampling, UQ, etc.)", "supplementary_material": "", "author": "Linlin Yu;Yifei Lou;Feng Chen", "authorids": "~Linlin_Yu1;~Yifei_Lou2;~Feng_Chen7", "gender": "F;F;M", "homepage": ";https://sites.google.com/site/louyifei/;https://personal.utdallas.edu/~fxc190007/", "dblp": "204/9716;;21/3047-1", "google_scholar": "https://scholar.google.com/citations?hl=en;iCiUflEAAAAJ;KOQ-SSYAAAAJ", "orcid": "0009-0001-5690-9905;0000-0003-1973-5704;", "linkedin": "linlin-yu-723884249/;;", "or_profile": "~Linlin_Yu1;~Yifei_Lou2;~Feng_Chen7", "aff": "The University of Texas at Dallas;University of North Carolina at Chapel Hill;University of Texas, Dallas", "aff_domain": "cs.utdallas.edu;unc.edu;utdallas.edu", "position": "PhD student;Associate Professor;Associate Professor", "bibtex": "@inproceedings{\nyu2024uncertaintyaware,\ntitle={Uncertainty-aware Graph-based Hyperspectral Image Classification},\nauthor={Linlin Yu and Yifei Lou and Feng Chen},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=8dN7gApKm3}\n}", "github": "", "project": "", "reviewers": "6WzU;pixa;NxUY;WkZQ;SyHe", "pdf_size": 1832303, "rating": "5;5;6;6;6", "confidence": "4;2;4;2;3", "soundness": "2;2;2;3;4", "contribution": "2;3;2;3;3", "presentation": "2;2;3;2;2", "wc_summary": "36;54;72;85;35", "wc_strengths": "60;28;69;74;60", "wc_weaknesses": "96;159;148;218;95", "wc_questions": "207;35;5;58;4", "wc_review": "399;276;294;435;194", "wc_reply_reviewers": "0;0;0;0;0", "wc_reply_authors": "1095;2237;884;698;1126", "reply_reviewers": "0;0;0;0;0", "reply_authors": "2;4;2;1;2", "rating_avg": [ 5.6, 0.48989794855663565 ], "confidence_avg": [ 3.0, 0.8944271909999159 ], "soundness_avg": [ 2.6, 0.8 ], "contribution_avg": [ 2.6, 0.4898979485566356 ], "presentation_avg": [ 2.2, 0.39999999999999997 ], "wc_summary_avg": [ 56.4, 19.7038067388005 ], "wc_strengths_avg": [ 58.2, 16.0299719276111 ], "wc_weaknesses_avg": [ 143.2, 45.64822011864208 ], "wc_questions_avg": [ 61.8, 75.34294923879739 ], "wc_review_avg": [ 319.6, 87.12427905010175 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 1208.0, 537.2913548532118 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 2.2, 0.9797958971132712 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 10, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=7656154241134560566&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=8dN7gApKm3", "pdf": "https://openreview.net/pdf?id=8dN7gApKm3", "email": "cs.utdallas.edu;unc.edu;utdallas.edu", "author_num": 3, "aff_unique_index": "0;1;0", "aff_unique_norm": "University of Texas at Dallas;University of North Carolina", "aff_unique_dep": ";", "aff_unique_url": "https://www.utdallas.edu;https://www.unc.edu", "aff_unique_abbr": "UT Dallas;UNC", "aff_campus_unique_index": "0;1;0", "aff_campus_unique": "Dallas;Chapel Hill", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "8dkp41et6U", "title": "LongLLMLingua: Accelerating and Enhancing LLMs in Long Context Scenarios via Prompt Compression", "track": "main", "status": "Reject", "tldr": "", "abstract": "In long context scenarios, large language models (LLMs) face three main challenges: 
higher computational/financial cost, longer latency, and inferior performance. Some studies reveal that the performance of LLMs depends on both the density and the position of the key information (question relevant) in the input prompt. Inspired by these findings, we propose LongLLMLingua for prompt compression towards improving LLMs\u2019 perception of the key information to simultaneously address the three challenges. We conduct evaluation on a wide range of long context scenarios including single-/multi-document QA, few-shot learning, summarization, synthetic tasks, and code completion, and experimental results show that the LongLLMLingua-compressed prompt can derive higher performance with much less cost. The latency of the end-to-end system is also reduced. For example, on the NaturalQuestions benchmark, LongLLMLingua gains a performance boost of up to 17.1% over the original prompt with \u223c4x fewer tokens as input to GPT-3.5-Turbo. It can derive cost savings of `$`28.5 and `$`27.4 per 1,000 samples from the LongBench and ZeroScrolls benchmarks, respectively. Additionally, when compressing prompts of \u223c10k tokens at a compression rate of 2x-10x, LongLLMLingua can speed up the end-to-end latency by 1.4x-3.8x.", "keywords": "Prompt Compression;Long Context;LLMs;Black-box LLMs;Efficient Method", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/a6731934d7958d6ae28a710aa9b4f8508ce1a21f.zip", "author": "Huiqiang Jiang;Qianhui Wu;Xufang Luo;Dongsheng Li;Chin-Yew Lin;Yuqing Yang;Lili Qiu", "authorids": "~Huiqiang_Jiang2;~Qianhui_Wu1;~Xufang_Luo1;~Dongsheng_Li2;~Chin-Yew_Lin1;~Yuqing_Yang1;~Lili_Qiu3", "gender": "M;F;F;M;M;;", "homepage": "https://hqjiang.com;https://qianhuiwu.github.io/;;http://recmind.cn;https://www.microsoft.com/en-us/research/people/cyl/;;https://www.microsoft.com/en-us/research/people/liliqiu/", "dblp": "204/2497;204/2307;218/7350;254/0830-2.html;64/6843;91/9064-1.html;", "google_scholar": "99KtvpYAAAAJ;BLZieokAAAAJ;;VNg5rA8AAAAJ;cDF07aYAAAAJ;4BtNQAEAAAAJ;", "orcid": "0000-0002-1327-4882;;;0000-0003-3103-8442;;0000-0003-3518-5212;", "linkedin": ";qianhui-wu-2b1608b7?originalSubdomain=cn;;;chin-yew-lin-32585a4;;", "or_profile": "~Huiqiang_Jiang2;~Qianhui_Wu1;~Xufang_Luo1;~Dongsheng_Li2;~Chin-Yew_Lin1;~Yuqing_Yang1;~Lili_Qiu3", "aff": "Microsoft;Microsoft;Microsoft Research;Microsoft Research Asia;Microsoft;Microsoft Research;University of Texas at Austin", "aff_domain": "microsoft.com;microsoft.com;microsoft.com;microsoft.com;microsoft.com;research.microsoft.com;utexas.edu", "position": "RSDE;Researcher;Researcher;Principal Researcher;Senior Principal Research Manager;Researcher;Full Professor", "bibtex": "@misc{\njiang2024longllmlingua,\ntitle={Long{LLML}ingua: Accelerating and Enhancing {LLM}s in Long Context Scenarios via Prompt Compression},\nauthor={Huiqiang Jiang and Qianhui Wu and Xufang Luo and Dongsheng Li and Chin-Yew Lin and Yuqing Yang and Lili Qiu},\nyear={2024},\nurl={https://openreview.net/forum?id=8dkp41et6U}\n}", "github": "", "project": "", "reviewers": "iM9S;jRw6;qdfA;PhaL;qC5x", "site": "https://openreview.net/forum?id=8dkp41et6U", "pdf_size": 2349383, "rating": "5;6;6;6;6", "confidence": "4;4;3;5;4", "soundness": "2;2;3;3;3", "contribution": "3;2;3;3;3", "presentation": "3;2;3;3;3", "wc_summary": "124;24;75;61;37", "wc_strengths": "64;56;34;69;61", "wc_weaknesses": "682;41;219;206;70", "wc_questions": "183;5;2;4;86", "wc_review": "1053;126;330;340;254", "wc_reply_reviewers": "0;16;12;15;0", 
"wc_reply_authors": "1186;127;161;373;447", "reply_reviewers": "0;1;1;1;0", "reply_authors": "2;1;1;1;1", "rating_avg": [ 5.8, 0.39999999999999997 ], "confidence_avg": [ 4.0, 0.6324555320336759 ], "soundness_avg": [ 2.6, 0.4898979485566356 ], "contribution_avg": [ 2.8, 0.39999999999999997 ], "presentation_avg": [ 2.8, 0.39999999999999997 ], "wc_summary_avg": [ 64.2, 34.81034329046469 ], "wc_strengths_avg": [ 56.8, 12.155657119218196 ], "wc_weaknesses_avg": [ 243.6, 230.3897567167429 ], "wc_questions_avg": [ 56.0, 71.06335201775947 ], "wc_review_avg": [ 420.6, 325.32420752228074 ], "wc_reply_reviewers_avg": [ 8.6, 7.1442284397967 ], "wc_reply_authors_avg": [ 458.8, 383.43103682409435 ], "reply_reviewers_avg": [ 0.6, 0.48989794855663565 ], "reply_authors_avg": [ 1.2, 0.4000000000000001 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 205, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=13295521544032790503&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 6, "aff_unique_index": "0;0;0;0;0;0;1", "aff_unique_norm": "Microsoft;University of Texas at Austin", "aff_unique_dep": "Microsoft Corporation;", "aff_unique_url": "https://www.microsoft.com;https://www.utexas.edu", "aff_unique_abbr": "Microsoft;UT Austin", "aff_campus_unique_index": "1;2", "aff_campus_unique": ";Asia;Austin", "aff_country_unique_index": "0;0;0;1;0;0;0", "aff_country_unique": "United States;China" }, { "title": "Prometheus: Inducing Fine-Grained Evaluation Capability in Language Models", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19321", "id": "8euJaTveKw", "author_site": "Seungone Kim, Jamin Shin, yejin cho, Joel Jang, Shayne Longpre, Hwaran Lee, Sangdoo Yun, Ryan, S Shin, Sungdong Kim, James Thorne, Minjoon Seo", "tldr": "", "abstract": "Recently, GPT-4 has become the de facto evaluator for long-form text generated by large language models (LLMs). However, for practitioners and researchers with large and custom evaluation tasks, GPT-4 is unreliable due to its closed-source nature, uncontrolled versioning, and prohibitive costs. In this work, we propose PROMETHEUS a fully open-source LLM that is on par with GPT-4\u2019s evaluation capabilities when the appropriate reference materials (reference answer, score rubric) are accompanied. For this purpose, we construct a new dataset \u2013 FEEDBACK COLLECTION \u2013 that consists of 1K fine-grained score rubrics, 20K instructions, and 100K natural language feedback generated by GPT-4. Using the FEEDBACK COLLECTION, we train PROMETHEUS, a 13B evaluation-specific LLM that can assess any given response based on novel and unseen score rubrics and reference materials provided by the user. Our dataset\u2019s versatility and diversity make our model generalize to challenging real-world criteria, such as prioritizing conciseness, child-readability, or varying levels of formality. We show that PROMETHEUS shows a stronger correlation with GPT-4 evaluation compared to ChatGPT on seven evaluation benchmarks (Two Feedback Collection testsets, MT Bench, Vicuna Bench, Flask Eval, MT Bench Human Judgment, and HHH Alignment), showing the efficacy of our model and dataset design. During human evaluation with hand-crafted score rubrics, PROMETHEUS shows a Pearson correlation of 0.897 with human evaluators, which is on par with GPT-4-0613 (0.882), and greatly outperforms ChatGPT (0.392). 
Remarkably, when assessing the quality of the generated feedback, PROMETHEUS demonstrates a win rate of 58.62% when compared to GPT-4 evaluation and a win rate of 79.57% when compared to ChatGPT evaluation. Our findings suggest that by adding reference materials and training on GPT-4 feedback, we can obtain effective open-source evaluator LMs.", "keywords": "automatic evaluation;large language models;llm-as-a-judge", "primary_area": "datasets and benchmarks", "supplementary_material": "/attachment/fba32c838c8e8307f5560e1966c2a1c1b9cd1c4e.zip", "author": "Seungone Kim;Jamin Shin;Yejin Cho;Joel Jang;Shayne Longpre;Hwaran Lee;Sangdoo Yun;Seongjin Shin;Sungdong Kim;James Thorne;Minjoon Seo", "authorids": "~Seungone_Kim1;~Jamin_Shin1;~Yejin_Cho2;~Joel_Jang1;~Shayne_Longpre1;~Hwaran_Lee1;~Sangdoo_Yun1;~Seongjin_Shin1;~Sungdong_Kim1;~James_Thorne1;~Minjoon_Seo1", "gender": "M;M;F;M;M;F;M;M;;;M", "homepage": "https://github.com/SeungoneKim;https://jayshin.xyz;https://github.com/bodhitrii?tab=repositories;https://joeljang.github.io/;https://www.shaynelongpre.com;https://hwaranlee.github.io;https://sangdooyun.github.io/;;;https://jamesthorne.com;https://seominjoon.github.io", "dblp": "324/2064.html;225/5387;;;190/7024;127/9475;124/3009.html;277/5169;118/1568;204/1380;149/1367", "google_scholar": "https://scholar.google.co.kr/citations?user=qEf3e3EAAAAJ;GuBHIwsAAAAJ;;xL-7eFEAAAAJ;ADd_YfkAAAAJ;https://scholar.google.co.kr/citations?user=Jf6padoAAAAJ;o0qtjzYAAAAJ;;xKrSnDoAAAAJ;hao9RrgAAAAJ;zYze5fIAAAAJ", "orcid": ";;;;;0000-0002-3773-4871;;;;;", "linkedin": "seungone-kim-09b551264/;jayshin94/;;joel-jang-1289331a5/;shayne-redford-longpre/;hwaranlee/;;businesssavior/;;;minjoon-seo/", "or_profile": "~Seungone_Kim1;~Jamin_Shin1;~Yejin_Cho2;~Joel_Jang1;~Shayne_Longpre1;~Hwaran_Lee1;~Sangdoo_Yun1;~Seongjin_Shin1;~Sungdong_Kim1;~James_Thorne1;~Minjoon_Seo1", "aff": "KAIST;NAVER;Korea Advanced Institute of Science & Technology;Department of Computer Science, University of Washington;Massachusetts Institute of Technology;NAVER AI Lab;NAVER;NAVER;NAVER;KAIST;Twelve Labs", "aff_domain": "ee.kaist.ac.kr;navercorp.com;kaist.edu;cs.washington.edu;mit.edu;navercorp.com;navercorp.com;navercorp.com;navercorp.com;kaist.ac.kr;twelvelabs.io", "position": "MS student;Research Scientist;MS student;PhD student;PhD student;Lead;Research Scientist;Researcher;Researcher;Assistant Professor;Chief Scientist", "bibtex": "@inproceedings{\nkim2024prometheus,\ntitle={Prometheus: Inducing Fine-Grained Evaluation Capability in Language Models},\nauthor={Seungone Kim and Jamin Shin and Yejin Cho and Joel Jang and Shayne Longpre and Hwaran Lee and Sangdoo Yun and Seongjin Shin and Sungdong Kim and James Thorne and Minjoon Seo},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=8euJaTveKw}\n}", "github": "", "project": "", "reviewers": "B7Vr;WpqT;LTFo;6KgK", "pdf_size": 11257046, "rating": "1;5;6;6", "confidence": "4;3;4;4", "soundness": "1;2;4;2", "contribution": "1;3;3;3", "presentation": "1;3;4;3", "wc_summary": "103;126;99;93", "wc_strengths": "5;91;92;33", "wc_weaknesses": "41;221;95;161", "wc_questions": "8;2;2;21", "wc_review": "157;440;288;308", "wc_reply_reviewers": "0;0;15;0", "wc_reply_authors": "1045;1249;1404;0", "reply_reviewers": "0;0;1;0", "reply_authors": "5;4;4;0", "rating_avg": [ 4.5, 2.0615528128088303 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.25, 1.0897247358851685 ], "contribution_avg": [ 2.5, 
0.8660254037844386 ], "presentation_avg": [ 2.75, 1.0897247358851685 ], "wc_summary_avg": [ 105.25, 12.497499749949988 ], "wc_strengths_avg": [ 55.25, 37.5790832778023 ], "wc_weaknesses_avg": [ 129.5, 67.79933627993714 ], "wc_questions_avg": [ 8.25, 7.75806032459145 ], "wc_review_avg": [ 298.25, 100.30547093753162 ], "wc_reply_reviewers_avg": [ 3.75, 6.49519052838329 ], "wc_reply_authors_avg": [ 924.5, 548.7351364729618 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 3.25, 1.920286436967152 ], "replies_avg": [ 21, 0 ], "authors#_avg": [ 11, 0 ], "corr_rating_confidence": -0.14002800840280097, "gs_citation": 193, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=4752804398290639678&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=8euJaTveKw", "pdf": "https://openreview.net/pdf?id=8euJaTveKw", "email": "ee.kaist.ac.kr;navercorp.com;kaist.edu;cs.washington.edu;mit.edu;navercorp.com;navercorp.com;navercorp.com;navercorp.com;kaist.ac.kr;twelvelabs.io", "author_num": 11, "aff_unique_index": "0;1;0;2;3;1;1;1;1;0;4", "aff_unique_norm": "Korea Advanced Institute of Science and Technology;NAVER Corporation;University of Washington;Massachusetts Institute of Technology;Twelve Labs", "aff_unique_dep": ";;Department of Computer Science;;", "aff_unique_url": "https://www.kaist.ac.kr;https://www.naver.com;https://www.washington.edu;https://web.mit.edu;https://twelvelabs.com", "aff_unique_abbr": "KAIST;NAVER;UW;MIT;", "aff_campus_unique_index": "1", "aff_campus_unique": ";Seattle", "aff_country_unique_index": "0;0;0;1;1;0;0;0;0;0;1", "aff_country_unique": "South Korea;United States" }, { "id": "8fJEOri51F", "title": "SSCBench: Monocular 3D Semantic Scene Completion Benchmark in Street Views", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Monocular scene understanding is a foundational component of autonomous systems. Within the spectrum of monocular perception topics, one crucial and useful task for holistic 3D scene understanding is semantic scene completion (SSC), which jointly completes semantic information and geometric details from RGB input. However, progress in SSC, particularly in large-scale street views, is hindered by the scarcity of high-quality datasets. To address this issue, we introduce SSCBench, a comprehensive benchmark that integrates scenes from widely used automotive datasets (e.g., KITTI-360, nuScenes, and Waymo). SSCBench follows an established setup and format in the community, facilitating the easy exploration of SSC methods in various street views. We benchmark models using monocular, trinocular, and point cloud input to assess the performance gap resulting from sensor coverage and modality. Moreover, we have unified semantic labels across diverse datasets to simplify cross-domain generalization testing. 
We commit to including more datasets and SSC models to drive further advancements in this field.", "keywords": "Semantic Scene Completion;Autonomous Driving", "primary_area": "datasets and benchmarks", "supplementary_material": "", "author": "Yiming Li;Sihang Li;Xinhao Liu;Moonjun Gong;Kenan Li;Nuo Chen;Zijun Wang;Zhiheng Li;Tao Jiang;Fisher Yu;Yue Wang;Hang Zhao;Zhiding Yu;Chen Feng", "authorids": "~Yiming_Li2;~Sihang_Li4;~Xinhao_Liu1;~Moonjun_Gong1;~Kenan_Li1;~Nuo_Chen6;~Zijun_Wang2;~Zhiheng_Li7;~Tao_Jiang11;~Fisher_Yu2;~Yue_Wang2;~Hang_Zhao1;~Zhiding_Yu1;~Chen_Feng2", "gender": "M;M;;;M;M;M;M;;M;M;M;;M", "homepage": "https://yimingli-page.github.io/;https://louis-leee.github.io/;https://gaaaavin.github.io/;;https://connorkevin.github.io/;https://nuochen1203.github.io/;;;;https://www.yf.io/;https://yuewang.xyz;http://www.mit.edu/~hangzhao/;;https://ai4ce.github.io/", "dblp": "l/YimingLi-3;;126/4582-3;;;135/5622-3;;;;117/6314;33/4822-41;;;01/161-2", "google_scholar": "https://scholar.google.com/citations?hl=en;90IoeJsAAAAJ;6pI4Xa4AAAAJ;;;https://scholar.google.com/citations?hl=en;;;;-XCiamcAAAAJ;v-AEFIEAAAAJ;DmahiOYAAAAJ;;YeG8ZM0AAAAJ", "orcid": "0000-0002-0157-6218;0000-0003-3053-5770;0000-0002-3036-0344;;;0009-0007-0581-0327;;;;;;;;0000-0003-3211-1576", "linkedin": "yiming-li-58b519173/;sihang-li-07724b267/;;;;;zijun-wang-083025193/;zhiheng-li-zl3466nyu/;;;;;;simbaforrest/", "or_profile": "~Yiming_Li2;~Sihang_Li4;~Xinhao_Liu1;~Moonjun_Gong1;~Kenan_Li1;~Nuo_Chen6;~Zijun_Wang2;~Zhiheng_Li7;~Tao_Jiang11;~Fisher_Yu2;~Yue_Wang2;~Hang_Zhao1;~Zhiding_Yu1;~Chen_Feng2", "aff": "New York University;New York University;New York University;;;New York University;Duke University;New York University;;Swiss Federal Institute of Technology;NVIDIA;Tsinghua University;;New York University", "aff_domain": "nyu.edu;nyu.edu;nyu.edu;;;nyu.edu;duke.edu;nyu.edu;;ethz.ch;nvidia.com;tsinghua.edu.cn;;nyu.edu", "position": "PhD student;PhD student;PhD student;;;MS student;MS student;Undergrad student;;Assistant Professor;Researcher;Assistant Professor;;Assistant Professor", "bibtex": "@misc{\nli2024sscbench,\ntitle={{SSCB}ench: Monocular 3D Semantic Scene Completion Benchmark in Street Views},\nauthor={Yiming Li and Sihang Li and Xinhao Liu and Moonjun Gong and Kenan Li and Nuo Chen and Zijun Wang and Zhiheng Li and Tao Jiang and Fisher Yu and Yue Wang and Hang Zhao and Zhiding Yu and Chen Feng},\nyear={2024},\nurl={https://openreview.net/forum?id=8fJEOri51F}\n}", "github": "", "project": "", "reviewers": "JQ2D;MTom;drPb;5Bcg", "site": "https://openreview.net/forum?id=8fJEOri51F", "pdf_size": 11668709, "rating": "5;5;5;8", "confidence": "4;4;4;3", "soundness": "3;3;3;3", "contribution": "2;2;3;3", "presentation": "3;3;2;4", "wc_summary": "45;59;33;94", "wc_strengths": "44;65;49;79", "wc_weaknesses": "227;300;230;21", "wc_questions": "63;81;10;84", "wc_review": "379;505;322;278", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 5.75, 1.299038105676658 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 57.75, 22.862359895688808 ], "wc_strengths_avg": [ 59.25, 13.790848414800301 ], "wc_weaknesses_avg": [ 194.5, 104.34198579670601 ], "wc_questions_avg": [ 59.5, 29.685855217594792 ], "wc_review_avg": [ 371.0, 85.24963343029692 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], 
"reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 14, 0 ], "corr_rating_confidence": -1.0, "gs_citation": 15, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10903902950978373793&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 2, "aff_unique_index": "0;0;0;0;1;0;2;3;4;0", "aff_unique_norm": "New York University;Duke University;Swiss Federal Institute of Technology;NVIDIA;Tsinghua University", "aff_unique_dep": ";;;NVIDIA Corporation;", "aff_unique_url": "https://www.nyu.edu;https://www.duke.edu;https://www.ethz.ch;https://www.nvidia.com;https://www.tsinghua.edu.cn", "aff_unique_abbr": "NYU;Duke;ETH Zurich;NVIDIA;THU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0;1;0;2;0", "aff_country_unique": "United States;Switzerland;China" }, { "id": "8fQlGQkj0S", "title": "A Theoretical Analysis of In-context Task Retrieval and Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "In-context learning (ICL) can be used for two different purposes: task retrieval and task learning.\nTask retrieval focuses on recalling a pre-trained task using examples from the task that closely approximates the target pre-trained task, while task learning involves learning a task using in-context examples.\nTo rigorously analyze these two modes, we propose generative models for both pretraining data and in-context samples.\nAssuming we use our proposed models and consider the mean squared error as a risk measure, we demonstrate that in-context prediction using a Bayes-optimal next-token predictor equates to the posterior mean of the label, conditioned on in-context samples.\nFrom this equivalence, we derive risk upper bounds for in-context learning.\nWe reveal a unique phenomenon in task retrieval: as the number of in-context samples increases, the risk upper bound decreases initially and then increases subsequently.\nThis implies that more in-context examples could potentially worsen task retrieval.\nWe validate our analysis with numerical computations in various scenarios and validate that our findings are replicable in the actual Transformer model implementation.", "keywords": "In-context Learning;Task Learning;Task Retrieval;Bayesian Inference;Noisy Linear Regression", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/2cc5080d6e6e6417844b1b5182590f4a19145080.pdf", "author": "Ziqian Lin;Kangwook Lee", "authorids": "~Ziqian_Lin1;~Kangwook_Lee1", "gender": "M;M", "homepage": "https://myhakureimu.github.io/;http://kangwooklee.com/", "dblp": "245/3453;88/9826-1", "google_scholar": "0nOdbCoAAAAJ;sCEl8r-n5VEC", "orcid": ";", "linkedin": ";", "or_profile": "~Ziqian_Lin1;~Kangwook_Lee1", "aff": "University of Wisconsin - Madison;KRAFTON", "aff_domain": "wisc.edu;krafton.com", "position": "PhD student;Researcher", "bibtex": "@misc{\nlin2024a,\ntitle={A Theoretical Analysis of In-context Task Retrieval and Learning},\nauthor={Ziqian Lin and Kangwook Lee},\nyear={2024},\nurl={https://openreview.net/forum?id=8fQlGQkj0S}\n}", "github": "", "project": "", "reviewers": "v8Fu;KzaL;ZoJM;4TUM;8Pgy", "site": "https://openreview.net/forum?id=8fQlGQkj0S", "pdf_size": 1271038, "rating": "3;5;6;6;6", "confidence": "3;4;3;2;3", "soundness": "2;3;3;3;4", "contribution": "2;2;3;3;3", "presentation": "2;3;3;3;2", "wc_summary": "79;69;81;105;124", "wc_strengths": "34;31;48;71;94", "wc_weaknesses": 
"221;147;61;60;142", "wc_questions": "14;6;1;145;4", "wc_review": "348;253;191;381;364", "wc_reply_reviewers": "0;0;0;0;0", "wc_reply_authors": "759;686;135;566;382", "reply_reviewers": "0;0;0;0;0", "reply_authors": "1;1;1;1;1", "rating_avg": [ 5.2, 1.16619037896906 ], "confidence_avg": [ 3.0, 0.6324555320336759 ], "soundness_avg": [ 3.0, 0.6324555320336759 ], "contribution_avg": [ 2.6, 0.4898979485566356 ], "presentation_avg": [ 2.6, 0.4898979485566356 ], "wc_summary_avg": [ 91.6, 20.05592181875468 ], "wc_strengths_avg": [ 55.6, 23.83778513201258 ], "wc_weaknesses_avg": [ 126.2, 60.50256192922742 ], "wc_questions_avg": [ 34.0, 55.666866267107224 ], "wc_review_avg": [ 307.4, 73.1808718177093 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 505.6, 224.95564007154832 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.2711630722733202, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:VUKWRZU-hyYJ:scholar.google.com/&scioq=A+Theoretical+Analysis+of+In-context+Task+Retrieval+and+Learning&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1", "aff_unique_norm": "University of Wisconsin-Madison;KRAFTON Inc.", "aff_unique_dep": ";", "aff_unique_url": "https://www.wisc.edu;https://www.krafton.com", "aff_unique_abbr": "UW-Madison;KRAFTON", "aff_campus_unique_index": "0", "aff_campus_unique": "Madison;", "aff_country_unique_index": "0;1", "aff_country_unique": "United States;South Korea" }, { "title": "Amortized Network Intervention to Steer the Excitatory Point Processes", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19320", "id": "8g26Yv1EOu", "author_site": "Zitao Song, Wendi Ren, Shuang Li", "tldr": "", "abstract": "Excitatory point processes (i.e., event flows) occurring over dynamic graphs (i.e., evolving topologies) provide a fine-grained model to capture how discrete events may spread over time and space. How to effectively steer the event flows by modifying the dynamic graph structures presents an interesting problem, motivated by curbing the spread of infectious diseases through strategically locking down cities to mitigating traffic congestion via traffic light optimization. To address the intricacies of planning and overcome the high dimensionality inherent to such decision-making problems, we design an Amortized Network Interventions (ANI) framework, allowing for the pooling of optimal policies from history and other contexts while ensuring a permutation equivalent property. This property enables efficient knowledge transfer and sharing across diverse contexts. Each task is solved by an H-step lookahead model-based reinforcement learning, where neural ODEs are introduced to model the dynamics of the excitatory point processes. Instead of simulating rollouts from the dynamics model, we derive an analytical mean-field approximation for the event flows given the dynamics, making the online planning more efficiently solvable. 
We empirically illustrate that this ANI approach substantially enhances policy learning for unseen dynamics and exhibits promising outcomes in steering event flows through network intervention using synthetic and real COVID datasets.", "keywords": "Time series application;Point Process;Amortized Learning", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/3169788ddf13a20386755c976fece7fa1bc6f6ac.pdf", "author": "Zitao Song;Wendi Ren;Shuang Li", "authorids": "~Zitao_Song1;~Wendi_Ren1;~Shuang_Li3", "gender": "M;F;F", "homepage": "https://tsedao.github.io/;;https://shuangli01.github.io", "dblp": ";218/8905;43/6294-2", "google_scholar": "RATrbJUAAAAJ;V0vQt1YAAAAJ;https://scholar.google.com/citations?hl=en", "orcid": "0000-0003-4646-0339;;", "linkedin": ";wendiren-gatech/;", "or_profile": "~Zitao_Song1;~Wendi_Ren1;~Shuang_Li3", "aff": "Nanyang Technological University;The Chinese University of Hong Kong;The Chinese University of Hong Kong (Shenzhen)", "aff_domain": "ntu.edu.sg;cuhk.edu.cn;cuhk.edu.cn", "position": "Researcher;PhD student;Assistant Professor", "bibtex": "@inproceedings{\nsong2024amortized,\ntitle={Amortized Network Intervention to Steer the Excitatory Point Processes},\nauthor={Zitao Song and Wendi Ren and Shuang Li},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=8g26Yv1EOu}\n}", "github": "", "project": "", "reviewers": "ya7t;9miN;hvRi;YqcV", "pdf_size": 4978040, "rating": "5;5;6;6", "confidence": "3;2;3;4", "soundness": "2;3;3;3", "contribution": "2;2;3;3", "presentation": "3;2;3;3", "wc_summary": "51;132;116;66", "wc_strengths": "83;68;33;14", "wc_weaknesses": "38;157;32;27", "wc_questions": "70;40;12;357", "wc_review": "242;397;193;464", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "896;568;561;690", "reply_reviewers": "0;0;0;0", "reply_authors": "3;2;2;2", "rating_avg": [ 5.5, 0.5 ], "confidence_avg": [ 3.0, 0.7071067811865476 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 91.25, 33.65542303997975 ], "wc_strengths_avg": [ 49.5, 27.37243138634199 ], "wc_weaknesses_avg": [ 63.5, 54.12254613375095 ], "wc_questions_avg": [ 119.75, 138.50338443518265 ], "wc_review_avg": [ 324.0, 110.46945279125809 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 678.75, 135.51268390818626 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 2.25, 0.4330127018922193 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.7071067811865475, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:zZ3BY3ZTVrYJ:scholar.google.com/&scioq=Amortized+Network+Intervention+to+Steer+the+Excitatory+Point+Processes&hl=en&as_sdt=0,48", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=8g26Yv1EOu", "pdf": "https://openreview.net/pdf?id=8g26Yv1EOu", "email": "ntu.edu.sg;cuhk.edu.cn;cuhk.edu.cn", "author_num": 3, "aff_unique_index": "0;1;1", "aff_unique_norm": "Nanyang Technological University;Chinese University of Hong Kong", "aff_unique_dep": ";", "aff_unique_url": "https://www.ntu.edu.sg;https://www.cuhk.edu.hk", "aff_unique_abbr": "NTU;CUHK", "aff_campus_unique_index": "1;2", "aff_campus_unique": ";Hong Kong SAR;Shenzhen", "aff_country_unique_index": "0;1;1", "aff_country_unique": "Singapore;China" }, { "id": "8gZtt8nrpI", "title": "Diffusion Models With 
Learned Adaptive Noise Processes", "track": "main", "status": "Reject", "tldr": "", "abstract": "Diffusion models have gained traction as powerful algorithms for synthesizing high-quality images. Central to these algorithms is the diffusion process, which maps data to noise according to equations inspired by thermodynamics, and which can significantly impact performance. In this work, we explore whether a diffusion process can be learned from data. We propose multivariate learned adaptive noise (MULAN), a learned diffusion process that applies Gaussian noise at different rates across an image. Our method consists of three components\u2014a multivariate noise schedule, instance-conditional diffusion, and auxiliary variables\u2014which ensure that the learning objective is no longer invariant to the choice of noise schedule as in previous works. Our work is grounded in Bayesian inference and casts the learned diffusion process as an approximate variational posterior that yields a tighter lower bound on marginal likelihood. Empirically, MULAN significantly improves likelihood estimation on CIFAR10 and ImageNet, and achieves ~2x faster convergence to state-of-the-art performance compared to classical diffusion.", "keywords": "Generative Modeling;Diffusion Models;likelihood;Noising Schedule", "primary_area": "generative models", "supplementary_material": "", "author": "Subham Sekhar Sahoo;Aaron Gokaslan;Christopher De Sa;Volodymyr Kuleshov", "authorids": "~Subham_Sekhar_Sahoo1;~Aaron_Gokaslan1;~Christopher_De_Sa2;~Volodymyr_Kuleshov1", "gender": "M;M;;M", "homepage": ";https://skylion007.github.io/;https://www.cs.cornell.edu/~kuleshov/;http://cs.cornell.edu/~cdesa", "dblp": ";220/6816;81/8612;154/6336", "google_scholar": "Z7DoDbAAAAAJ;Mt2wyL4AAAAJ;RY_t8XAAAAAJ;", "orcid": ";0000-0002-3575-2961;;", "linkedin": "shakeh3r/;aarongokaslan/;;", "or_profile": "~Subham_Sekhar_Sahoo1;~Aaron_Gokaslan1;~Volodymyr_Kuleshov1;~Christopher_De_Sa1", "aff": "Department of Computer Science, Cornell University;Cornell University;Cornell University;Cornell University", "aff_domain": "cs.cornell.edu;cornell.edu;cornell.edu;cornell.edu", "position": "PhD student;PhD student;Assistant Professor;Assistant Professor", "bibtex": "@misc{\nsahoo2024diffusion,\ntitle={Diffusion Models With Learned Adaptive Noise Processes},\nauthor={Subham Sekhar Sahoo and Aaron Gokaslan and Christopher De Sa and Volodymyr Kuleshov},\nyear={2024},\nurl={https://openreview.net/forum?id=8gZtt8nrpI}\n}", "github": "", "project": "", "reviewers": "U1Ra;oSn9;aHz6;PeVN", "site": "https://openreview.net/forum?id=8gZtt8nrpI", "pdf_size": 4573487, "rating": "5;5;6;6", "confidence": "3;4;3;4", "soundness": "2;2;3;3", "contribution": "2;3;2;3", "presentation": "2;3;3;3", "wc_summary": "35;75;38;114", "wc_strengths": "124;25;21;149", "wc_weaknesses": "310;111;97;326", "wc_questions": "138;53;48;13", "wc_review": "607;264;204;602", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "976;558;690;638", "reply_reviewers": "0;0;0;0", "reply_authors": "2;1;1;1", "rating_avg": [ 5.5, 0.5 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 65.5, 32.12864765283469 ], "wc_strengths_avg": [ 79.75, 57.451610073173754 ], "wc_weaknesses_avg": [ 211.0, 107.26369376447933 ], "wc_questions_avg": [ 63.0, 45.96194077712559 ], "wc_review_avg": [ 419.25, 186.4689987638696 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 715.5, 
157.577758582866 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:hTKfdIOIfGAJ:scholar.google.com/&scioq=Diffusion+Models+With+Learned+Adaptive+Noise+Processes&hl=en&as_sdt=0,33", "gs_version_total": 2, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "Cornell University", "aff_unique_dep": "Department of Computer Science", "aff_unique_url": "https://www.cornell.edu", "aff_unique_abbr": "Cornell", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "id": "8giiPtg6rw", "title": "DataFreeShield: Defending Adversarial Attacks without Training Data", "track": "main", "status": "Reject", "tldr": "", "abstract": "Recent advances in adversarial robustness rely on an abundant set of training data, where using external or additional datasets has become a common setting.\nHowever, due to security and privacy issues, it is more common that a pretrained model is available while the dataset is not.\nIn such a scenario, existing methods that assume accessibility to the original data become inapplicable.\nFor the first time, we propose a problem of learning *data-free adversarial robustness*, where given only a pretrained model, adversarial robustness should be achieved without accessing the training dataset.\nIn our preliminary study, we identify that robustness without the original dataset is difficult to achieve, even with similar domain datasets.\nWe tackle the task from two perspectives: surrogate dataset generation and adversarial training using the generated data.\nFor dataset generation, we propose diversified sample synthesis, which largely enhances the diversity of synthetic samples that are known to have low coverage. \nFor training, we propose a soft label loss that best learns robustness from noisy synthetic samples and a gradient refinement method toward smoother loss surface. 
\nExtensively validating methods using four datasets, we show that the proposed solution outperforms several baselines, demonstrating that the proposed method sets the first solution for the data-free robustness problem.", "keywords": "Data-free;Adversarial Robustness;Adversarial Training", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/0fc4fd221918f07afe3bc4bc764d6743e67677e1.zip", "author": "Hyeyoon Lee;Kanghyun Choi;Dain Kwon;SunJong Park;Mayoore Selvarasa Jaiswal;Noseong Park;Jonghyun Choi;Jinho Lee", "authorids": "~Hyeyoon_Lee1;~Kanghyun_Choi1;~Dain_Kwon1;~SunJong_Park1;~Mayoore_Selvarasa_Jaiswal1;~Noseong_Park1;~Jonghyun_Choi1;~Jinho_Lee2", "gender": ";M;F;;F;;M;M", "homepage": "https://aisys.snu.ac.kr/members/HyeyoonLee.html;https://aisys.snu.ac.kr/kanghyun.html;https://github.com/meowrowan;;mayoore.github.io;;https://ppolon.github.io/;http://acsys.snu.ac.kr/people.html", "dblp": "276/0074;229/7353;380/6008;;http://dblp.uni-trier.de/pers/hd/j/Jaiswal:Mayoore_S=;;21/11103;", "google_scholar": "lYXg5nsAAAAJ;n9e6qnsAAAAJ;;;IcMxiP4AAAAJ;;uiGWnm4AAAAJ;https://scholar.google.com/citations?hl=ko", "orcid": ";;;;;;0000-0002-7934-8434;", "linkedin": ";;;;;;jonghyun-choi-459bb615/;", "or_profile": "~Hyeyoon_Lee1;~Kanghyun_Choi1;~Dain_Kwon1;~SunJong_Park1;~Mayoore_Selvarasa_Jaiswal1;~Noseong_Park1;~Jonghyun_Choi1;~Jinho_Lee2", "aff": "Seoul National University;Seoul National University;Yonsei University;;University of Washington;;Yonsei University;Seoul National University", "aff_domain": "snu.ac.kr;snu.ac.kr;yonsei.ac.kr;; ;;yonsei.ac.kr;snu.ac.kr", "position": "PhD student;PhD student;Undergrad student;;Graduate Student;;Associate Professor;Associate Professor", "bibtex": "@misc{\nlee2024datafreeshield,\ntitle={DataFreeShield: Defending Adversarial Attacks without Training Data},\nauthor={Hyeyoon Lee and Kanghyun Choi and Dain Kwon and SunJong Park and Mayoore Selvarasa Jaiswal and Noseong Park and Jonghyun Choi and Jinho Lee},\nyear={2024},\nurl={https://openreview.net/forum?id=8giiPtg6rw}\n}", "github": "", "project": "", "reviewers": "F6PX;nfcV;RMmq", "site": "https://openreview.net/forum?id=8giiPtg6rw", "pdf_size": 15521882, "rating": "3;5;5", "confidence": "4;4;4", "soundness": "2;4;2", "contribution": "2;3;2", "presentation": "3;3;2", "wc_summary": "101;48;36", "wc_strengths": "115;42;29", "wc_weaknesses": "712;134;152", "wc_questions": "191;2;2", "wc_review": "1119;226;219", "wc_reply_reviewers": "0;0;43", "wc_reply_authors": "1888;710;1258", "reply_reviewers": "0;0;1", "reply_authors": "4;2;3", "rating_avg": [ 4.333333333333333, 0.9428090415820634 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.6666666666666665, 0.9428090415820634 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 61.666666666666664, 28.241026106633512 ], "wc_strengths_avg": [ 62.0, 37.85058343892029 ], "wc_weaknesses_avg": [ 332.6666666666667, 268.3298136415126 ], "wc_questions_avg": [ 65.0, 89.09545442950498 ], "wc_review_avg": [ 521.3333333333334, 422.62381486244817 ], "wc_reply_reviewers_avg": [ 14.333333333333334, 20.27039439401436 ], "wc_reply_authors_avg": [ 1285.3333333333333, 481.30470829010414 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 3.0, 0.816496580927726 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 2, "gs_cited_by_link": 
"https://scholar.google.com/scholar?cites=16114210221793948933&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 9, "aff_unique_index": "0;0;1;2;1;0", "aff_unique_norm": "Seoul National University;Yonsei University;University of Washington", "aff_unique_dep": ";;", "aff_unique_url": "https://www.snu.ac.kr;https://www.yonsei.ac.kr;https://www.washington.edu", "aff_unique_abbr": "SNU;Yonsei;UW", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;1;0;0", "aff_country_unique": "South Korea;United States" }, { "id": "8hc2UvwTaL", "title": "FLAIM: AIM-based Synthetic Data Generation in the Federated Setting", "track": "main", "status": "Reject", "tldr": "", "abstract": "Preserving individual privacy while enabling collaborative data sharing is crucial for organizations. Synthetic data generation is one solution, producing artificial data that mirrors the statistical properties of private data. While numerous techniques have been devised under differential privacy, they predominantly assume data is centralized. However, data is often distributed across multiple clients in a federated manner. In this work, we initiate the study of federated synthetic tabular data generation. Building upon a SOTA central method known as AIM, we present DistAIM and FLAIM. We show it is straightforward to distribute AIM, extending a recent approach based on secure multi-party computation which necessitates additional overhead, making it less suited to federated scenarios. We then demonstrate that naively federating AIM can lead to substantial degradation in utility under the presence of heterogeneity. To mitigate both issues, we propose an augmented FLAIM approach that maintains a private proxy of heterogeneity. We simulate our methods across a range of benchmark datasets under different degrees of heterogeneity and show this can improve utility while reducing overhead.", "keywords": "Synthetic Data;Differential Privacy;Federated Learning", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "Samuel Maddock;Graham Cormode;carsten maple", "authorids": "~Samuel_Maddock1;~Graham_Cormode1;~carsten_maple1", "gender": "M;M;", "homepage": "https://warwick.ac.uk/fac/sci/dcs/people/u1714078/;http://dimacs.rutgers.edu/~graham/;https://warwick.ac.uk/fac/sci/wmg/people/profile/?wmgid=1102", "dblp": "289/1670;c/GrahamCormode;05/2263.html", "google_scholar": "ohQy__cAAAAJ;https://scholar.google.co.uk/citations?user=gpLVKmEAAAAJ;8MMdv50AAAAJ", "orcid": ";0000-0002-0698-0922;0000-0002-4715-212X", "linkedin": "samuel-maddock/;;", "or_profile": "~Samuel_Maddock1;~Graham_Cormode1;~carsten_maple1", "aff": "University of Warwick;The university of Warwick;The university of Warwick", "aff_domain": "warwick.ac.uk;warwick.ac.uk;warwick.ac.uk", "position": "PhD student;Full Professor;Full Professor", "bibtex": "@misc{\nmaddock2024flaim,\ntitle={{FLAIM}: {AIM}-based Synthetic Data Generation in the Federated Setting},\nauthor={Samuel Maddock and Graham Cormode and carsten maple},\nyear={2024},\nurl={https://openreview.net/forum?id=8hc2UvwTaL}\n}", "github": "", "project": "", "reviewers": "DXga;B23T;gW6i", "site": "https://openreview.net/forum?id=8hc2UvwTaL", "pdf_size": 7555006, "rating": "3;3;8", "confidence": "3;5;3", "soundness": "2;3;3", "contribution": "2;1;2", "presentation": "2;2;3", "wc_summary": "76;129;150", "wc_strengths": "55;60;19", "wc_weaknesses": "156;64;23", "wc_questions": "149;28;19", "wc_review": "436;281;211", 
"wc_reply_reviewers": "0;0;0", "wc_reply_authors": "1415;760;245", "reply_reviewers": "0;0;0", "reply_authors": "2;1;1", "rating_avg": [ 4.666666666666667, 2.357022603955158 ], "confidence_avg": [ 3.6666666666666665, 0.9428090415820634 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 1.6666666666666667, 0.4714045207910317 ], "presentation_avg": [ 2.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 118.33333333333333, 31.13768706175132 ], "wc_strengths_avg": [ 44.666666666666664, 18.263503375736967 ], "wc_weaknesses_avg": [ 81.0, 55.61174935808679 ], "wc_questions_avg": [ 65.33333333333333, 59.275252471461954 ], "wc_review_avg": [ 309.3333333333333, 94.0153651744697 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 806.6666666666666, 478.78898158676213 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.3333333333333333, 0.4714045207910317 ], "replies_avg": [ 10, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.5, "gs_citation": 6, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=2418353014466619100&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 7, "aff_unique_index": "0;0;0", "aff_unique_norm": "University of Warwick", "aff_unique_dep": "", "aff_unique_url": "https://www.warwick.ac.uk", "aff_unique_abbr": "Warwick", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United Kingdom" }, { "title": "Neural Auto-designer for Enhanced Quantum Kernels", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19319", "id": "8htNAnMSyP", "author_site": "Cong Lei, Yuxuan Du, Peng Mi, Jun Yu, Tongliang Liu", "tldr": "", "abstract": "Quantum kernels hold great promise for offering computational advantages over classical learners, with the effectiveness of these kernels closely tied to the design of the feature map. However, the challenge of designing effective quantum feature maps for real-world datasets, particularly in the absence of sufficient prior information, remains a significant obstacle. In this study, we present a data-driven approach that automates the design of problem-specific quantum feature maps. Our approach leverages feature-selection techniques to handle high-dimensional data on near-term quantum machines with limited qubits, and incorporates a deep neural predictor to efficiently evaluate the performance of various candidate quantum kernels. Through extensive numerical simulations on different datasets, we demonstrate the superiority of our proposal over prior methods, especially for the capability of eliminating the kernel concentration issue and identifying the feature map with prediction advantages. 
Our work not only unlocks the potential of quantum kernels for enhancing real-world tasks, but also highlights the substantial role of deep learning in advancing quantum machine learning.", "keywords": "Quantum machine learning;kernel learning;quantum kernels;feature map;quantum circuit design", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Cong Lei;Yuxuan Du;Peng Mi;Jun Yu;Tongliang Liu", "authorids": "~Cong_Lei2;~Yuxuan_Du2;~Peng_Mi1;~Jun_Yu3;~Tongliang_Liu1", "gender": ";M;M;M;M", "homepage": "https://cong-lei.github.io/;https://github.com/yuxuan-du/Yuxuan-Du.github.io;https://www.github.com/Mi-Peng;https://faculty.ustc.edu.cn/yujun_AI/en/index.htm;https://tongliang-liu.github.io/", "dblp": "205/7609;;;50/5754-1.html;150/6667", "google_scholar": ";https://scholar.google.com.au/citations?user=50sFkzIAAAAJ;PTM4HCsAAAAJ;efZyqyQAAAAJ;https://scholar.google.com.au/citations?user=EiLdZ_YAAAAJ", "orcid": "0000-0003-2522-1152;0000-0002-1193-9756;;0000-0002-3197-8103;", "linkedin": ";;;;", "or_profile": "~Cong_Lei2;~Yuxuan_Du2;~Peng_Mi1;~Jun_Yu3;~Tongliang_Liu1", "aff": "University of Sydney;JD.com;;University of Science and Technology of China;Mohamed bin Zayed University of Artificial Intelligence", "aff_domain": "usyd.edu.au;jd.com;;ustc.edu.cn;mbzuai.ac.ae", "position": "PhD student;Researcher;;Associate Professor;Affiliated Associate Professor", "bibtex": "@inproceedings{\nlei2024neural,\ntitle={Neural Auto-designer for Enhanced Quantum Kernels},\nauthor={Cong Lei and Yuxuan Du and Peng Mi and Jun Yu and Tongliang Liu},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=8htNAnMSyP}\n}", "github": "", "project": "", "reviewers": "3hUP;oLos;FSEH;e6Tr", "pdf_size": 4287919, "rating": "3;6;6;6", "confidence": "5;5;4;4", "soundness": "2;2;3;2", "contribution": "1;2;3;2", "presentation": "3;3;3;3", "wc_summary": "85;46;100;51", "wc_strengths": "8;49;103;45", "wc_weaknesses": "242;139;384;163", "wc_questions": "5;53;4;35", "wc_review": "340;287;591;294", "wc_reply_reviewers": "770;53;470;11", "wc_reply_authors": "1773;1890;3165;2050", "reply_reviewers": "2;1;2;1", "reply_authors": "6;7;7;5", "rating_avg": [ 5.25, 1.299038105676658 ], "confidence_avg": [ 4.5, 0.5 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 70.5, 22.699118925632334 ], "wc_strengths_avg": [ 51.25, 33.88491552298751 ], "wc_weaknesses_avg": [ 232.0, 95.67392539244953 ], "wc_questions_avg": [ 24.25, 20.753011829611623 ], "wc_review_avg": [ 378.0, 124.6495086231791 ], "wc_reply_reviewers_avg": [ 326.0, 312.9001438158826 ], "wc_reply_authors_avg": [ 2219.5, 554.6694961866931 ], "reply_reviewers_avg": [ 1.5, 0.5 ], "reply_authors_avg": [ 6.25, 0.82915619758885 ], "replies_avg": [ 37, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 8, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=2971491082992789812&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=8htNAnMSyP", "pdf": "https://openreview.net/pdf?id=8htNAnMSyP", "email": "usyd.edu.au;jd.com;;ustc.edu.cn;mbzuai.ac.ae", "author_num": 5, "aff_unique_index": "0;1;2;3", "aff_unique_norm": "University of Sydney;JD.com;University of Science and Technology of China;Mohamed bin Zayed University of Artificial Intelligence", "aff_unique_dep": 
";;;", "aff_unique_url": "https://www.sydney.edu.au;https://www.jd.com;http://www.ustc.edu.cn;https://mbzuai.ac.ae", "aff_unique_abbr": "USYD;JD;USTC;MBZUAI", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;1;2", "aff_country_unique": "Australia;China;United Arab Emirates" }, { "title": "Poisoned Forgery Face: Towards Backdoor Attacks on Face Forgery Detection", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19318", "id": "8iTpB4RNvP", "author_site": "Jiawei Liang, Siyuan Liang, Aishan Liu, Xiaojun Jia, Junhao Kuang, Xiaochun Cao", "tldr": "", "abstract": "The proliferation of face forgery techniques has raised significant concerns within society, thereby motivating the development of face forgery detection methods. These methods aim to distinguish forged faces from genuine ones and have proven effective in practical applications. However, this paper introduces a novel and previously unrecognized threat in face forgery detection scenarios caused by backdoor attack. By embedding backdoors into models and incorporating specific trigger patterns into the input, attackers can deceive detectors into producing erroneous predictions for forged faces. To achieve this goal, this paper proposes \\emph{Poisoned Forgery Face} framework, which enables clean-label backdoor attacks on face forgery detectors. Our approach involves constructing a scalable trigger generator and utilizing a novel convolving process to generate translation-sensitive trigger patterns. Moreover, we employ a relative embedding method based on landmark-based regions to enhance the stealthiness of the poisoned samples. Consequently, detectors trained on our poisoned samples are embedded with backdoors. Notably, our approach surpasses SoTA backdoor baselines with a significant improvement in attack success rate (+16.39\\% BD-AUC) and reduction in visibility (-12.65\\% $L_\\infty$). Furthermore, our attack exhibits promising performance against backdoor defenses. We anticipate that this paper will draw greater attention to the potential threats posed by backdoor attacks in face forgery detection scenarios. 
Our codes will be made available at \\url{https://github.com/JWLiang007/PFF}.", "keywords": "Deepfake Detection;Backdoor Attack", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/c9892c29e38f6dc89dbeac92fcf9e72a9c2f5640.zip", "author": "Jiawei Liang;Siyuan Liang;Aishan Liu;Xiaojun Jia;Junhao Kuang;Xiaochun Cao", "authorids": "~Jiawei_Liang1;~Siyuan_Liang1;~Aishan_Liu1;~Xiaojun_Jia1;~Junhao_Kuang1;~Xiaochun_Cao3", "gender": "M;F;M;M;;M", "homepage": "https://www.researchgate.net/profile/Jiawei-Liang-11;https://www.github.com/;https://liuaishan.github.io/;https://jiaxiaojunqaq.github.io/;https://github.com/knight4u13;https://scst.sysu.edu.cn/members/caoxiaochun.htm", "dblp": ";205/8767.html;177/5658;;;39/3695", "google_scholar": "https://scholar.google.com.hk/citations?user=w60LFNwAAAAJ;Hon4nf0AAAAJ;88tzr_sAAAAJ;https://scholar.google.com/citations?hl=zh-CN;;https://scholar.google.com/citations?hl=en", "orcid": "0000-0003-1143-6873;0000-0002-6154-0233;;0000-0002-2018-9344;;0000-0001-7141-708X", "linkedin": ";;;;;", "or_profile": "~Jiawei_Liang1;~Siyuan_Liang1;~Aishan_Liu1;~Xiaojun_Jia1;~Junhao_Kuang1;~Xiaochun_Cao3", "aff": "SUN YAT-SEN UNIVERSITY;National University of Singapore;Beihang University;Nanyang Technological University;SUN YAT-SEN UNIVERSITY;SUN YAT-SEN UNIVERSITY", "aff_domain": "sysu.edu.cn;nus.edu;buaa.edu.cn;ntu.edu.sg;sysu.edu.cn;sysu.edu.cn", "position": "MS student;Researcher;Assistant Professor;Postdoc;Undergrad student;Full Professor", "bibtex": "@inproceedings{\nliang2024poisoned,\ntitle={Poisoned Forgery Face: Towards Backdoor Attacks on Face Forgery Detection},\nauthor={Jiawei Liang and Siyuan Liang and Aishan Liu and Xiaojun Jia and Junhao Kuang and Xiaochun Cao},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=8iTpB4RNvP}\n}", "github": "", "project": "", "reviewers": "GcXY;4qiC;uGDS", "pdf_size": 5589900, "rating": "6;8;8", "confidence": "4;5;4", "soundness": "3;4;3", "contribution": "3;4;3", "presentation": "3;4;3", "wc_summary": "82;72;100", "wc_strengths": "71;81;69", "wc_weaknesses": "83;144;216", "wc_questions": "230;4;9", "wc_review": "466;301;394", "wc_reply_reviewers": "97;22;37", "wc_reply_authors": "1246;998;1549", "reply_reviewers": "1;1;1", "reply_authors": "3;3;4", "rating_avg": [ 7.333333333333333, 0.9428090415820634 ], "confidence_avg": [ 4.333333333333333, 0.4714045207910317 ], "soundness_avg": [ 3.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 3.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 3.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 84.66666666666667, 11.585431464655178 ], "wc_strengths_avg": [ 73.66666666666667, 5.2493385826745405 ], "wc_weaknesses_avg": [ 147.66666666666666, 54.35888969514452 ], "wc_questions_avg": [ 81.0, 105.37868222115262 ], "wc_review_avg": [ 387.0, 67.54257916307313 ], "wc_reply_reviewers_avg": [ 52.0, 32.4037034920393 ], "wc_reply_authors_avg": [ 1264.3333333333333, 225.3180468187629 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 3.3333333333333335, 0.4714045207910317 ], "replies_avg": [ 22, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.4999999999999999, "gs_citation": 32, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12263160280159972267&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=8iTpB4RNvP", "pdf": 
"https://openreview.net/pdf?id=8iTpB4RNvP", "email": "sysu.edu.cn;nus.edu;buaa.edu.cn;ntu.edu.sg;sysu.edu.cn;sysu.edu.cn", "author_num": 6, "aff_unique_index": "0;1;2;3;0;0", "aff_unique_norm": "Sun Yat-sen University;National University of Singapore;Beihang University;Nanyang Technological University", "aff_unique_dep": ";;;", "aff_unique_url": "http://www.sysu.edu.cn;https://www.nus.edu.sg;http://www.buaa.edu.cn/;https://www.ntu.edu.sg", "aff_unique_abbr": "SYSU;NUS;BUAA;NTU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;0;1;0;0", "aff_country_unique": "China;Singapore" }, { "id": "8iojQVLLWb", "title": "Bayesian Knowledge Distillation for Online Action Detection", "track": "main", "status": "Reject", "tldr": "", "abstract": "Online action detection aims at identifying the ongoing action in a streaming video without seeing the future. Timely and accurate response is critical for real-world applications. In this paper, we introduce Bayesian knowledge distillation (BKD), an efficient and generalizable framework for online action detection. Specifically, we adopt a teacher-student architecture. During the training, the teacher model is built with a Bayesian neural network to output both the feature mutual information that measures the informativeness of historical features to ongoing action and the detection uncertainty. For efficient online detection, we also introduce a student model based on the evidential neural network that learns the feature mutual information and predictive uncertainties from the teacher model. In this way, the student model can not only select important features and make fast inference, but also efficiently quantify the prediction uncertainty by a single forward pass. We evaluated our proposed method on three benchmark datasets including THUMOS'14, TVSeries, and HDD. Our method achieves competitive performance with much better computational efficiency and much less model complexity. We also demonstrate that BKD generalizes better and is more data-efficient by extensive ablation studies. 
Finally, we validate the uncertainty quantification of the student model by performing abnormal action detection.", "keywords": "Online action detection;knowledge distillation;mutual information;uncertainty quantification", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/f6e366e0bf22ec1481b420f92501008a709307a6.pdf", "author": "Hongji Guo;Hanjing Wang;Qiang Ji", "authorids": "~Hongji_Guo1;~Hanjing_Wang2;~Qiang_Ji1", "gender": "M;M;M", "homepage": "https://sites.ecse.rpi.edu/~cvrl/Hongji/hongji.html;https://www.ecse.rpi.edu/~cvrl/people_zw.html;https://www.ecse.rpi.edu/~qji/", "dblp": "330/1899;234/8752;", "google_scholar": "I213n_cAAAAJ;;vAXmpVIAAAAJ", "orcid": ";;", "linkedin": "hongji-guo-357124192/;;", "or_profile": "~Hongji_Guo1;~Hanjing_Wang2;~Qiang_Ji1", "aff": "Rensselaer Polytechnic Institute;Rensselaer Polytechnic Institute;Rensselaer Polytechnic Institute", "aff_domain": "rpi.edu;rpi.edu;rpi.edu", "position": "PhD student;PhD student;Professor", "bibtex": "@misc{\nguo2024bayesian,\ntitle={Bayesian Knowledge Distillation for Online Action Detection},\nauthor={Hongji Guo and Hanjing Wang and Qiang Ji},\nyear={2024},\nurl={https://openreview.net/forum?id=8iojQVLLWb}\n}", "github": "", "project": "", "reviewers": "i6Lf;f1zi;kgXL;37DN", "site": "https://openreview.net/forum?id=8iojQVLLWb", "pdf_size": 4195624, "rating": "3;3;5;5", "confidence": "4;4;4;2", "soundness": "2;2;3;2", "contribution": "2;2;2;2", "presentation": "3;2;3;2", "wc_summary": "80;105;64;67", "wc_strengths": "29;90;26;80", "wc_weaknesses": "217;352;112;150", "wc_questions": "61;42;11;12", "wc_review": "387;589;213;309", "wc_reply_reviewers": "48;90;55;69", "wc_reply_authors": "572;611;212;371", "reply_reviewers": "1;1;1;1", "reply_authors": "1;1;1;1", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 3.5, 0.8660254037844386 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 79.0, 16.170961628796228 ], "wc_strengths_avg": [ 56.25, 28.98598799420161 ], "wc_weaknesses_avg": [ 207.75, 91.37388850213172 ], "wc_questions_avg": [ 31.5, 21.10094784600919 ], "wc_review_avg": [ 374.5, 138.32841356713377 ], "wc_reply_reviewers_avg": [ 65.5, 16.03901493234544 ], "wc_reply_authors_avg": [ 441.5, 160.7801293692725 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=9528727725945138740&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 0, "aff_unique_index": "0;0;0", "aff_unique_norm": "Rensselaer Polytechnic Institute", "aff_unique_dep": "", "aff_unique_url": "https://www.rpi.edu", "aff_unique_abbr": "RPI", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "title": "Finite Scalar Quantization: VQ-VAE Made Simple", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19317", "id": "8ishA3LxN8", "author_site": "Fabian Mentzer, David Minnen, Eirikur Agustsson, Michael Tschannen", "tldr": "", "abstract": "We propose to replace vector quantization (VQ) in the latent representation of VQ-VAEs\nwith a simple scheme termed finite scalar quantization (FSQ), where we project the VAE representation down to a few dimensions (typically less than 10).\nEach 
dimension is quantized to a small set of fixed values, leading to an (implicit) codebook given by the product of these sets.\nBy appropriately choosing the number of dimensions and values each dimension can take, we obtain the same codebook size as in VQ.\nOn top of such discrete representations,\nwe can train the same models that have been trained on VQ-VAE representations. For example, autoregressive and masked transformer models for image generation, multimodal generation, and dense prediction computer vision tasks.\nConcretely, we employ FSQ with MaskGIT for image generation, and with UViM for depth estimation, colorization, and panoptic segmentation.\nDespite the much simpler design of FSQ, we obtain competitive performance in all these tasks.\nWe emphasize that FSQ does not suffer from codebook collapse and does not need the complex machinery employed in VQ (commitment losses, codebook reseeding, code splitting, entropy penalties, etc.) to learn expressive discrete representations.", "keywords": "representation learning;vector quantization;quantization", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/8d534731cef42aa361d20832385f5dc4f32f5537.pdf", "author": "Fabian Mentzer;David Minnen;Eirikur Agustsson;Michael Tschannen", "authorids": "~Fabian_Mentzer2;~David_Minnen1;~Eirikur_Agustsson1;~Michael_Tschannen1", "gender": "M;M;;", "homepage": "https://fmentzer.github.io;http://research.minnen.org;;https://mitscha.github.io/", "dblp": "186/8020;;http://dblp.uni-trier.de/pers/hd/a/Agustsson:Eirikur;134/9824", "google_scholar": "https://scholar.google.ch/citations?user=R80F8XUAAAAJ;https://scholar.google.com/citations?hl=en;https://scholar.google.ch/citations?user=Uhvyua4AAAAJ;https://scholar.google.ch/citations?user=TSj_8nYAAAAJ", "orcid": ";;;", "linkedin": ";;eirikuragustsson/;", "or_profile": "~Fabian_Mentzer2;~David_Minnen1;~Eirikur_Agustsson1;~Michael_Tschannen1", "aff": "Google;Google;Google;Google DeepMind", "aff_domain": "google.com;google.com;google.com;google.com", "position": "Researcher;Researcher;Researcher;Researcher", "bibtex": "@inproceedings{\nmentzer2024finite,\ntitle={Finite Scalar Quantization: {VQ}-{VAE} Made Simple},\nauthor={Fabian Mentzer and David Minnen and Eirikur Agustsson and Michael Tschannen},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=8ishA3LxN8}\n}", "github": "", "project": "", "reviewers": "zMky;fsTh;Hp3C;HYXB", "pdf_size": 3295764, "rating": "6;6;6;8", "confidence": "4;4;2;3", "soundness": "3;3;3;3", "contribution": "2;2;3;3", "presentation": "3;3;3;2", "wc_summary": "73;50;250;120", "wc_strengths": "62;45;89;47", "wc_weaknesses": "67;84;101;115", "wc_questions": "97;97;37;145", "wc_review": "299;276;477;427", "wc_reply_reviewers": "28;0;17;120", "wc_reply_authors": "456;785;217;385", "reply_reviewers": "1;0;1;1", "reply_authors": "1;1;1;1", "rating_avg": [ 6.5, 0.8660254037844386 ], "confidence_avg": [ 3.25, 0.82915619758885 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 123.25, 77.40599137017755 ], "wc_strengths_avg": [ 60.75, 17.583728273605686 ], "wc_weaknesses_avg": [ 91.75, 18.019087102292392 ], "wc_questions_avg": [ 94.0, 38.301436004411116 ], "wc_review_avg": [ 369.75, 84.52033778919723 ], "wc_reply_reviewers_avg": [ 41.25, 46.54769059792333 ], "wc_reply_authors_avg": [ 
460.75, 206.34482668581734 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.17407765595569782, "gs_citation": 166, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6562591541374820279&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=8ishA3LxN8", "pdf": "https://openreview.net/pdf?id=8ishA3LxN8", "email": "google.com;google.com;google.com;google.com", "author_num": 4, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "Google", "aff_unique_dep": "Google", "aff_unique_url": "https://www.google.com", "aff_unique_abbr": "Google", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Mountain View;", "aff_country_unique_index": "0;0;0;1", "aff_country_unique": "United States;United Kingdom" }, { "title": "Combining Axes Preconditioners through Kronecker Approximation for Deep Learning", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19316", "id": "8j9hz8DVi8", "author_site": "Venkata Sai Surya Subramanyam Duvvuri, Fnu Devvrit, Rohan Anil, Cho-Jui Hsieh, Inderjit Dhillon", "tldr": "", "abstract": "Adaptive regularization based optimization methods such as full-matrix Adagrad which use gradient second-moment information hold significant potential for fast convergence in deep neural network (DNN) training, but are memory intensive and computationally demanding for large neural nets. We develop a technique called Combining AxeS PReconditioners (CASPR), which optimizes matrix-shaped DNN parameters by finding different preconditioners for each mode/axis of the parameter and combining them using a Kronecker-sum based approximation. We show tighter convergence guarantees in stochastic optimization compared to a Kronecker product based preconditioner, Shampoo, which arises as a special case of CASPR. 
Furthermore, our experiments demonstrates that CASPR approximates the gradient second-moment matrix in full-matrix Adagrad more accurately, and shows significant improvement in training and generalization performance compared to existing practical adaptive regularization based methods such as Shampoo and Adam in a variety of tasks including graph neural network on OGBG-molpcba, Transformer on a universal dependencies dataset and auto-regressive large language modeling on C4 dataset.", "keywords": "Optimization", "primary_area": "optimization", "supplementary_material": "", "author": "Sai Surya Duvvuri;Fnu Devvrit;Rohan Anil;Cho-Jui Hsieh;Inderjit S Dhillon", "authorids": "~Sai_Surya_Duvvuri1;~Fnu_Devvrit1;~Rohan_Anil1;~Cho-Jui_Hsieh1;~Inderjit_S_Dhillon1", "gender": "M;M;M;M;M", "homepage": ";;;http://web.cs.ucla.edu/~chohsieh/index.html;http://www.cs.utexas.edu/users/inderjit/", "dblp": "277/6122;;182/1833;14/2770;d/InderjitSDhillon", "google_scholar": "UL3980gAAAAJ;c86HtPoAAAAJ;;Wy89g4IAAAAJ;xBv5ZfkAAAAJ", "orcid": ";;;;", "linkedin": "sai-surya-duvvuri-79903511b/;devvrit/;;;inderjit-dhillon-a20888b0/", "or_profile": "~Sai_Surya_Duvvuri1;~Fnu_Devvrit1;~Rohan_Anil1;~Cho-Jui_Hsieh1;~Inderjit_S_Dhillon1", "aff": "University of Texas at Austin;, University of Texas at Austin;Google Brain ;University of California, Los Angeles;University of Texas, Austin", "aff_domain": "cs.utexas.edu;cs.utexas.edu;google.com;ucla.edu;utexas.edu", "position": "PhD student;PhD student;Principal Engineer;Associate Professor;Full Professor", "bibtex": "@inproceedings{\nduvvuri2024combining,\ntitle={Combining Axes Preconditioners through Kronecker Approximation for Deep Learning},\nauthor={Sai Surya Duvvuri and Fnu Devvrit and Rohan Anil and Cho-Jui Hsieh and Inderjit S Dhillon},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=8j9hz8DVi8}\n}", "github": "", "project": "", "reviewers": "gGzL;Vz7y;a8ib", "pdf_size": 678541, "rating": "6;8;8", "confidence": "3;5;3", "soundness": "3;4;3", "contribution": "3;4;4", "presentation": "3;4;3", "wc_summary": "48;77;41", "wc_strengths": "37;67;22", "wc_weaknesses": "129;25;81", "wc_questions": "109;108;4", "wc_review": "323;277;148", "wc_reply_reviewers": "0;76;0", "wc_reply_authors": "803;258;271", "reply_reviewers": "0;1;0", "reply_authors": "3;2;1", "rating_avg": [ 7.333333333333333, 0.9428090415820634 ], "confidence_avg": [ 3.6666666666666665, 0.9428090415820634 ], "soundness_avg": [ 3.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 3.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 3.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 55.333333333333336, 15.584892970081281 ], "wc_strengths_avg": [ 42.0, 18.708286933869708 ], "wc_weaknesses_avg": [ 78.33333333333333, 42.49967320135794 ], "wc_questions_avg": [ 73.66666666666667, 49.2634640366356 ], "wc_review_avg": [ 249.33333333333334, 74.07353703509027 ], "wc_reply_reviewers_avg": [ 25.333333333333332, 35.82674358011841 ], "wc_reply_authors_avg": [ 444.0, 253.90680705067098 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 2.0, 0.816496580927726 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.5, "gs_citation": 6, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12991620137545411675&as_sdt=805&sciodt=0,3&hl=en", "gs_version_total": 2, "openreview": "https://openreview.net/forum?id=8j9hz8DVi8", "pdf": 
"https://openreview.net/pdf?id=8j9hz8DVi8", "email": "cs.utexas.edu;cs.utexas.edu;google.com;ucla.edu;utexas.edu", "author_num": 5, "aff_unique_index": "0;0;1;2;0", "aff_unique_norm": "University of Texas at Austin;Google;University of California, Los Angeles", "aff_unique_dep": ";Google Brain;", "aff_unique_url": "https://www.utexas.edu;https://brain.google.com;https://www.ucla.edu", "aff_unique_abbr": "UT Austin;Google Brain;UCLA", "aff_campus_unique_index": "0;0;1;2;0", "aff_campus_unique": "Austin;Mountain View;Los Angeles", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "8jKuUHsndT", "title": "Re-evaluating Retrosynthesis Algorithms with Syntheseus", "track": "main", "status": "Reject", "tldr": "", "abstract": "The planning of how to synthesize molecules, also known as retrosynthesis, has been a growing focus of the machine learning and chemistry communities in recent years. Despite the appearance of steady progress, we argue that imperfect benchmarks and inconsistent comparisons mask systematic shortcomings of existing techniques. To remedy this, we present a benchmarking library called syntheseus which promotes best practice by default, enabling consistent meaningful evaluation of single-step and multi-step retrosynthesis algorithms. We use syntheseus to re-evaluate a number of previous retrosynthesis algorithms, and find that the ranking of state-of-the-art models changes when evaluated carefully. We end with guidance for future works in this area.", "keywords": "retrosynthesis;reaction prediction;chemistry;drug design;science", "primary_area": "applications to physical sciences (physics, chemistry, biology, etc.)", "supplementary_material": "/attachment/42f838fa010120ad601b8a33bdb7878062eff97e.zip", "author": "Krzysztof Maziarz;Austin Tripp;Guoqing Liu;Megan Stanley;Shufang Xie;Piotr Gai\u0144ski;Philipp Seidl;Marwin Segler", "authorids": "~Krzysztof_Maziarz1;~Austin_Tripp1;~Guoqing_Liu3;~Megan_Stanley1;~Shufang_Xie1;~Piotr_Gai\u0144ski1;~Philipp_Seidl1;~Marwin_Segler2", "gender": "M;M;M;;M;M;M;", "homepage": ";https://www.austintripp.ca/;https://www.microsoft.com/en-us/research/people/guoqingliu/;;;https://github.com/panpiort8/;;", "dblp": "194/2971;267/5455;;;https://dblp.uni-trier.de/pid/163/2704-3;;262/3456;185/0993", "google_scholar": "BA8bBVkAAAAJ;WAvRaxMAAAAJ;h-eHvyoAAAAJ;;;;WmyltwcAAAAJ;imsL94QAAAAJ", "orcid": ";0000-0002-0138-7740;;;;;;", "linkedin": ";;;megan-jane-stanley/;;;phseidl/;", "or_profile": "~Krzysztof_Maziarz1;~Austin_Tripp1;~Guoqing_Liu3;~Megan_Stanley1;~Shufang_Xie1;~Piotr_Gai\u0144ski1;~Philipp_Seidl1;~Marwin_Segler1", "aff": "Microsoft Research;University of Cambridge;Microsoft Research ;Microsoft Research Cambridge;Renmin University of China;Mila - Quebec Artificial Intelligence Institute;Johannes Kepler University Linz;Microsoft", "aff_domain": "microsoft.com;cam.ac.uk;microsoft.com;microsoft.com;ruc.edu.cn;mila.quebec;jku.at;microsoft.com", "position": "Senior Researcher;PhD student;Researcher;Researcher;PhD student;Intern;PhD student;Researcher", "bibtex": "@misc{\nmaziarz2024reevaluating,\ntitle={Re-evaluating Retrosynthesis Algorithms with Syntheseus},\nauthor={Krzysztof Maziarz and Austin Tripp and Guoqing Liu and Megan Stanley and Shufang Xie and Piotr Gai{\\'n}ski and Philipp Seidl and Marwin Segler},\nyear={2024},\nurl={https://openreview.net/forum?id=8jKuUHsndT}\n}", "github": "", "project": "", "reviewers": "cznK;eNX2;WK4y;JYEf", "site": "https://openreview.net/forum?id=8jKuUHsndT", "pdf_size": 578731, 
"rating": "3;5;6;8", "confidence": "4;4;3;4", "soundness": "2;3;3;4", "contribution": "2;2;3;3", "presentation": "3;2;3;3", "wc_summary": "111;99;60;61", "wc_strengths": "81;63;68;184", "wc_weaknesses": "114;52;94;153", "wc_questions": "21;31;53;52", "wc_review": "327;245;275;450", "wc_reply_reviewers": "98;0;0;133", "wc_reply_authors": "496;528;406;486", "reply_reviewers": "1;0;0;2", "reply_authors": "3;1;2;3", "rating_avg": [ 5.5, 1.8027756377319946 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 82.75, 22.65364209128413 ], "wc_strengths_avg": [ 99.0, 49.512624652708524 ], "wc_weaknesses_avg": [ 103.25, 36.409991760504425 ], "wc_questions_avg": [ 39.25, 13.718144918318949 ], "wc_review_avg": [ 324.25, 78.30509242699354 ], "wc_reply_reviewers_avg": [ 57.75, 59.060879607401716 ], "wc_reply_authors_avg": [ 479.0, 44.91102314577124 ], "reply_reviewers_avg": [ 0.75, 0.82915619758885 ], "reply_authors_avg": [ 2.25, 0.82915619758885 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": -0.16012815380508713, "gs_citation": 32, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=3781188252048429306&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 6, "aff_unique_index": "0;1;0;0;2;3;4;0", "aff_unique_norm": "Microsoft;University of Cambridge;Renmin University of China;Quebec Artificial Intelligence Institute;Johannes Kepler University", "aff_unique_dep": "Microsoft Research;;;Artificial Intelligence;", "aff_unique_url": "https://www.microsoft.com/en-us/research;https://www.cam.ac.uk;http://www.ruc.edu.cn;https://mila.quebec;https://www.jku.at", "aff_unique_abbr": "MSR;Cambridge;RUC;Mila;JKU", "aff_campus_unique_index": "1;1;2", "aff_campus_unique": ";Cambridge;Linz", "aff_country_unique_index": "0;1;0;1;2;3;4;0", "aff_country_unique": "United States;United Kingdom;China;Canada;Austria" }, { "id": "8lLaS1ekDA", "title": "Signatures Meet Dynamic Programming: Generalizing Bellman Equations for Trajectory Following", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Path signatures have been proposed as a powerful representation of paths that ef\ufb01ciently captures the path\u2019s analytic and geometric characteristics, having useful algebraic properties including fast concatenation of paths through tensor products. Signatures have recently been widely adopted in machine learning problems for time series analysis. In this work we establish connections between value functions typically used in optimal control and intriguing properties of path signatures. These connections motivate our novel control framework with signature transforms that ef\ufb01ciently generalizes the Bellman equation to the space of trajectories. We analyze the properties and advantages of the framework, termed signature control. In particular, we demonstrate that (i) it can naturally deal with varying/adaptive time steps; (ii) it propagates higher-level information more ef\ufb01ciently than value function updates; (iii) it is robust to dynamical system misspeci\ufb01cation over long rollouts. As a speci\ufb01c case of our framework, we devise a model predictive control method for path tracking. This method generalizes integral control, being suitable for problems with unknown disturbances. 
The proposed algorithms are tested in simulation, with differentiable physics models including typical control and robotics tasks such as point-mass, curve following for an ant model, and a robotic manipulator.", "keywords": "Decision making;Path signature;Bellman equation;Integral control;Model predictive control;Robotics", "primary_area": "applications to robotics, autonomy, planning", "supplementary_material": "/attachment/31e087a732bf849de7221b5f837a4c104c4b0288.zip", "author": "Motoya Ohnishi;Iretiayo Akinola;Jie Xu;Ajay Mandlekar;Fabio Ramos", "authorids": "~Motoya_Ohnishi1;~Iretiayo_Akinola1;~Jie_Xu7;~Ajay_Mandlekar1;~Fabio_Ramos1", "gender": "M;M;M;M;M", "homepage": "https://mohnishi.github.io/;;https://people.csail.mit.edu/jiex;https://ai.stanford.edu/~amandlek/;https://fabioramos.github.io/", "dblp": "207/9907;;37/5126-28;https://dblp.uni-trier.de/pers/hd/m/Mandlekar:Ajay;22/2488", "google_scholar": ";e1zesfMAAAAJ;3Tj5lWEAAAAJ;MEz23joAAAAJ;https://scholar.google.com.au/citations?user=T_mJiHoAAAAJ", "orcid": ";;;;", "linkedin": ";;;;fabio-ramos-3256b421/", "or_profile": "~Motoya_Ohnishi1;~Iretiayo_Akinola1;~Jie_Xu7;~Ajay_Mandlekar1;~Fabio_Ramos1", "aff": "University of Washington;NVIDIA;NVIDIA;NVIDIA;NVIDIA", "aff_domain": "washington.edu;nvidia.com;nvidia.com;nvidia.com;nvidia.com", "position": "PhD student;Researcher;Researcher;Researcher;Principal Research Scientist", "bibtex": "@misc{\nohnishi2024signatures,\ntitle={Signatures Meet Dynamic Programming: Generalizing Bellman Equations for Trajectory Following},\nauthor={Motoya Ohnishi and Iretiayo Akinola and Jie Xu and Ajay Mandlekar and Fabio Ramos},\nyear={2024},\nurl={https://openreview.net/forum?id=8lLaS1ekDA}\n}", "github": "", "project": "", "reviewers": "1sNc;ZzLg;AcwD", "site": "https://openreview.net/forum?id=8lLaS1ekDA", "pdf_size": 3336066, "rating": "3;5;5", "confidence": "3;3;3", "soundness": "2;2;2", "contribution": "3;2;2", "presentation": "1;3;1", "wc_summary": "80;120;81", "wc_strengths": "118;167;33", "wc_weaknesses": "962;128;152", "wc_questions": "178;44;1", "wc_review": "1338;459;267", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 4.333333333333333, 0.9428090415820634 ], "confidence_avg": [ 3.0, 0.0 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 1.6666666666666667, 0.9428090415820634 ], "wc_summary_avg": [ 93.66666666666667, 18.624953392931992 ], "wc_strengths_avg": [ 106.0, 55.35943159631127 ], "wc_weaknesses_avg": [ 414.0, 387.618369017775 ], "wc_questions_avg": [ 74.33333333333333, 75.37609405876346 ], "wc_review_avg": [ 688.0, 466.2552948761011 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 3, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=2357026002029994603&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "aff_unique_index": "0;1;1;1;1", "aff_unique_norm": "University of Washington;NVIDIA", "aff_unique_dep": ";NVIDIA Corporation", "aff_unique_url": "https://www.washington.edu;https://www.nvidia.com", "aff_unique_abbr": "UW;NVIDIA", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "United States" }, { "title": "DiffEnc: Variational Diffusion with a Learned Encoder", "status": 
"Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19315", "id": "8nxy1bQWTG", "author_site": "Beatrix M. G. Nielsen, Anders Christensen, Andrea Dittadi, Ole Winther", "tldr": "", "abstract": "Diffusion models may be viewed as hierarchical variational autoencoders (VAEs) with two improvements: parameter sharing for the conditionals in the generative process and efficient computation of the loss as independent terms over the hierarchy. We consider two changes to the diffusion model that retain these advantages while adding flexibility to the model. Firstly, we introduce a data and depth-dependent mean function in the diffusion process, which leads to a modified diffusion loss. Our proposed framework, DiffEnc, achieves a statistically significant improvement in likelihood on CIFAR-10. Secondly, we let the ratio of the noise variance of the reverse encoder process and the generative process be a free weight parameter rather than being fixed to one. This leads to theoretical insights: For a finite depth hierarchy, the evidence lower bound (ELBO) can be used as an objective for a weighted diffusion loss approach and for optimizing the noise schedule specifically for inference. For the infinite-depth hierarchy, on the other hand, the weight parameter has to be one to have a well-defined ELBO.", "keywords": "DDPM;diffusion;image generation;encoder", "primary_area": "generative models", "supplementary_material": "", "author": "Beatrix Miranda Ginn Nielsen;Anders Christensen;Andrea Dittadi;Ole Winther", "authorids": "~Beatrix_Miranda_Ginn_Nielsen1;~Anders_Christensen1;~Andrea_Dittadi1;~Ole_Winther1", "gender": "F;M;M;M", "homepage": ";;https://addtt.github.io;https://olewinther.github.io/", "dblp": ";44/5606;;36/1568", "google_scholar": ";https://scholar.google.com/citations?hl=da;PrvuuaAAAAAJ;7VAwhzUAAAAJ", "orcid": "0009-0005-0092-024X;0009-0009-0038-5485;;0000-0002-1966-3205", "linkedin": "beatrix-miranda-ginn-nielsen-84201694;anderschrist/;;owinther/", "or_profile": "~Beatrix_Miranda_Ginn_Nielsen1;~Anders_Christensen1;~Andrea_Dittadi1;~Ole_Winther1", "aff": "Technical University of Denmark;Technical University of Denmark;Mila - Quebec Artificial Intelligence Institute;Technical University of Denmark", "aff_domain": "dtu.dk;dtu.dk;mila.quebec;dtu.dk", "position": "PhD student;PhD student;Visiting Researcher;Full Professor", "bibtex": "@inproceedings{\nnielsen2024diffenc,\ntitle={DiffEnc: Variational Diffusion with a Learned Encoder},\nauthor={Beatrix Miranda Ginn Nielsen and Anders Christensen and Andrea Dittadi and Ole Winther},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=8nxy1bQWTG}\n}", "github": "", "project": "", "reviewers": "g9hi;jJ4J;Hg56;neQL", "pdf_size": 3398407, "rating": "5;6;6;6", "confidence": "2;4;4;1", "soundness": "3;3;3;2", "contribution": "2;2;3;3", "presentation": "3;4;3;2", "wc_summary": "58;41;105;86", "wc_strengths": "71;38;79;101", "wc_weaknesses": "133;227;306;56", "wc_questions": "70;73;146;24", "wc_review": "332;379;636;267", "wc_reply_reviewers": "0;0;35;0", "wc_reply_authors": "506;874;583;188", "reply_reviewers": "0;0;1;0", "reply_authors": "1;1;1;1", "rating_avg": [ 5.75, 0.4330127018922193 ], "confidence_avg": [ 2.75, 1.299038105676658 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 72.5, 24.70323865407125 ], "wc_strengths_avg": [ 72.25, 
22.620510604316607 ], "wc_weaknesses_avg": [ 180.5, 94.43119188064927 ], "wc_questions_avg": [ 78.25, 43.671357890498435 ], "wc_review_avg": [ 403.5, 140.00089285429576 ], "wc_reply_reviewers_avg": [ 8.75, 15.155444566227676 ], "wc_reply_authors_avg": [ 537.75, 244.15402413230873 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.3333333333333333, "gs_citation": 9, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5956881876886698360&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=8nxy1bQWTG", "pdf": "https://openreview.net/pdf?id=8nxy1bQWTG", "email": "dtu.dk;dtu.dk;mila.quebec;dtu.dk", "author_num": 4, "aff_unique_index": "0;0;1;0", "aff_unique_norm": "Technical University of Denmark;Quebec Artificial Intelligence Institute", "aff_unique_dep": ";Artificial Intelligence", "aff_unique_url": "https://www.tek.dk;https://mila.quebec", "aff_unique_abbr": "DTU;Mila", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;1;0", "aff_country_unique": "Denmark;Canada" }, { "id": "8nz6xYntfJ", "title": "AlignDiff: Aligning Diffusion Models for General Few-Shot Segmentation", "track": "main", "status": "Reject", "tldr": "", "abstract": "Text-to-image diffusion models have shown remarkable success in synthesizing photo-realistic images. Apart from creative applications, can we use such models to synthesize samples that aid the few-shot training of discriminative models? In this work, we propose AlignDiff, a general framework for synthesizing training images and associated mask annotations for few-shot segmentation. We identify three levels of misalignments that arise when utilizing pre-trained diffusion models in segmentation tasks. These misalignments need to be addressed to create realistic training samples and align the synthetic data distribution with the real training distribution: 1) instance-level misalignment, where generated samples fail to be consistent with the target task (e.g., specific texture or out-of-distribution generation of rare categories); 2) scene-level misalignment, where synthetic samples are object-centric and fail to represent realistic scene layouts with multiple objects; and 3) annotation-level misalignment, where diffusion models are limited to generating images without pixel-level annotations. AlignDiff overcomes these challenges by leveraging a few real samples to guide the generation, thus improving novel IoU over baseline methods in generalized few-shot semantic segmentation on Pascal-5i and COCO-20i by up to 80%. In addition, AlignDiff is capable of augmenting the learning of out-of-distribution categories on FSS-1000, while naive diffusion model generates samples that hurt the training process. 
The code will be released.", "keywords": "Few-shot learning;image segmentation;image synthesis;training synthesis", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Ri-Zhao Qiu;Yu-Xiong Wang;Kris Hauser", "authorids": "~Ri-Zhao_Qiu1;~Yu-Xiong_Wang1;~Kris_Hauser2", "gender": "Not Specified;;M", "homepage": "https://rogerqi.github.io/;https://yxw.cs.illinois.edu/;http://kkhauser.web.illinois.edu", "dblp": "336/5470;35/10700;", "google_scholar": "uH0re54AAAAJ;T_Q-xDkAAAAJ;-sGaL8sAAAAJ", "orcid": ";;", "linkedin": "rizhaoqiu/;;", "or_profile": "~Ri-Zhao_Qiu1;~Yu-Xiong_Wang1;~Kris_Hauser2", "aff": "University of California, San Diego;Department of Computer Science, University of Illinois Urbana-Champaign;University of Illinois, Urbana-Champaign", "aff_domain": "ucsd.edu;cs.illinois.edu;illinois.edu", "position": "PhD student;Assistant Professor;Full Professor", "bibtex": "@misc{\nqiu2024aligndiff,\ntitle={AlignDiff: Aligning Diffusion Models for General Few-Shot Segmentation},\nauthor={Ri-Zhao Qiu and Yu-Xiong Wang and Kris Hauser},\nyear={2024},\nurl={https://openreview.net/forum?id=8nz6xYntfJ}\n}", "github": "", "project": "", "reviewers": "ZQEG;cYiM;bS35;ofKT", "site": "https://openreview.net/forum?id=8nz6xYntfJ", "pdf_size": 16923510, "rating": "3;5;5;6", "confidence": "4;4;4;4", "soundness": "3;3;3;3", "contribution": "2;2;3;2", "presentation": "3;1;2;3", "wc_summary": "147;122;69;100", "wc_strengths": "72;27;78;59", "wc_weaknesses": "234;247;156;81", "wc_questions": "22;57;4;46", "wc_review": "475;453;307;286", "wc_reply_reviewers": "0;77;0;0", "wc_reply_authors": "722;1024;234;726", "reply_reviewers": "0;1;0;0", "reply_authors": "1;2;1;1", "rating_avg": [ 4.75, 1.0897247358851685 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.25, 0.82915619758885 ], "wc_summary_avg": [ 109.5, 28.692333470807146 ], "wc_strengths_avg": [ 59.0, 19.710403344427025 ], "wc_weaknesses_avg": [ 179.5, 66.67270805959512 ], "wc_questions_avg": [ 32.25, 20.64430914319973 ], "wc_review_avg": [ 380.25, 84.43747686898277 ], "wc_reply_reviewers_avg": [ 19.25, 33.34197804570089 ], "wc_reply_authors_avg": [ 676.5, 283.32093110111015 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=1403047807487662662&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 10, "aff_unique_index": "0;1;2", "aff_unique_norm": "University of California, San Diego;University of Illinois Urbana-Champaign;University of Illinois", "aff_unique_dep": ";Department of Computer Science;", "aff_unique_url": "https://www.ucsd.edu;https://illinois.edu;https://illinois.edu", "aff_unique_abbr": "UCSD;UIUC;UIUC", "aff_campus_unique_index": "0;1;1", "aff_campus_unique": "San Diego;Urbana-Champaign", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "8oNzf7u5lT", "title": "Pylic: Leveraging Source Code for Planning in Structured Environments", "track": "main", "status": "Reject", "tldr": "", "abstract": "This paper investigates the application of program analysis techniques to planning problems in dynamic environments with discontinuities in long-horizon settings. 
Traditional approaches rely on specialized representations, which are often tailored to specific problems and domains. In contrast, we propose describing the combined planning and control problem directly as a desired property of the execution of simulator source code. This representation is expressive, naturally providing a means to describe desired properties of even very dynamic and discontinuous environments. We show that, despite this generality, it is still possible to leverage domain knowledge by relating it to the simulator source code. We study the effectiveness of this approach through several case studies in simulated robotic environments. Our results show that in these environments, our framework can improve the efficiency in solving the control and planning problem, relative to standard numerical and reinforcement learning methods.", "keywords": "program analysis;planning;robotics;optimization", "primary_area": "neurosymbolic & hybrid AI systems (physics-informed, logic & formal reasoning, etc.)", "supplementary_material": "/attachment/92ea473536bb13af7e2f11255bbc254dcb94c811.zip", "author": "Leonardo Hernandez Cano;Nathan Hunt;Sara Magliacane;Armando Solar-Lezama", "authorids": "~Leonardo_Hernandez_Cano1;~Nathan_Hunt1;~Sara_Magliacane1;~Armando_Solar-Lezama1", "gender": ";M;F;M", "homepage": ";;http://saramagliacane.github.io;https://people.csail.mit.edu/asolar/", "dblp": ";200/8601;120/5256;95/6919", "google_scholar": ";;https://scholar.google.nl/citations?user=H3j_zQ4AAAAJ;https://scholar.google.com.tw/citations?user=8BX3BokAAAAJ", "orcid": ";;;", "linkedin": ";;magliacane/;", "or_profile": "~Leonardo_Hernandez_Cano1;~Nathan_Hunt1;~Sara_Magliacane1;~Armando_Solar-Lezama1", "aff": ";Massachusetts Institute of Technology;University of Amsterdam;Massachusetts Institute of Technology", "aff_domain": ";mit.edu;uva.nl;mit.edu", "position": ";PhD student;Assistant Professor;Full Professor", "bibtex": "@misc{\ncano2024pylic,\ntitle={Pylic: Leveraging Source Code for Planning in Structured Environments},\nauthor={Leonardo Hernandez Cano and Nathan Hunt and Sara Magliacane and Armando Solar-Lezama},\nyear={2024},\nurl={https://openreview.net/forum?id=8oNzf7u5lT}\n}", "github": "", "project": "", "reviewers": "uEX5;ppCk;wE34", "site": "https://openreview.net/forum?id=8oNzf7u5lT", "pdf_size": 685675, "rating": "3;3;5", "confidence": "4;4;2", "soundness": "1;2;2", "contribution": "1;2;2", "presentation": "2;2;2", "wc_summary": "59;55;41", "wc_strengths": "34;25;41", "wc_weaknesses": "428;601;146", "wc_questions": "6;71;19", "wc_review": "527;752;247", "wc_reply_reviewers": "181;0;95", "wc_reply_authors": "1271;508;389", "reply_reviewers": "1;0;1", "reply_authors": "2;1;1", "rating_avg": [ 3.6666666666666665, 0.9428090415820634 ], "confidence_avg": [ 3.3333333333333335, 0.9428090415820634 ], "soundness_avg": [ 1.6666666666666667, 0.4714045207910317 ], "contribution_avg": [ 1.6666666666666667, 0.4714045207910317 ], "presentation_avg": [ 2.0, 0.0 ], "wc_summary_avg": [ 51.666666666666664, 7.717224601860151 ], "wc_strengths_avg": [ 33.333333333333336, 6.548960901462833 ], "wc_weaknesses_avg": [ 391.6666666666667, 187.5212580541796 ], "wc_questions_avg": [ 32.0, 28.083209693100727 ], "wc_review_avg": [ 508.6666666666667, 206.57255921884257 ], "wc_reply_reviewers_avg": [ 92.0, 73.92338376093635 ], "wc_reply_authors_avg": [ 722.6666666666666, 390.761933776678 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 1.3333333333333333, 0.4714045207910317 ], 
"replies_avg": [ 11, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -1.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:jz2EayYY-nsJ:scholar.google.com/&scioq=Pylic:+Leveraging+Source+Code+for+Planning+in+Structured+Environments&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;1;0", "aff_unique_norm": "Massachusetts Institute of Technology;University of Amsterdam", "aff_unique_dep": ";", "aff_unique_url": "https://web.mit.edu;https://www.uva.nl", "aff_unique_abbr": "MIT;UvA", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;0", "aff_country_unique": "United States;Netherlands" }, { "id": "8oUF3uGIVo", "title": "Exploring High-Order Message-Passing in Graph Transformers", "track": "main", "status": "Reject", "tldr": "", "abstract": "The Transformer architecture has demonstrated promising performance on graph learning tasks. However, the existing attention mechanism used in Graph Transformers (GT) cannot capture high-order correlations that exist in complex graphs, thereby limiting their expressiveness. In this paper, we present a High-Order message-passing strategy within the Transformer architecture (HOtrans) to learn long-range, high-order relationships for graph representation. Recognizing that some nodes share similar properties, we extract communities from the entire graph and introduce a virtual node to connect all nodes in the community. Operating on the community, we adopt a three-step message-passing approach: capture the high-order information of the community into a virtual node; propagate long-range dependent information between communities; aggregate community-level representations back to graph nodes. This facilitates effective global information passing. Virtual nodes capture the high-order community information and support the long-range information passing as the bridge. \nWe demonstrate that many existing GTs can be regarded as special cases of this framework. 
Our experimental results illustrate that our proposed HOtrans consistently achieves highly competitive results across several node classification tasks.", "keywords": "Graph representation learning;Transformer", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Xueqi Ma;Xingjun Ma;Chuang Liu;Sarah Monazam Erfani;James Bailey", "authorids": "~Xueqi_Ma1;~Xingjun_Ma1;~Chuang_Liu2;~Sarah_Monazam_Erfani1;~James_Bailey1", "gender": "F;M;M;;", "homepage": ";http://xingjunma.com/;https://liuchuang0059.github.io/;https://people.eng.unimelb.edu.au/smonazam/;", "dblp": "194/4773;195/8270;52/1800-8;136/0170;", "google_scholar": "https://scholar.google.com/citations?hl=en;https://scholar.google.com.au/citations?user=XQViiyYAAAAJ;hQzjzekAAAAJ;https://scholar.google.com.au/citations?user=Jq9ocx4AAAAJ;", "orcid": ";;0000-0003-2377-2567;;", "linkedin": ";xingjun-ma-173532129/;;;", "or_profile": "~Xueqi_Ma1;~Xingjun_Ma1;~Chuang_Liu2;~Sarah_Monazam_Erfani1;~James_Bailey1", "aff": "University of Melbourne;Fudan University;Wuhan University;The University of Melbourne;", "aff_domain": "unimelb.edu;fudan.edu.cn;whu.edu;unimelb.edu.au;", "position": "PhD student;Associate Professor;PhD student;Associate Professor;", "bibtex": "@misc{\nma2024exploring,\ntitle={Exploring High-Order Message-Passing in Graph Transformers},\nauthor={Xueqi Ma and Xingjun Ma and Chuang Liu and Sarah Monazam Erfani and James Bailey},\nyear={2024},\nurl={https://openreview.net/forum?id=8oUF3uGIVo}\n}", "github": "", "project": "", "reviewers": "eGUc;e8WT;7DnL;akHZ", "site": "https://openreview.net/forum?id=8oUF3uGIVo", "pdf_size": 426931, "rating": "3;3;5;5", "confidence": "5;4;4;5", "soundness": "2;2;3;3", "contribution": "2;2;2;3", "presentation": "3;3;2;4", "wc_summary": "69;58;85;66", "wc_strengths": "36;44;30;89", "wc_weaknesses": "137;427;211;151", "wc_questions": "25;44;5;45", "wc_review": "267;573;331;351", "wc_reply_reviewers": "0;22;0;0", "wc_reply_authors": "510;640;360;422", "reply_reviewers": "0;1;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 4.5, 0.5 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 69.5, 9.810708435174291 ], "wc_strengths_avg": [ 49.75, 23.19886850689059 ], "wc_weaknesses_avg": [ 231.5, 116.24435470163702 ], "wc_questions_avg": [ 29.75, 16.361158271956175 ], "wc_review_avg": [ 380.5, 115.38955758646446 ], "wc_reply_reviewers_avg": [ 5.5, 9.526279441628825 ], "wc_reply_authors_avg": [ 483.0, 105.152270541344 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=8011409773533815531&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 0, "aff_unique_index": "0;1;2;0", "aff_unique_norm": "University of Melbourne;Fudan University;Wuhan University", "aff_unique_dep": ";;", "aff_unique_url": "https://www.unimelb.edu.au;https://www.fudan.edu.cn;http://www.whu.edu.cn/", "aff_unique_abbr": "UniMelb;Fudan;WHU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;1;0", "aff_country_unique": "Australia;China" }, { "id": "8oYjW8QxuC", "title": "Pi-DUAL: Using privileged information to distinguish clean from noisy labels", "track": "main", "status": "Reject", 
"tldr": "", "abstract": "Label noise is a pervasive problem in deep learning that often compromises the generalization performance of trained models. Recently, leveraging privileged information (PI) -- information available only during training but not at test time -- has emerged as an effective approach to mitigate this issue. Yet, existing PI-based methods have failed to consistently outperform their no-PI counterparts in terms of preventing overfitting to label noise. To address this deficiency, we introduce Pi-DUAL, an architecture designed to harness PI to distinguish clean from wrong labels. Pi-DUAL decomposes the output logits into a prediction term, based on conventional input features, and a noise-fitting term influenced solely by PI. A gating mechanism steered by PI adaptively shifts focus between these terms, allowing the model to implicitly separate the learning paths of clean and wrong labels. Empirically, Pi-DUAL achieves significant performance improvements on key PI benchmarks (e.g., +6.8% on ImageNet-PI), establishing a new state-of-the-art test set accuracy. Additionally, Pi-DUAL is a potent method for identifying noisy samples post-training, outperforming other strong methods at this task. Overall, Pi-DUAL is a simple, scalable and practical approach for mitigating the effects of label noise in a variety of real-world scenarios with PI.", "keywords": "noisy labels;privileged information;supervised learning", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/04979be18de8465f8a54fb736275a0f60fb768fc.pdf", "author": "Ke Wang;Guillermo Ortiz-Jimenez;Rodolphe Jenatton;Mark Collier;Efi Kokiopoulou;Pascal Frossard", "authorids": "~Ke_Wang19;~Guillermo_Ortiz-Jimenez1;~Rodolphe_Jenatton3;~Mark_Collier1;~Efi_Kokiopoulou2;~Pascal_Frossard1", "gender": "M;;M;M;;", "homepage": "https://wang-kee.github.io/;http://gortizji.github.io;http://rodolphejenatton.com/;;;", "dblp": ";222/2737;68/8398;;;", "google_scholar": "wKBORzsAAAAJ;xAsJnG0AAAAJ;QIR6rygAAAAJ;U4rBrcgAAAAJ;;", "orcid": ";;;;;", "linkedin": ";;;mark-collier-aa446032/;;", "or_profile": "~Ke_Wang19;~Guillermo_Ortiz-Jimenez1;~Rodolphe_Jenatton3;~Mark_Collier1;~Efi_Kokiopoulou2;~Pascal_Frossard1", "aff": "EPFL - EPF Lausanne;Google DeepMind;Google;Google;;", "aff_domain": "epfl.ch;google.com;google.com;google.com;;", "position": "PhD student;Research Scientist;Senior research scientist;Researcher;;", "bibtex": "@misc{\nwang2024pidual,\ntitle={Pi-{DUAL}: Using privileged information to distinguish clean from noisy labels},\nauthor={Ke Wang and Guillermo Ortiz-Jimenez and Rodolphe Jenatton and Mark Collier and Efi Kokiopoulou and Pascal Frossard},\nyear={2024},\nurl={https://openreview.net/forum?id=8oYjW8QxuC}\n}", "github": "", "project": "", "reviewers": "h1hP;VkrZ;sbuM", "site": "https://openreview.net/forum?id=8oYjW8QxuC", "pdf_size": 8107634, "rating": "5;6;6", "confidence": "4;4;3", "soundness": "3;3;3", "contribution": "2;2;3", "presentation": "3;3;3", "wc_summary": "49;108;66", "wc_strengths": "47;87;123", "wc_weaknesses": "126;186;98", "wc_questions": "6;3;4", "wc_review": "228;384;291", "wc_reply_reviewers": "0;89;0", "wc_reply_authors": "1740;1304;764", "reply_reviewers": "0;1;0", "reply_authors": "3;3;1", "rating_avg": [ 5.666666666666667, 0.4714045207910317 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], 
"presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 74.33333333333333, 24.796953217863052 ], "wc_strengths_avg": [ 85.66666666666667, 31.04119127152751 ], "wc_weaknesses_avg": [ 136.66666666666666, 36.709066394496546 ], "wc_questions_avg": [ 4.333333333333333, 1.247219128924647 ], "wc_review_avg": [ 301.0, 64.07807737440318 ], "wc_reply_reviewers_avg": [ 29.666666666666668, 41.95500235040182 ], "wc_reply_authors_avg": [ 1269.3333333333333, 399.203651731238 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 2.3333333333333335, 0.9428090415820634 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.4999999999999999, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5880124482341331784&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 6, "aff_unique_index": "0;1;1;1", "aff_unique_norm": "EPFL;Google", "aff_unique_dep": ";Google DeepMind", "aff_unique_url": "https://www.epfl.ch;https://deepmind.com", "aff_unique_abbr": "EPFL;DeepMind", "aff_campus_unique_index": "0;2;2", "aff_campus_unique": "Lausanne;;Mountain View", "aff_country_unique_index": "0;1;2;2", "aff_country_unique": "Switzerland;United Kingdom;United States" }, { "id": "8oZf2SlXEY", "title": "Distribution Calibration For Few-Shot Learning by Bayesian Relation Inference", "track": "main", "status": "Reject", "tldr": "", "abstract": "Learning from a limited number of samples is difficult as a small number of samples cannot cover all the information in their category. It is worth noting that categories with scarce samples may be distributed in a way that is related to categories that contain sufficient data. Therefore it is possible to calibrate the distribution of a sample-poor category by using categories with a large amount of data. Existing methods of distribution calibration usually use artificially set distances to calculate the association between two categories, which may ignore deeper relations between categories. In this paper, we propose a distribution calibration method based on Bayesian relation inference. For the input few-sample classes, it can automatically infer their relation with the categories with sufficient data and adaptively generate a large amount of fused feature data that can represent the few-sample classes. The results show that a simple logistic regression classifier trained by using the large amount of data generated by our method, exceeds state-of-the-art accuracy for skin disease classification issue. 
Through visual analysis, we demonstrate that the relationship graph generated by this Bayesian relationship inference method has a degree of interpretability.", "keywords": "Bayesian inference;few-shot learning", "primary_area": "probabilistic methods (Bayesian methods, variational inference, sampling, UQ, etc.)", "supplementary_material": "/attachment/4b2b9ff2b5456c9d167f8ad79d6f4fe6137fc161.zip", "author": "Yuchen Liu;Yang Gu;Weining Weng;Zhaohua Yang;Yiqiang Chen", "authorids": "~Yuchen_Liu12;~Yang_Gu5;~Weining_Weng1;~Zhaohua_Yang2;~Yiqiang_Chen1", "gender": "M;F;M;;M", "homepage": "https://github.com/YuchenLiu1225;https://scholar.google.com/citations?hl=en&user=KrsyFoQAAAAJ;;http://yangzhaohua1998.github.io;http://www.ict.cas.cn/sourcedb_2018_ict_cas/cn/jssrck/200909/t20090917_2496596.html", "dblp": ";;;;", "google_scholar": ";https://scholar.google.com/citations?hl=en;3VK38QgAAAAJ;;LC3SwhEAAAAJ", "orcid": ";;0009-0008-5006-1262;;", "linkedin": ";;;;", "or_profile": "~Yuchen_Liu12;~Yang_Gu5;~Weining_Weng1;~Zhaohua_Yang2;~Yiqiang_Chen1", "aff": "University of Chinese Academy of Sciences;Institute of Computing Technology, Chinese Academy of Sciences;Institute of Computing Technology, Chinese Academy of Sciences;Institute of Computing Technology, Chinese Academy of Sciences;Chinese Academy of Sciences", "aff_domain": "ucas.ac.cn;ict.ac.cn;ict.ac.cn;ict.ac.cn;ict.ac.cn", "position": "MS student;Associate Professor;PhD student;MS student;Full Professor", "bibtex": "@misc{\nliu2024distribution,\ntitle={Distribution Calibration For Few-Shot Learning by Bayesian Relation Inference},\nauthor={Yuchen Liu and Yang Gu and Weining Weng and Zhaohua Yang and Yiqiang Chen},\nyear={2024},\nurl={https://openreview.net/forum?id=8oZf2SlXEY}\n}", "github": "", "project": "", "reviewers": "czxy;MVEs;PCKz", "site": "https://openreview.net/forum?id=8oZf2SlXEY", "pdf_size": 1058517, "rating": "3;5;5", "confidence": "2;4;3", "soundness": "2;3;3", "contribution": "1;2;2", "presentation": "1;3;1", "wc_summary": "45;95;173", "wc_strengths": "25;74;95", "wc_weaknesses": "109;102;177", "wc_questions": "8;91;39", "wc_review": "187;362;484", "wc_reply_reviewers": "0;50;247", "wc_reply_authors": "1473;2537;822", "reply_reviewers": "0;2;1", "reply_authors": "5;8;2", "rating_avg": [ 4.333333333333333, 0.9428090415820634 ], "confidence_avg": [ 3.0, 0.816496580927726 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 1.6666666666666667, 0.4714045207910317 ], "presentation_avg": [ 1.6666666666666667, 0.9428090415820634 ], "wc_summary_avg": [ 104.33333333333333, 52.67088590694315 ], "wc_strengths_avg": [ 64.66666666666667, 29.32954520994525 ], "wc_weaknesses_avg": [ 129.33333333333334, 33.82635395992631 ], "wc_questions_avg": [ 46.0, 34.2442209236342 ], "wc_review_avg": [ 344.3333333333333, 121.89157294725324 ], "wc_reply_reviewers_avg": [ 99.0, 106.62394977990013 ], "wc_reply_authors_avg": [ 1610.6666666666667, 706.8806279862408 ], "reply_reviewers_avg": [ 1.0, 0.816496580927726 ], "reply_authors_avg": [ 5.0, 2.449489742783178 ], "replies_avg": [ 23, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.8660254037844385, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:abrTrww8RUQJ:scholar.google.com/&scioq=Distribution+Calibration+For+Few-Shot+Learning+by+Bayesian+Relation+Inference&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1;1;1;1", "aff_unique_norm": "University of Chinese Academy of Sciences;Chinese Academy of Sciences", 
"aff_unique_dep": ";Institute of Computing Technology", "aff_unique_url": "http://www.ucas.ac.cn;http://www.ict.ac.cn", "aff_unique_abbr": "UCAS;CAS", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "China" }, { "id": "8ohamFnX14", "title": "The (co)limit of metabeliefs", "track": "main", "status": "Reject", "tldr": "", "abstract": "Potentially infinite sequences of beliefs arise when reasoning about the future, one's own beliefs, or others' beliefs. Machine learning researchers are typically content with heuristic truncation, or proofs of asymptotic convergence, of sequences of beliefs; however, such approaches lack insight into the structure of the possible choices. We construct and analyze several (co)limits of meta beliefs to understand the topological and geometric structure of sequences of beliefs. We analyze the relationship between different levels, the relationship between different beliefs at different levels, the encoding of temporal and other indexing structures in belief space, and structures preserved in the colimit. Examples demonstrate the ability to formalize and reason about problems of learning, cooperative and competitive reasoning, and sequential decision making. We conclude by emphasizing insights gained, and future directions for more concrete machine learning models.", "keywords": "Belief;colimit;category theory", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "/attachment/6d822a6fc32a8915220e508e24ad2a37c088fb94.pdf", "author": "Benjamin Sheller;Patrick Shafto", "authorids": "~Benjamin_Sheller1;~Patrick_Shafto2", "gender": "M;", "homepage": ";http://www.shaftolab.com", "dblp": ";03/5979", "google_scholar": ";HUi6F7wAAAAJ", "orcid": "0000-0001-6699-0797;", "linkedin": ";", "or_profile": "~Benjamin_Sheller1;~Patrick_Shafto1", "aff": "Drake University;Rutgers University", "aff_domain": "drake.edu;rutgers.edu", "position": "Assistant Professor;Professor", "bibtex": "@misc{\nsheller2024the,\ntitle={The (co)limit of metabeliefs},\nauthor={Benjamin Sheller and Patrick Shafto},\nyear={2024},\nurl={https://openreview.net/forum?id=8ohamFnX14}\n}", "github": "", "project": "", "reviewers": "y6tA;BToD;xqdq;cWSP;sas8", "site": "https://openreview.net/forum?id=8ohamFnX14", "pdf_size": 468735, "rating": "3;5;5;5;8", "confidence": "4;3;2;1;4", "soundness": "2;3;3;3;3", "contribution": "2;2;2;2;3", "presentation": "2;2;4;3;4", "wc_summary": "226;66;158;19;140", "wc_strengths": "5;62;38;1;229", "wc_weaknesses": "157;69;49;22;140", "wc_questions": "3;52;47;1;555", "wc_review": "391;249;292;43;1064", "wc_reply_reviewers": "383;79;25;0;0", "wc_reply_authors": "573;163;124;0;435", "reply_reviewers": "2;1;1;0;0", "reply_authors": "3;2;1;0;1", "rating_avg": [ 5.2, 1.6 ], "confidence_avg": [ 2.8, 1.16619037896906 ], "soundness_avg": [ 2.8, 0.39999999999999997 ], "contribution_avg": [ 2.2, 0.39999999999999997 ], "presentation_avg": [ 3.0, 0.8944271909999159 ], "wc_summary_avg": [ 121.8, 72.36131563204196 ], "wc_strengths_avg": [ 67.0, 84.03570669661795 ], "wc_weaknesses_avg": [ 87.4, 52.347301745171166 ], "wc_questions_avg": [ 131.6, 212.7699226864549 ], "wc_review_avg": [ 407.8, 347.15610321583 ], "wc_reply_reviewers_avg": [ 97.4, 145.68541450673777 ], "wc_reply_authors_avg": [ 259.0, 211.70451105255174 ], "reply_reviewers_avg": [ 0.8, 0.7483314773547883 ], "reply_authors_avg": [ 1.4, 1.019803902718557 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 2, 0 ], 
"corr_rating_confidence": 0.12862393885688164, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:J2yN2_b05uEJ:scholar.google.com/&scioq=The+(co)limit+of+metabeliefs&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1", "aff_unique_norm": "Drake University;Rutgers University", "aff_unique_dep": ";", "aff_unique_url": "https://www.drake.edu;https://www.rutgers.edu", "aff_unique_abbr": "Drake;Rutgers", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "title": "One Step of Gradient Descent is Provably the Optimal In-Context Learner with One Layer of Linear Self-Attention", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19314", "id": "8p3fu56lKc", "author_site": "Arvind Mahankali, Tatsunori Hashimoto, Tengyu Ma", "tldr": "", "abstract": "Recent works have empirically analyzed in-context learning and shown that transformers trained on synthetic linear regression tasks can learn to implement ridge regression, which is the Bayes-optimal predictor, given sufficient capacity (Akyurek et al., 2023), while one-layer transformers with linear self-attention and no MLP layer will learn to implement one step of gradient descent (GD) on a least-squares linear regression objective (von Oswald et al., 2022). However, the theory behind these observations remains poorly understood. We theoretically study transformers with a single layer of linear self-attention, trained on synthetic noisy linear regression data. First, we mathematically show that when the covariates are drawn from a standard Gaussian distribution, the one-layer transformer which minimizes the pre-training loss will implement a single step of GD on the least-squares linear regression objective. Then, we find that changing the distribution of the covariates and weight vector to a non-isotropic Gaussian distribution has a strong impact on the learned algorithm: the global minimizer of the pre-training loss now implements a single step of $\\textit{pre-conditioned}$ GD. However, if only the distribution of the responses is changed, then this does not have a large effect on the learned algorithm: even when the response comes from a more general family of $\\textit{nonlinear}$ functions, the global minimizer of the pre-training loss still implements a single step of GD on a least-squares linear regression objective.", "keywords": "Linear Self-Attention;In-context learning;Gradient Descent;Theoretical Understanding", "primary_area": "learning theory", "supplementary_material": "/attachment/2a9f6630ad97e11aca89759cde4ceb153d835363.zip", "author": "Arvind V. Mahankali;Tatsunori Hashimoto;Tengyu Ma", "authorids": "~Arvind_V._Mahankali1;~Tatsunori_Hashimoto1;~Tengyu_Ma1", "gender": ";M;M", "homepage": ";https://thashim.github.io;http://ai.stanford.edu/~tengyuma/", "dblp": "270/8242.html;;54/9061", "google_scholar": ";5ygiTwsAAAAJ;i38QlUwAAAAJ", "orcid": ";;", "linkedin": ";;", "or_profile": "~Arvind_V._Mahankali1;~Tatsunori_Hashimoto1;~Tengyu_Ma1", "aff": "Computer Science Department, Stanford University;Stanford University;Facebook AI Research", "aff_domain": "cs.stanford.edu;stanford.edu;fb.com", "position": "PhD student;Assistant Professor;Visiting Scientist", "bibtex": "@inproceedings{\nmahankali2024one,\ntitle={One Step of Gradient Descent is Provably the Optimal In-Context Learner with One Layer of Linear Self-Attention},\nauthor={Arvind V. 
Mahankali and Tatsunori Hashimoto and Tengyu Ma},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=8p3fu56lKc}\n}", "github": "", "project": "", "reviewers": "nLRu;VQYN;ksN8;1cqQ", "pdf_size": 401766, "rating": "5;5;6;8", "confidence": "4;3;4;4", "soundness": "2;2;3;4", "contribution": "2;2;3;3", "presentation": "3;2;3;4", "wc_summary": "208;103;88;269", "wc_strengths": "65;20;82;125", "wc_weaknesses": "22;146;177;89", "wc_questions": "97;60;364;2", "wc_review": "392;329;711;485", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "228;92;754;62", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 6.0, 1.224744871391589 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.82915619758885 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 167.0, 74.8698871376203 ], "wc_strengths_avg": [ 73.0, 37.60983913818298 ], "wc_weaknesses_avg": [ 108.5, 59.078337823605025 ], "wc_questions_avg": [ 130.75, 138.85851612342688 ], "wc_review_avg": [ 479.25, 144.85229545989253 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 284.0, 278.47082432456006 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 10, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.4714045207910316, "gs_citation": 112, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=13101108196694454872&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=8p3fu56lKc", "pdf": "https://openreview.net/pdf?id=8p3fu56lKc", "email": "cs.stanford.edu;stanford.edu;fb.com", "author_num": 3, "aff_unique_index": "0;0;1", "aff_unique_norm": "Stanford University;Meta", "aff_unique_dep": "Computer Science Department;Facebook AI Research", "aff_unique_url": "https://www.stanford.edu;https://research.facebook.com", "aff_unique_abbr": "Stanford;FAIR", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Stanford;", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "8p3hMUwwbg", "title": "From Stability to Chaos: Analyzing Gradient Descent Dynamics in Quadratic Regression", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "We conduct a comprehensive investigation into the dynamics of gradient descent using large-order constant step-sizes in the context of quadratic regression models. Within this framework, we reveal that the dynamics can be encapsulated by a specific cubic map, naturally parameterized by the step-size. Through a fine-grained bifurcation analysis concerning the step-size parameter, we delineate five distinct training phases: (1) monotonic, (2) catapult, (3) periodic, (4) chaotic, and (5) divergent, precisely demarcating the boundaries of each phase. As illustrations, we provide examples involving phase retrieval and two-layer neural networks employing quadratic activation functions and constant outer-layers, utilizing orthogonal training data. Our simulations indicate that these five phases also manifest with generic non-orthogonal data. We also empirically investigate the generalization performance when training in the various non-monotonic (and non-divergent) phases. 
In particular, we observe that performing an ergodic trajectory averaging stabilizes the test error in non-monotonic (and non-divergent) phases.", "keywords": "Edges of stability;periodicity;chaos;trajectory averaging;cubic dynamics;quadratic regression", "primary_area": "optimization", "supplementary_material": "", "author": "Xuxing Chen;Krishna Balasubramanian;Promit Ghosal;Bhavya Kumar Agrawalla", "authorids": "~Xuxing_Chen1;~Krishna_Balasubramanian1;promit@brandeis.edu;~Bhavya_Kumar_Agrawalla1", "gender": "M;;;", "homepage": "https://xuxingc.github.io/;;;", "dblp": "221/0393;;;", "google_scholar": "https://scholar.google.com/citations?hl=zh-CN;;;https://scholar.google.com/scholar?hl=en", "orcid": ";;;", "linkedin": ";;;", "or_profile": "~Xuxing_Chen1;~Krishna_Balasubramanian1;promit@brandeis.edu;~Bhavya_Kumar_Agrawalla1", "aff": "University of California, Davis;;;Massachusetts Institute of Technology", "aff_domain": "ucdavis.edu;;;mit.edu", "position": "PhD student;;;Undergrad student", "bibtex": "@misc{\nchen2024from,\ntitle={From Stability to Chaos: Analyzing Gradient Descent Dynamics in Quadratic Regression},\nauthor={Xuxing Chen and Krishna Balasubramanian and Promit Ghosal and Bhavya Kumar Agrawalla},\nyear={2024},\nurl={https://openreview.net/forum?id=8p3hMUwwbg}\n}", "github": "", "project": "", "reviewers": "BLuU;fNyy;MkpK;qRAi;Ebrh", "site": "https://openreview.net/forum?id=8p3hMUwwbg", "pdf_size": 1807377, "rating": "3;3;5;5;6", "confidence": "5;3;3;3;3", "soundness": "3;3;3;3;3", "contribution": "1;1;2;2;2", "presentation": "2;2;3;2;3", "wc_summary": "70;99;122;88;81", "wc_strengths": "68;32;66;74;77", "wc_weaknesses": "125;227;406;1007;78", "wc_questions": "204;125;180;77;44", "wc_review": "467;483;774;1246;280", "wc_reply_reviewers": "0;0;0;0;0", "wc_reply_authors": "0;0;0;0;0", "reply_reviewers": "0;0;0;0;0", "reply_authors": "0;0;0;0;0", "rating_avg": [ 4.4, 1.2 ], "confidence_avg": [ 3.4, 0.8000000000000002 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 1.6, 0.4898979485566356 ], "presentation_avg": [ 2.4, 0.4898979485566356 ], "wc_summary_avg": [ 92.0, 17.72004514666935 ], "wc_strengths_avg": [ 63.4, 16.19382598399773 ], "wc_weaknesses_avg": [ 368.6, 338.46512375723444 ], "wc_questions_avg": [ 126.0, 60.20963378065009 ], "wc_review_avg": [ 650.0, 337.3040171714532 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.5833333333333331, "gs_citation": 7, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12175652516156880684&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "aff_unique_index": "0;1", "aff_unique_norm": "University of California, Davis;Massachusetts Institute of Technology", "aff_unique_dep": ";", "aff_unique_url": "https://www.ucdavis.edu;https://web.mit.edu", "aff_unique_abbr": "UC Davis;MIT", "aff_campus_unique_index": "0", "aff_campus_unique": "Davis;", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "id": "8pYNdmwGAO", "title": "EvolMPNN: Predicting Mutational Effect on Homologous Proteins by Evolution Encoding", "track": "main", "status": "Reject", "tldr": "", "abstract": "Predicting protein properties is paramount for biological and medical advancements. Current protein engineering mutates on a typical protein, called the wild-type, to construct a family of homologous proteins and study their properties. 
Yet, existing methods easily neglect subtle mutations, failing to capture the effect on the protein properties. To this end, we propose EvolMPNN, Evolution-aware Message Passing Neural Network, to learn evolution-aware protein embeddings. EvolMPNN samples sets of anchor proteins, computes evolutionary information by means of residues and employs a differentiable evolution-aware aggregation scheme over these sampled anchors. This way EvolMPNN can capture the mutation effect on proteins with respect to the anchor proteins. Afterwards, the aggregated evolution-aware embeddings are integrated with sequence embeddings to generate final comprehensive protein embeddings. Our model shows up to 6.4% better than state-of-the-art methods and attains 36X inference speedup in comparison with large pre-trained models. The code and models are available at https://anonymous.4open.science/r/EvolMPNN.", "keywords": "Mutation Prediction;Protein Property Prediction;Homologous Protein Sequence Modelling;Message Passing Neural Network", "primary_area": "applications to physical sciences (physics, chemistry, biology, etc.)", "supplementary_material": "", "author": "Zhiqiang Zhong;Davide Mottin", "authorids": "~Zhiqiang_Zhong1;~Davide_Mottin1", "gender": "M;M", "homepage": "https://zhiqiangzhongddu.github.io/;https://mott.in", "dblp": "253/0447;135/7623", "google_scholar": "zHzChxAAAAAJ;https://scholar.google.it/citations?user=evZ9Q9EAAAAJ", "orcid": "0000-0002-1226-5597;0000-0001-8256-2258", "linkedin": "zhiqiang-zhong-097287111/;davide-mottin-67ab7323/", "or_profile": "~Zhiqiang_Zhong1;~Davide_Mottin1", "aff": "Aarhus University;Aarhus University", "aff_domain": "au.dk;au.dk", "position": "Postdoc;Associate Professor", "bibtex": "@misc{\nzhong2024evolmpnn,\ntitle={Evol{MPNN}: Predicting Mutational Effect on Homologous Proteins by Evolution Encoding},\nauthor={Zhiqiang Zhong and Davide Mottin},\nyear={2024},\nurl={https://openreview.net/forum?id=8pYNdmwGAO}\n}", "github": "", "project": "", "reviewers": "fHbu;LeqQ;ojZm", "site": "https://openreview.net/forum?id=8pYNdmwGAO", "pdf_size": 545553, "rating": "3;3;6", "confidence": "4;4;3", "soundness": "3;3;3", "contribution": "2;2;3", "presentation": "3;2;3", "wc_summary": "93;32;80", "wc_strengths": "63;35;127", "wc_weaknesses": "630;138;132", "wc_questions": "416;91;149", "wc_review": "1202;296;488", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 4.0, 1.4142135623730951 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 68.33333333333333, 26.233989826601334 ], "wc_strengths_avg": [ 75.0, 38.505410875183074 ], "wc_weaknesses_avg": [ 300.0, 233.35809392433768 ], "wc_questions_avg": [ 218.66666666666666, 141.53052281712553 ], "wc_review_avg": [ 662.0, 389.79994869163335 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -1.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:K-MxG5d2Je4J:scholar.google.com/&scioq=EvolMPNN:+Predicting+Mutational+Effect+on+Homologous+Proteins+by+Evolution+Encoding&hl=en&as_sdt=0,5", "gs_version_total": 3, "aff_unique_index": "0;0", "aff_unique_norm": "Aarhus University", 
"aff_unique_dep": "", "aff_unique_url": "https://au.dk", "aff_unique_abbr": "AU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "Denmark" }, { "id": "8phE9BVRWS", "title": "SuperFormer: Superpixel-based Transformers for Salient Object Detection", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Images often have local redundant information that can strain the training of deep neural networks. An effective way to reduce spatial redundancy and image complexity is to over-segment with superpixels. With a fast, linear computational complexity, Simple Linear Iterative Clustering (SLIC) generates superpixels by grouping pixels as a function of colour similarity and spatial proximity. However, it is challenging and non-trivial to train a model on over-segmented images with dynamic graph structure and low spatial inductive bias. In order to train on unstructured data, graph neural networks (GNNs) can be applied to classify each superpixel for salient object detection (SOD) by considering a set of superpixels as graphs. Although other works on graph classification or node classification were able to utilize pre-defined edge information or GNNs, naive applications on superpixel graphs do not translate trivially. Our proposed SuperFormer method introduces new feature attributes for superpixels and a dynamic positional encoding for heterogeneous spatial graphs to achieve state-of-the-art results in salient object detection for low model complexity.", "keywords": "Salient Object Detection;Superpixels;Transformers;Graph Neural Networks", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/8f993178f4ac8afbb0ef49f8626e32c95e514b9c.zip", "author": "Jinman Park;Zahra Gharaee;Paul W. Fieguth", "authorids": "~Jinman_Park1;~Zahra_Gharaee1;~Paul_W._Fieguth1", "gender": "M;F;", "homepage": ";https://zahrag.github.io/;", "dblp": "81/3875;174/4584;f/PWFieguth", "google_scholar": ";https://scholar.google.pl/citations?user=nWe8d1MAAAAJ;TObmBfYAAAAJ", "orcid": "0009-0003-0870-8185;0000-0003-0140-0025;0000-0001-7260-2260", "linkedin": "jinmanpark/;zahragh/;paul-fieguth-1071461", "or_profile": "~Jinman_Park1;~Zahra_Gharaee1;~Paul_W._Fieguth1", "aff": "University of Waterloo;University of Waterloo;University of Waterloo", "aff_domain": "uwaterloo.ca;uwaterloo.ca;uwaterloo.ca", "position": "PhD student;Postdoc;Full Professor", "bibtex": "@misc{\npark2024superformer,\ntitle={SuperFormer: Superpixel-based Transformers for Salient Object Detection},\nauthor={Jinman Park and Zahra Gharaee and Paul W. 
Fieguth},\nyear={2024},\nurl={https://openreview.net/forum?id=8phE9BVRWS}\n}", "github": "", "project": "", "reviewers": "tMkj;DeSV;P45W", "site": "https://openreview.net/forum?id=8phE9BVRWS", "pdf_size": 3817996, "rating": "3;3;3", "confidence": "5;4;4", "soundness": "1;2;2", "contribution": "1;2;2", "presentation": "2;3;2", "wc_summary": "40;54;45", "wc_strengths": "27;17;25", "wc_weaknesses": "79;92;84", "wc_questions": "27;80;4", "wc_review": "173;243;158", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 3.0, 0.0 ], "confidence_avg": [ 4.333333333333333, 0.4714045207910317 ], "soundness_avg": [ 1.6666666666666667, 0.4714045207910317 ], "contribution_avg": [ 1.6666666666666667, 0.4714045207910317 ], "presentation_avg": [ 2.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 46.333333333333336, 5.792715732327589 ], "wc_strengths_avg": [ 23.0, 4.320493798938574 ], "wc_weaknesses_avg": [ 85.0, 5.354126134736337 ], "wc_questions_avg": [ 37.0, 31.822423959633664 ], "wc_review_avg": [ 191.33333333333334, 37.04351795148811 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 3, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:j-aW-vzfth8J:scholar.google.com/&scioq=SuperFormer:+Superpixel-based+Transformers+for+Salient+Object+Detection&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;0", "aff_unique_norm": "University of Waterloo", "aff_unique_dep": "", "aff_unique_url": "https://uwaterloo.ca", "aff_unique_abbr": "UW", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "Canada" }, { "id": "8r2f4D0I3S", "title": "Towards Pareto-Optimality for Test-Time Adaptation", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Test-Time Adaptation (TTA) has been effective for mitigating the distribution shifts of test datasets by adapting a pre-trained model. The existing TTA approaches update the model parameters online toward the gradient descent direction by averaging individual objectives in the current batch. The averaged gradient can be biased by only a few instances in the batch, leading to conflict among individual objectives when updating the model. To prevent a negative effect from the gradient conflict among test instances, a model could have been updated by the gradient that is agreeable by all objectives in the batch. Therefore, we propose a new approach to update the model parameters toward Pareto-Optimality across all individual objectives in TTA. Particularly, this paper suggests an extended version of the Pareto optimization to anticipate unexpected distribution shifts during testing time. This extension is enabled by merging the sharpness-aware minimization into the Pareto optimization. 
We demonstrate the effectiveness of the proposed approaches through experiments on three benchmark datasets: CIFAR10-to-CIFAR10C, CIFAR100-to-CIFAR100C, and ImageNet-to-ImageNetC.", "keywords": "Test-Time Adaptation;Pareto-Optimality;Sharpness-Aware Minimization", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "", "author": "JoonHo Jang;DongHyeok Shin;Byeonghu Na;HeeSun Bae;Il-chul Moon", "authorids": "~JoonHo_Jang1;~DongHyeok_Shin1;~Byeonghu_Na1;~HeeSun_Bae1;~Il-chul_Moon1", "gender": ";;M;F;", "homepage": "https://aailab.kaist.ac.kr/xe2/members_phdstudent/16877;;https://sites.google.com/view/byeonghu-na;;", "dblp": "241/9686;;276/5100;;", "google_scholar": "oYbKry4AAAAJ;;https://scholar.google.co.kr/citations?user=mJoqpmEAAAAJ;https://scholar.google.co.kr/citations?user=D9U_ohsAAAAJ;", "orcid": ";;0000-0003-3463-2674;0000-0002-9986-0945;", "linkedin": ";;byeonghu-na-17942120b/;heesun-bae-8a4b8523a/;", "or_profile": "~JoonHo_Jang1;~DongHyeok_Shin1;~Byeonghu_Na1;~HeeSun_Bae1;~Il-chul_Moon1", "aff": "Korea Advanced Institute of Science & Technology;;Korea Advanced Institute of Science & Technology;Korea Advanced Institute of Science & Technology;", "aff_domain": "kaist.ac.kr;;kaist.ac.kr;kaist.ac.kr;", "position": "PhD student;;PhD student;PhD student;", "bibtex": "@misc{\njang2024towards,\ntitle={Towards Pareto-Optimality for Test-Time Adaptation},\nauthor={JoonHo Jang and DongHyeok Shin and Byeonghu Na and HeeSun Bae and Il-chul Moon},\nyear={2024},\nurl={https://openreview.net/forum?id=8r2f4D0I3S}\n}", "github": "", "project": "", "reviewers": "HqZ3;MZwq;7JZo;gRux", "site": "https://openreview.net/forum?id=8r2f4D0I3S", "pdf_size": 6355806, "rating": "3;3;5;6", "confidence": "5;4;4;3", "soundness": "3;2;2;3", "contribution": "2;2;2;3", "presentation": "2;3;2;3", "wc_summary": "84;45;114;96", "wc_strengths": "33;27;55;127", "wc_weaknesses": "149;171;614;102", "wc_questions": "38;2;145;88", "wc_review": "304;245;928;413", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.25, 1.299038105676658 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 84.75, 25.31180554602931 ], "wc_strengths_avg": [ 60.5, 39.78379066906521 ], "wc_weaknesses_avg": [ 259.0, 206.4691260213013 ], "wc_questions_avg": [ 68.25, 53.816238255753255 ], "wc_review_avg": [ 472.5, 269.80038917688756 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.816496580927726, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:g3nWTDi2Y7UJ:scholar.google.com/&scioq=Towards+Pareto-Optimality+for+Test-Time+Adaptation&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;0", "aff_unique_norm": "Korea Advanced Institute of Science and Technology", "aff_unique_dep": "", "aff_unique_url": "https://www.kaist.ac.kr", "aff_unique_abbr": "KAIST", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "South Korea" }, { "id": "8rN439jpkT", "title": "Imitation Learning Using Generalized Sliced Wasserstein Distances", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Imitation learning methods 
allow to train reinforcement learning policies by way\nof minimizing a divergence measure between the state occupancies of the expert\nagent and the novice policy. Alternatively, a true metric in the space of probability\nmeasures can be used by invoking the optimal transport formalism. In this work,\nwe propose a novel imitation learning method based on the generalized form of\nthe sliced Wasserstein distance, which presents a number of computational and\nsample complexity benefits compared to existing imitation learning approaches.\nWe derive a per-state reward function based on the approximate differential of the\n$\\mathcal{SW}2$ distance which allows the use of standard forward RL methods for policy\noptimization. We demonstrate that the proposed method exhibits state-of-the-art\nperformance compared to established imitation learning frameworks on a number\nof benchmark tasks from the MuJoCo robotic locomotion suite.", "keywords": "Imitation Learning;Sliced Wasserstein;Optimal Transport", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Ivan Ovinnikov;Joachim M. Buhmann", "authorids": "~Ivan_Ovinnikov1;~Joachim_M._Buhmann1", "gender": "M;M", "homepage": ";https://ise.ethz.ch", "dblp": ";b/JMBuhmann", "google_scholar": "https://scholar.google.ch/citations?user=m8UKFekAAAAJ;https://scholar.google.ch/citations?user=zQWbCzYAAAAJ", "orcid": ";", "linkedin": "ivan-ovinnikov-0b227593/;", "or_profile": "~Ivan_Ovinnikov1;~Joachim_M._Buhmann1", "aff": "Swiss Federal Institute of Technology;Department of Computer Science, ETHZ - ETH Zurich", "aff_domain": "ethz.ch;inf.ethz.ch", "position": "PhD student;Professor", "bibtex": "@misc{\novinnikov2024imitation,\ntitle={Imitation Learning Using Generalized Sliced Wasserstein Distances},\nauthor={Ivan Ovinnikov and Joachim M. 
Buhmann},\nyear={2024},\nurl={https://openreview.net/forum?id=8rN439jpkT}\n}", "github": "", "project": "", "reviewers": "BgRr;DZ6u;jjKQ;evdi;DVGp", "site": "https://openreview.net/forum?id=8rN439jpkT", "pdf_size": 5309276, "rating": "3;3;5;5;6", "confidence": "3;3;4;3;4", "soundness": "3;3;2;3;4", "contribution": "2;2;2;3;3", "presentation": "3;2;2;2;4", "wc_summary": "32;65;66;71;81", "wc_strengths": "25;29;92;39;43", "wc_weaknesses": "145;71;311;168;139", "wc_questions": "53;76;40;265;5", "wc_review": "255;241;509;543;268", "wc_reply_reviewers": "0;0;0;0;0", "wc_reply_authors": "0;0;0;0;0", "reply_reviewers": "0;0;0;0;0", "reply_authors": "0;0;0;0;0", "rating_avg": [ 4.4, 1.2 ], "confidence_avg": [ 3.4, 0.4898979485566356 ], "soundness_avg": [ 3.0, 0.6324555320336759 ], "contribution_avg": [ 2.4, 0.4898979485566356 ], "presentation_avg": [ 2.6, 0.8 ], "wc_summary_avg": [ 63.0, 16.504544828622205 ], "wc_strengths_avg": [ 45.6, 24.096472770926457 ], "wc_weaknesses_avg": [ 166.8, 79.01999746899514 ], "wc_questions_avg": [ 87.8, 91.53228938467561 ], "wc_review_avg": [ 363.2, 133.63293007339172 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.748455199183749, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:Th_iEzzvVqgJ:scholar.google.com/&scioq=Imitation+Learning+Using+Generalized+Sliced+Wasserstein+Distances&hl=en&as_sdt=0,44", "gs_version_total": 0, "aff_unique_index": "0;1", "aff_unique_norm": "Swiss Federal Institute of Technology;ETH Zurich", "aff_unique_dep": ";Department of Computer Science", "aff_unique_url": "https://www.ethz.ch;https://www.ethz.ch", "aff_unique_abbr": "ETH Zurich;ETHZ", "aff_campus_unique_index": "1", "aff_campus_unique": ";Zurich", "aff_country_unique_index": "0;0", "aff_country_unique": "Switzerland" }, { "id": "8rhHI6C8iC", "title": "All for One and One for All: A Collaborative FL Framework for Generic Federated Learning with Personalized Plug-ins", "track": "main", "status": "Reject", "tldr": "", "abstract": "Personalized federated learning (PFL) mitigates the notorious data heterogeneity issue in generic federated learning (GFL) by assuming that client models only need to fit on local datasets individually. However, real-world FL clients may meet with test data from other distributions. To endow clients with the ability to handle other datasets, we theoretically formulate a new problem named as Selective FL (SFL), bridging the GFL and PFL together. To practically solve SFL, we design a general effective framework named as Hot-Pluggable Federated Learning (HPFL). In HPFL, clients firstly learn a global shared feature extractor. Next, with the frozen feature extractor, multiple personalized plug-in modules are individually learned based on the local data and saved in a modular store on the server. In inference stage, an accurate selection algorithm allows clients to choose and download suitable plug-in modules from the modular store to achieve the high generalization performance on target data distribution. We conduct comprehensive experiments and ablation studies following common FL settings including four datasets and three neural networks, showing that HPFL significantly outperforms advanced FL algorithms. 
Additionally, we empirically show the remarkable potential of HPFL to resolve other practical FL problems like continual federated learning and discuss its possible applications in one-shot FL, anarchic FL and an FL plug-in market.", "keywords": "Federated Learning;Deep Learning", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Lei Shen;Zhenheng Tang;Lijun Wu;Yonggang Zhang;Xiaowen Chu;Tao Qin;Bo Han", "authorids": "~Lei_Shen4;~Zhenheng_Tang2;~Lijun_Wu1;~Yonggang_Zhang1;~Xiaowen_Chu2;~Tao_Qin1;~Bo_Han1", "gender": ";M;M;M;M;M;M", "homepage": "https://shenlei515.github.io/;https://apeterswu.github.io/;https://yonggangzhangben.github.io/index.html;https://facultyprofiles.hkust-gz.edu.cn/faculty-personal-page/CHU-Xiaowen/xwchu;https://www.microsoft.com/en-us/research/people/taoqin/;https://bhanml.github.io/;", "dblp": ";68/1284-3;27/6859-3;24/2536;14/6841;241/0472-3;234/7546", "google_scholar": ";https://scholar.google.com/citations?hl=en;XSbEr98AAAAJ;https://scholar.google.com.hk/citations?user=v4rX24EAAAAJ;Bl4SRU0AAAAJ;nTNjqHwAAAAJ;FlYcrEcAAAAJ", "orcid": ";0000-0002-3530-590X;0000-0002-4080-7592;0000-0001-9745-4372;;;0000-0001-8769-9974", "linkedin": ";lijun-wu-59340478/;;;;;", "or_profile": "~Lei_Shen4;~Lijun_Wu1;~Yonggang_Zhang1;~Xiaowen_Chu2;~Tao_Qin1;~bo_han2;~Zhenheng_TANG1", "aff": "Huazhong University of Science and Technology;Microsoft Research;Hong Kong Baptist University;Hong Kong University of Science and Technology (Guangzhou);;MBZUAI;Hong Kong Baptist University", "aff_domain": "hust.edu.cn;microsoft.com;hkbu.edu.hk;ust.hk;;mbzuai.ac.ae;hkbu.edu.hk", "position": "Undergrad student;Researcher;Postdoc;Full Professor;;Researcher;PhD student", "bibtex": "@misc{\nshen2024all,\ntitle={All for One and One for All: A Collaborative {FL} Framework for Generic Federated Learning with Personalized Plug-ins},\nauthor={Lei Shen and Zhenheng Tang and Lijun Wu and Yonggang Zhang and Xiaowen Chu and Tao Qin and Bo Han},\nyear={2024},\nurl={https://openreview.net/forum?id=8rhHI6C8iC}\n}", "github": "", "project": "", "reviewers": "nQmW;3cLo;TW8h;MHGx;ENEM", "site": "https://openreview.net/forum?id=8rhHI6C8iC", "pdf_size": 2695820, "rating": "3;5;5;5;6", "confidence": "4;4;4;5;4", "soundness": "3;2;2;2;3", "contribution": "2;2;2;1;3", "presentation": "1;2;3;3;2", "wc_summary": "81;81;79;64;146", "wc_strengths": "83;27;78;27;69", "wc_weaknesses": "162;470;149;20;160", "wc_questions": "90;6;78;2;36", "wc_review": "416;584;384;113;411", "wc_reply_reviewers": "182;301;130;0;0", "wc_reply_authors": "3029;2526;2653;914;1793", "reply_reviewers": "1;2;1;0;0", "reply_authors": "6;5;5;5;5", "rating_avg": [ 4.8, 0.9797958971132712 ], "confidence_avg": [ 4.2, 0.39999999999999997 ], "soundness_avg": [ 2.4, 0.4898979485566356 ], "contribution_avg": [ 2.0, 0.6324555320336759 ], "presentation_avg": [ 2.2, 0.7483314773547882 ], "wc_summary_avg": [ 90.2, 28.6174771774173 ], "wc_strengths_avg": [ 56.8, 24.741867350707384 ], "wc_weaknesses_avg": [ 192.2, 148.755369650981 ], "wc_questions_avg": [ 42.4, 36.14194239384486 ], "wc_review_avg": [ 381.6, 151.76639944335506 ], "wc_reply_reviewers_avg": [ 122.6, 114.43006597918223 ], "wc_reply_authors_avg": [ 2183.0, 750.5632551624146 ], "reply_reviewers_avg": [ 0.8, 0.7483314773547883 ], "reply_authors_avg": [ 5.2, 0.39999999999999997 ], "replies_avg": [ 38, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": 0.10206207261596574, "gs_citation": 0, "gs_cited_by_link": 
"https://scholar.google.com/scholar?q=related:e7EgC2in8KoJ:scholar.google.com/&scioq=All+for+One+and+One+for+All:+A+Collaborative+FL+Framework+for+Generic+Federated+Learning+with+Personalized+Plug-ins&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;1;2;3;4;2", "aff_unique_norm": "Huazhong University of Science and Technology;Microsoft;Hong Kong Baptist University;Hong Kong University of Science and Technology;Mohamed bin Zayed University of Artificial Intelligence", "aff_unique_dep": ";Microsoft Research;;;", "aff_unique_url": "http://www.hust.edu.cn;https://www.microsoft.com/en-us/research;https://www.hkbu.edu.hk;https://www.ust.hk;https://www.mbzuai.ac.ae", "aff_unique_abbr": "HUST;MSR;HKBU;HKUST;MBZUAI", "aff_campus_unique_index": "1;1;1", "aff_campus_unique": ";Hong Kong SAR", "aff_country_unique_index": "0;1;0;0;2;0", "aff_country_unique": "China;United States;United Arab Emirates" }, { "title": "Fine-Tuning Enhances Existing Mechanisms: A Case Study on Entity Tracking", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19313", "id": "8sKcAWOf2D", "author_site": "Nikhil Prakash, Tamar Shaham, Tal Haklay, Yonatan Belinkov, David Bau", "tldr": "", "abstract": "Fine-tuning on generalized tasks such as instruction following, code generation, and mathematics has been shown to enhance language models' performance on a range of tasks. Nevertheless, explanations of how such fine-tuning influences the internal computations in these models remain elusive. We study how fine-tuning affects the internal mechanisms implemented in language models. As a case study, we explore the property of entity tracking, a crucial facet of language comprehension, where models fine-tuned on mathematics have substantial performance gains. We identify a mechanism that enables entity tracking and show that (i) both the original model and its fine-tuned version implement entity tracking with the same circuit. In fact, the entity tracking circuit of the fine-tuned version performs better than the full original model. (ii) The circuits of all the models implement roughly the same functionality, that is entity tracking is performed by tracking the position of the correct entity in both the original model and its fine-tuned version. (iii) Performance boost in the fine-tuned model is primarily attributed to its improved ability to handle positional information. To uncover these findings, we employ two methods: DCM, which automatically detects model components responsible for specific semantics, and CMAP, a new approach for patching activations across models to reveal improved mechanisms. 
Our findings suggest that fine-tuning enhances, rather than fundamentally alters, the mechanistic operation of the model.", "keywords": "Mechanistic Interpretability;Fine-Tuning;Entity Tracking;Mechanisms", "primary_area": "visualization or interpretation of learned representations", "supplementary_material": "", "author": "Nikhil Prakash;Tamar Rott Shaham;Tal Haklay;Yonatan Belinkov;David Bau", "authorids": "~Nikhil_Prakash1;~Tamar_Rott_Shaham1;~Tal_Haklay1;~Yonatan_Belinkov1;~David_Bau1", "gender": "M;F;F;M;M", "homepage": "https://nix07.github.io/;https://tamarott.github.io/;;https://www.belinkov.com;https://baulab.info/", "dblp": "227/0705;185/7904;;136/8705;47/3614", "google_scholar": "kUfq-fEAAAAJ;https://scholar.google.co.il/citations?user=YRJ-ePMAAAAJ;;https://scholar.google.com/citations?authorid=K-6ujU4AAAAJ;CYI6cKgAAAAJ", "orcid": ";;;;0000-0003-1744-6765", "linkedin": "nikhil07prakash/;;tal-haklay-501032192/;;david-bau-4b8130/", "or_profile": "~Nikhil_Prakash1;~Tamar_Rott_Shaham1;~Tal_Haklay1;~Yonatan_Belinkov1;~David_Bau1", "aff": "Northeastern University;Massachusetts Institute of Technology;Technion - Israel Institute of Technology, Technion;Technion, Technion;Northeastern University", "aff_domain": "northeastern.edu;mit.edu;technion.ac.il;technion.ac.il;northeastern.edu", "position": "PhD student;Postdoc;MS student;Assistant Professor;Assistant Professor", "bibtex": "@inproceedings{\nprakash2024finetuning,\ntitle={Fine-Tuning Enhances Existing Mechanisms: A Case Study on Entity Tracking},\nauthor={Nikhil Prakash and Tamar Rott Shaham and Tal Haklay and Yonatan Belinkov and David Bau},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=8sKcAWOf2D}\n}", "github": "", "project": "", "reviewers": "AnWX;fhvV;M52Y", "pdf_size": 2936233, "rating": "5;6;6", "confidence": "4;3;4", "soundness": "3;3;3", "contribution": "2;3;3", "presentation": "3;3;3", "wc_summary": "102;188;166", "wc_strengths": "31;96;147", "wc_weaknesses": "58;240;134", "wc_questions": "29;53;2", "wc_review": "220;577;449", "wc_reply_reviewers": "14;0;21", "wc_reply_authors": "768;1574;763", "reply_reviewers": "1;0;1", "reply_authors": "1;3;1", "rating_avg": [ 5.666666666666667, 0.4714045207910317 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 152.0, 36.478304054145205 ], "wc_strengths_avg": [ 91.33333333333333, 47.471628954097994 ], "wc_weaknesses_avg": [ 144.0, 74.63689882803725 ], "wc_questions_avg": [ 28.0, 20.83266665599966 ], "wc_review_avg": [ 415.3333333333333, 147.67607193524015 ], "wc_reply_reviewers_avg": [ 11.666666666666666, 8.73053390247253 ], "wc_reply_authors_avg": [ 1035.0, 381.13602121377437 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 1.6666666666666667, 0.9428090415820634 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.4999999999999999, "gs_citation": 43, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=13633037998843459062&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=8sKcAWOf2D", "pdf": "https://openreview.net/pdf?id=8sKcAWOf2D", "email": "northeastern.edu;mit.edu;technion.ac.il;technion.ac.il;northeastern.edu", "author_num": 5, "aff_unique_index": "0;1;2;2;0", "aff_unique_norm": "Northeastern 
University;Massachusetts Institute of Technology;Technion - Israel Institute of Technology", "aff_unique_dep": ";;", "aff_unique_url": "https://www.northeastern.edu;https://web.mit.edu;https://www.technion.ac.il", "aff_unique_abbr": "NEU;MIT;Technion", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;1;1;0", "aff_country_unique": "United States;Israel" }, { "id": "8tGu1pNUnN", "title": "CodeComplex: A Time-complexity Dataset for Multi-language Source Codes", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Deciding the computational complexity of algorithms is a really challenging problem, even for human algorithm experts. Theoretically, the problem of deciding the computational complexity of a given program is undecidable due to the famous Halting problem. So, we focus on cases where there are inputs and outputs, and of which we can know if the code is right or wrong. \nWe propose our own dataset CodeComplex, which consists of 4,900 Java codes and 4,900 Python codes submitted to programming competitions by human programmers and their complexity labels annotated by a group of algorithm experts. As far as we are aware, the CodeComplex dataset is by far the largest code dataset for the complexity prediction problem. Then, we present experimental results from several baseline models using the SOTA code understanding neural models such as CodeBERT, GraphCodeBERT, PLBART, CodeT5, CodeT5+ and UniXcoder. We also give an analysis on the difficulties of code complexity and why the models are good/bad on predicting the time complexity.\nThe CodeComplex dataset is available at https://anonymous.4open.science/r/CodeComplex-Data\nand material for reproduction is available at https://anonymous.4open.science/r/CodeComplex-Models.", "keywords": "Code complexity;Dataset;Neural network", "primary_area": "datasets and benchmarks", "supplementary_material": "", "author": "SeungYeop Baik;Mingi Jeon;Joonghyuk Hahn;Jungin Kim;Yo-Sub Han;Sang-Ki Ko", "authorids": "~SeungYeop_Baik1;~Mingi_Jeon1;~Joonghyuk_Hahn1;~Jungin_Kim1;~Yo-Sub_Han1;~Sang-Ki_Ko1", "gender": "M;M;M;;;M", "homepage": "https://sybaik1.github.io/;https://ckawoalt.github.io/;https://peer0.github.io;https://github.com/inistory;http://toc.yonsei.ac.kr/~emmous/;https://sites.google.com/site/sangkikotoc/home", "dblp": ";;304/4027;70/4018.html;h/YoSubHan;71/9491.html", "google_scholar": ";;08ccS2oAAAAJ;jLI2V78AAAAJ;yDOh26sAAAAJ;https://scholar.google.com/scholar?hl=en", "orcid": ";;0009-0000-5890-4916;;;", "linkedin": ";;joonghyuk-hahn;;;", "or_profile": "~SeungYeop_Baik1;~Mingi_Jeon1;~Joonghyuk_Hahn1;~Jungin_Kim1;~Yo-Sub_Han1;~Sang-Ki_Ko1", "aff": "Yonsei University;;Yonsei University;Yonsei University;Yonsei University;University of Seoul", "aff_domain": "yonsei.ac.kr;;yonsei.ac.kr;yonsei.ac.kr;yonsei.ac.kr;uos.ac.kr", "position": "PhD student;;PhD student;MS student;Full Professor;Assistant Professor", "bibtex": "@misc{\nbaik2024codecomplex,\ntitle={CodeComplex: A Time-complexity Dataset for Multi-language Source Codes},\nauthor={SeungYeop Baik and Mingi Jeon and Joonghyuk Hahn and Jungin Kim and Yo-Sub Han and Sang-Ki Ko},\nyear={2024},\nurl={https://openreview.net/forum?id=8tGu1pNUnN}\n}", "github": "", "project": "", "reviewers": "UsDM;Vi2o;oyNS;aZXg", "site": "https://openreview.net/forum?id=8tGu1pNUnN", "pdf_size": 583447, "rating": "3;3;5;5", "confidence": "4;4;3;4", "soundness": "2;2;2;3", "contribution": "2;2;2;3", "presentation": "3;2;2;2", "wc_summary": "58;47;67;89", "wc_strengths": 
"78;16;54;112", "wc_weaknesses": "305;93;190;290", "wc_questions": "98;63;127;254", "wc_review": "539;219;438;745", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 65.25, 15.433324334050653 ], "wc_strengths_avg": [ 65.0, 35.0 ], "wc_weaknesses_avg": [ 219.5, 85.37124808739767 ], "wc_questions_avg": [ 135.5, 72.07114540507872 ], "wc_review_avg": [ 485.25, 189.39426469669033 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:22_OuezmMioJ:scholar.google.com/&scioq=CodeComplex:+A+Time-complexity+Dataset+for+Multi-language+Source+Codes&hl=en&as_sdt=0,24", "gs_version_total": 0, "aff_unique_index": "0;0;0;0;1", "aff_unique_norm": "Yonsei University;University of Seoul", "aff_unique_dep": ";", "aff_unique_url": "https://www.yonsei.ac.kr;http://www.useoul.edu", "aff_unique_abbr": "Yonsei;UOS", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "South Korea" }, { "id": "8tWOUmBHRv", "title": "Offline Tracking with Object Permanence", "track": "main", "status": "Reject", "tldr": "", "abstract": "To reduce the expensive labor cost for manual labeling autonomous driving datasets, an alternative is to automatically label the datasets using an offline perception system. However, objects might be temporally occluded. Such occlusion scenarios in the datasets are common yet underexplored in offline autolabeling. In this work, we propose an offline tracking model that focuses on occluded object tracks. It leverages the concept of object permanence which means objects continue to exist even if they are not observed anymore. The model contains three parts: a standard online tracker, a re-identification (Re-ID) module that associates tracklets before and after occlusion, and a track completion module that completes the fragmented tracks. The Re-ID module and the track completion module use the vectorized high-definition map (HD map) as one of the inputs to refine the tracking results with occlusion. The model can effectively recover the occluded object trajectories. 
It achieves state-of-the-art performance in 3D multi-object tracking (MOT) by improving over the original online tracking result by 45% IDS and 2% AMOTA on the vehicle tracks.", "keywords": "autonomous driving;offline tracking;occlusion", "primary_area": "applications to robotics, autonomy, planning", "supplementary_material": "", "author": "Xianzhong Liu;Holger Caesar", "authorids": "~Xianzhong_Liu1;~Holger_Caesar2", "gender": "M;M", "homepage": ";http://it-caesar.com", "dblp": ";125/7460", "google_scholar": ";373LKEYAAAAJ", "orcid": ";", "linkedin": "xianzhong-liu-992375193/;holger-caesar-18600638/?originalSubdomain=sg", "or_profile": "~Xianzhong_Liu1;~Holger_Caesar2", "aff": ";Delft University of Technology", "aff_domain": ";tudelft.nl", "position": ";Assistant Professor", "bibtex": "@misc{\nliu2024offline,\ntitle={Offline Tracking with Object Permanence},\nauthor={Xianzhong Liu and Holger Caesar},\nyear={2024},\nurl={https://openreview.net/forum?id=8tWOUmBHRv}\n}", "github": "", "project": "", "reviewers": "SgKx;tT1W;GvzN;S5GM", "site": "https://openreview.net/forum?id=8tWOUmBHRv", "pdf_size": 2259320, "rating": "3;3;5;5", "confidence": "4;3;4;3", "soundness": "2;3;2;2", "contribution": "1;2;2;1", "presentation": "2;3;3;2", "wc_summary": "64;73;64;73", "wc_strengths": "11;37;56;30", "wc_weaknesses": "22;145;103;124", "wc_questions": "117;54;27;124", "wc_review": "214;309;250;351", "wc_reply_reviewers": "0;44;0;104", "wc_reply_authors": "379;0;0;0", "reply_reviewers": "0;1;0;1", "reply_authors": "1;0;0;0", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 1.5, 0.5 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 68.5, 4.5 ], "wc_strengths_avg": [ 33.5, 16.101242188104617 ], "wc_weaknesses_avg": [ 98.5, 46.5966737010272 ], "wc_questions_avg": [ 80.5, 41.19769411022904 ], "wc_review_avg": [ 281.0, 52.758885507561665 ], "wc_reply_reviewers_avg": [ 37.0, 42.649736224272246 ], "wc_reply_authors_avg": [ 94.75, 164.11181401715112 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 0.25, 0.4330127018922193 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=3862650890182915223&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 7, "aff_unique_index": "0", "aff_unique_norm": "Delft University of Technology", "aff_unique_dep": "", "aff_unique_url": "https://www.tudelft.nl", "aff_unique_abbr": "TU Delft", "aff_country_unique_index": "0", "aff_country_unique": "Netherlands" }, { "id": "8uYJottqTy", "title": "Solving Continual Offline Reinforcement Learning with Decision Transformer", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Continuous offline reinforcement learning (CORL) combines continuous and offline reinforcement learning, enabling agents to learn multiple tasks from static datasets without forgetting prior tasks. However, CORL faces challenges in balancing stability and plasticity. Existing methods, employing Actor-Critic structures and experience replay (ER), suffer from distribution shifts, low efficiency, and weak knowledge-sharing. To address these issues, we first compare AC-based offline algorithms with Decision Transformer (DT) within the CORL framework. DT offers advantages in learning efficiency, distribution shift mitigation, and zero-shot generalization but exacerbates the forgetting problem during supervised parameter updates. 
We introduce multi-head DT (MH-DT) and low-rank adaptation DT (LoRA-DT) to mitigate DT's forgetting problem. MH-DT stores task-specific knowledge using multiple heads, facilitating knowledge sharing with common components. It employs distillation and selective rehearsal to enhance current task learning when a replay buffer is available. In buffer-unavailable scenarios, LoRA-DT merges less influential weights and fine-tunes DT's decisive MLP layer to adapt to the current task. Extensive experiments on MuJoCo and Meta-World benchmarks demonstrate that our methods outperform SOTA CORL baselines and showcase enhanced learning capabilities and superior memory efficiency.", "keywords": "offline RL;continual learning;decision transformer", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Kaixin Huang;Li Shen;Chen Zhao;Chun Yuan;Dacheng Tao", "authorids": "~Kaixin_Huang1;~Li_Shen1;~Chen_Zhao8;~Chun_Yuan1;~Dacheng_Tao1", "gender": "M;M;;M;", "homepage": ";https://sites.google.com/site/mathshenli/home;;https://www.sigs.tsinghua.edu.cn/fg3/105064.jhtml;", "dblp": ";91/3680-8;;;", "google_scholar": "https://scholar.google.com.hk/citations?hl=zh-CN;yVhgENIAAAAJ;;https://scholar.google.com.hk/citations?user=fYdxi2sAAAAJ;", "orcid": ";;;;", "linkedin": ";;;;", "or_profile": "~Kaixin_Huang1;~Li_Shen1;~Chen_Zhao8;~Chun_Yuan1;~Dacheng_Tao1", "aff": "Electronic Engineering, Tsinghua University, Tsinghua University;JD Explore Academy;;Tsinghua University;", "aff_domain": "mails.tsinghua.edu.cn;jd.com;;tsinghua.edu.cn;", "position": "MS student;Researcher;;Full Professor;", "bibtex": "@misc{\nhuang2024solving,\ntitle={Solving Continual Offline Reinforcement Learning with Decision Transformer},\nauthor={Kaixin Huang and Li Shen and Chen Zhao and Chun Yuan and Dacheng Tao},\nyear={2024},\nurl={https://openreview.net/forum?id=8uYJottqTy}\n}", "github": "", "project": "", "reviewers": "Md6w;ZQbc;b7vq;1HUt", "site": "https://openreview.net/forum?id=8uYJottqTy", "pdf_size": 18435930, "rating": "3;3;5;5", "confidence": "4;4;2;3", "soundness": "2;2;3;3", "contribution": "2;2;2;2", "presentation": "1;2;3;2", "wc_summary": "50;38;41;34", "wc_strengths": "28;9;35;36", "wc_weaknesses": "278;176;90;38", "wc_questions": "98;42;2;22", "wc_review": "454;265;168;130", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 3.25, 0.82915619758885 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.0, 0.7071067811865476 ], "wc_summary_avg": [ 40.75, 5.889609494694874 ], "wc_strengths_avg": [ 27.0, 10.8397416943394 ], "wc_weaknesses_avg": [ 145.5, 90.99862636325891 ], "wc_questions_avg": [ 41.0, 35.81898937714463 ], "wc_review_avg": [ 254.25, 125.39213492081551 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.9045340337332909, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10700540742214198622&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 3, "aff_unique_index": "0;1;0", "aff_unique_norm": "Tsinghua University;JD", "aff_unique_dep": "Electronic Engineering;JD Explore Academy", "aff_unique_url": "https://www.tsinghua.edu.cn;", "aff_unique_abbr": "THU;", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", 
"aff_country_unique": "China;" }, { "title": "Learning Nash Equilibria in Rank-1 Games", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19312", "id": "8utTlmhw8v", "author_site": "Nikolas Patris, Ioannis Panageas", "tldr": "", "abstract": "Learning Nash equilibria (NE) in games has garnered significant attention, particularly in the context of training Generative Adversarial Networks (GANs) and multi-agent Reinforcement Learning. The current state-of-the-art in efficiently learning games focuses on landscapes that meet the (weak) Minty property or games characterized by a unique function, often referred to as potential games. A significant challenge in this domain is that computing Nash equilibria is a computationally intractable task [Daskalakis et al. 2009]. \n\nIn this paper we focus on bimatrix games (A,B) called rank-1. These are games in which the sum of the payoff matrices A+B is a rank 1 matrix; note that standard zero-sum games are rank 0. We show that optimistic gradient descent/ascent converges to an \\epsilon-approximate NE after 1/\\epsilon^2 log(1/\\epsilon) iterates in rank-1 games. We achieve this by leveraging structural results about the NE landscape of rank-1 games Adsul et al. 2021. Notably, our approach bypasses the fact that these games do not satisfy the MVI property.", "keywords": "learning in games;rank games;Nash equilibria;Minty;optimistic gradient", "primary_area": "learning theory", "supplementary_material": "", "author": "Nikolas Patris;Ioannis Panageas", "authorids": "~Nikolas_Patris1;~Ioannis_Panageas1", "gender": "M;M", "homepage": "https://npatris.github.io/;https://panageas.github.io", "dblp": "297/4669;139/3829", "google_scholar": "https://scholar.google.com/citations?hl=en;5NiFWuwAAAAJ", "orcid": ";", "linkedin": ";", "or_profile": "~Nikolas_Patris1;~Ioannis_Panageas1", "aff": "University of California, Irvine;Donald Bren School of Information and Computer Sciences, University of California, Irvine", "aff_domain": "uci.edu;ics.uci.edu", "position": "PhD student;Assistant Professor", "bibtex": "@inproceedings{\npatris2024learning,\ntitle={Learning Nash Equilibria in Rank-1 Games},\nauthor={Nikolas Patris and Ioannis Panageas},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=8utTlmhw8v}\n}", "github": "", "project": "", "reviewers": "LH17;cjaZ;r4eu;TKWX", "pdf_size": 7806530, "rating": "5;5;6;8", "confidence": "2;4;4;3", "soundness": "3;3;3;3", "contribution": "3;1;2;3", "presentation": "2;2;4;3", "wc_summary": "76;179;120;95", "wc_strengths": "28;16;30;100", "wc_weaknesses": "42;81;183;29", "wc_questions": "380;45;28;45", "wc_review": "526;321;361;269", "wc_reply_reviewers": "0;0;84;17", "wc_reply_authors": "1608;803;844;455", "reply_reviewers": "0;0;2;1", "reply_authors": "3;2;3;2", "rating_avg": [ 6.0, 1.224744871391589 ], "confidence_avg": [ 3.25, 0.82915619758885 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.25, 0.82915619758885 ], "presentation_avg": [ 2.75, 0.82915619758885 ], "wc_summary_avg": [ 117.5, 38.78466191679386 ], "wc_strengths_avg": [ 43.5, 33.05676935213119 ], "wc_weaknesses_avg": [ 83.75, 60.41264354421184 ], "wc_questions_avg": [ 124.5, 147.6761659849009 ], "wc_review_avg": [ 369.25, 96.19868762098577 ], "wc_reply_reviewers_avg": [ 25.25, 34.62206666275137 ], "wc_reply_authors_avg": [ 927.5, 420.9539761066523 ], "reply_reviewers_avg": [ 0.75, 0.82915619758885 ], "reply_authors_avg": [ 2.5, 0.5 ], 
"replies_avg": [ 21, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12925125726078962169&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 2, "openreview": "https://openreview.net/forum?id=8utTlmhw8v", "pdf": "https://openreview.net/pdf?id=8utTlmhw8v", "email": "uci.edu;ics.uci.edu", "author_num": 2, "aff_unique_index": "0;0", "aff_unique_norm": "University of California, Irvine", "aff_unique_dep": "", "aff_unique_url": "https://www.uci.edu", "aff_unique_abbr": "UCI", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Irvine", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "id": "8vGXHjuCiq", "title": "Connectivity-based Token Condensation for Efficient Vision Transformer", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "The high computational cost of vision transformers blocks their implementation on resource-limited devices such as mobile phones. Reducing the number of tokens can significantly accelerate the inference process and save computational resources. Most of the existing token pruning methods focus on evaluating token's importance and discard the unimportant tokens directly, which incur significant information loss. A few methods suggest ways focusing on merging while directly partition tokens into two parts by random or odd/even partition, which do not consider carefully how to select tokens. In this paper, we propose a new token condensation method based on the connectivity between tokens. Different from the previous methods, we gradually condense the large number of tokens by selection and fusion. The most representative tokens are selected and the others are separately fused into them. Extensive experiments are conducted on benchmark datasets. Compared with the existing methods, our method achieves higher accuracy with lower computational cost. 
For example, our method can reduce 50\\% FLOPs of DeiT-S without accuracy degradation on ImageNet dataset.", "keywords": "Vision Transformer;Token Condensation;Connectivity", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Tianxing Na;Yehui Tang;Chao Zhang;Chao Xu;Yunhe Wang;Kai Han", "authorids": "~Tianxing_Na1;~Yehui_Tang1;~Chao_Zhang10;~Chao_Xu1;~Yunhe_Wang1;~Kai_Han2", "gender": "M;M;M;M;M;M", "homepage": ";;http://www.cis.pku.edu.cn/faculty/vision/zhangchao/zhangchao.htm;http://www.cis.pku.edu.cn/faculty/vision/xuchao/xuchao01.htm;https://www.wangyunhe.site/;https://iamhankai.github.io", "dblp": ";244/9659;94/3019-1;;63/8217-1;51/4757-2", "google_scholar": "https://scholar.google.com/citations?view_op=list_works;TkSZQ6gAAAAJ;NeCCx-kAAAAJ;https://scholar.google.co.uk/citations?hl=zh-CN;https://scholar.google.com.sg/citations?user=isizOkYAAAAJ;vThoBVcAAAAJ", "orcid": ";;;;0000-0002-0142-509X;0000-0002-9761-2702", "linkedin": ";;;;;", "or_profile": "~Tianxing_Na1;~Yehui_Tang1;~Chao_Zhang10;~Chao_Xu1;~Yunhe_Wang1;~Kai_Han2", "aff": "Peking University;Huawei Technologies Ltd.;Peking University;Peking University;Huawei Noah's Ark Lab;Huawei Noah's Ark Lab", "aff_domain": "pku.edu.cn;huawei.com;pku.edu.cn;pku.edu;huawei.com;huawei.com", "position": "MS student;Researcher;Full Professor;Full Professor;Principal Researcher;Principal Researcher", "bibtex": "@misc{\nna2024connectivitybased,\ntitle={Connectivity-based Token Condensation for Efficient Vision Transformer},\nauthor={Tianxing Na and Yehui Tang and Chao Zhang and Chao Xu and Yunhe Wang and Kai Han},\nyear={2024},\nurl={https://openreview.net/forum?id=8vGXHjuCiq}\n}", "github": "", "project": "", "reviewers": "V3W2;DqFk;apVU;1bHr", "site": "https://openreview.net/forum?id=8vGXHjuCiq", "pdf_size": 7198473, "rating": "3;3;5;6", "confidence": "4;4;4;4", "soundness": "2;2;2;3", "contribution": "2;2;2;2", "presentation": "3;2;1;2", "wc_summary": "247;70;98;51", "wc_strengths": "61;16;29;50", "wc_weaknesses": "391;126;136;307", "wc_questions": "190;45;35;46", "wc_review": "889;257;298;454", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.25, 1.299038105676658 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.0, 0.7071067811865476 ], "wc_summary_avg": [ 116.5, 77.17674520216566 ], "wc_strengths_avg": [ 39.0, 17.564168070250297 ], "wc_weaknesses_avg": [ 240.0, 113.02875740270703 ], "wc_questions_avg": [ 79.0, 64.23005527009921 ], "wc_review_avg": [ 474.5, 250.34426296602047 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:gNRJtyhzI2QJ:scholar.google.com/&scioq=Connectivity-based+Token+Condensation+for+Efficient+Vision+Transformer&hl=en&as_sdt=0,48", "gs_version_total": 0, "aff_unique_index": "0;1;0;0;1;1", "aff_unique_norm": "Peking University;Huawei", "aff_unique_dep": ";Huawei Technologies", "aff_unique_url": "http://www.pku.edu.cn;https://www.huawei.com", "aff_unique_abbr": "Peking U;Huawei", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "China" 
}, { "title": "What does automatic differentiation compute for neural networks?", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19311", "id": "8vKknbgXxf", "author_site": "Sejun Park, Sanghyuk Chun, Wonyeol Lee", "tldr": "", "abstract": "Forward- or reverse-mode automatic differentiation (AD) is a popular algorithm for computing the derivative of a function expressed by a program. AD always outputs the correct derivative if a program does not use any non-differentiable functions and control flows; however, it may return an arbitrary value otherwise. In this work, we investigate what AD computes for neural networks that may contain non-differentiable functions such as ReLU and maxpools. We first prove that AD always returns a generalized derivative called a Clarke subderivative for networks with pointwise activation functions, if the minibatch size is one and all non-differentiable neurons have distinct bias parameters. We show that the same conclusion does not hold otherwise, but does hold under some mild sufficient conditions. We also prove similar results for more general networks that can use maxpools and bias parameters shared across different neurons. We empirically check our sufficient conditions over popular network architectures and observe that AD almost always computes a Clarke subderivative in practical learning setups.", "keywords": "automatic differentiation;correctness;neural networks;clarke subdifferential", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Sejun Park;Sanghyuk Chun;Wonyeol Lee", "authorids": "~Sejun_Park1;~Sanghyuk_Chun1;~Wonyeol_Lee1", "gender": ";M;M", "homepage": ";https://sanghyukchun.github.io/home/;https://wonyeol.github.io", "dblp": "155/9882;213/1095.html;124/7158", "google_scholar": ";https://scholar.google.co.kr/citations?user=4_uj0xcAAAAJ;g3TYhjcAAAAJ", "orcid": ";0000-0002-4533-2610;", "linkedin": ";https://kr.linkedin.com/in/sanghyukchun/en;wonyeol/", "or_profile": "~Sejun_Park1;~Sanghyuk_Chun1;~Wonyeol_Lee1", "aff": "Korea University;NAVER AI Lab;Carnegie Mellon University", "aff_domain": "korea.ac.kr;navercorp.com;cmu.edu", "position": "Assistant Professor;Lead research scientist;Postdoc", "bibtex": "@inproceedings{\npark2024what,\ntitle={What does automatic differentiation compute for neural networks?},\nauthor={Sejun Park and Sanghyuk Chun and Wonyeol Lee},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=8vKknbgXxf}\n}", "github": "", "project": "", "reviewers": "84GA;FQtB;XRNZ;uFDP;DHhS", "pdf_size": 509858, "rating": "6;6;8;8;8", "confidence": "3;2;1;3;3", "soundness": "3;3;2;4;4", "contribution": "3;2;2;3;3", "presentation": "2;3;3;4;3", "wc_summary": "52;25;126;544;143", "wc_strengths": "20;19;32;55;115", "wc_weaknesses": "94;36;169;53;88", "wc_questions": "269;32;22;27;43", "wc_review": "435;112;349;679;389", "wc_reply_reviewers": "345;0;0;66;16", "wc_reply_authors": "2253;666;164;1155;393", "reply_reviewers": "2;0;0;1;1", "reply_authors": "7;1;1;3;1", "rating_avg": [ 7.2, 0.9797958971132712 ], "confidence_avg": [ 2.4, 0.8 ], "soundness_avg": [ 3.2, 0.7483314773547882 ], "contribution_avg": [ 2.6, 0.4898979485566356 ], "presentation_avg": [ 3.0, 0.6324555320336759 ], "wc_summary_avg": [ 178.0, 188.23920951810226 ], "wc_strengths_avg": [ 48.2, 35.82959670440068 ], "wc_weaknesses_avg": [ 88.0, 45.88245852174881 ], "wc_questions_avg": [ 78.6, 95.45386320102502 
], "wc_review_avg": [ 392.8, 181.36857500680762 ], "wc_reply_reviewers_avg": [ 85.4, 132.03878218159997 ], "wc_reply_authors_avg": [ 926.2, 741.0401878440872 ], "reply_reviewers_avg": [ 0.8, 0.7483314773547883 ], "reply_authors_avg": [ 2.6, 2.3323807579381204 ], "replies_avg": [ 25, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.10206207261596574, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:FflVEilSkoAJ:scholar.google.com/&scioq=What+does+automatic+differentiation+compute+for+neural+networks%3F&hl=en&as_sdt=0,23", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=8vKknbgXxf", "pdf": "https://openreview.net/pdf?id=8vKknbgXxf", "email": "korea.ac.kr;navercorp.com;cmu.edu", "author_num": 3, "aff_unique_index": "0;1;2", "aff_unique_norm": "Korea University;NAVER Corporation;Carnegie Mellon University", "aff_unique_dep": ";NAVER AI Lab;", "aff_unique_url": "https://www.korea.ac.kr;https://www.naver.com;https://www.cmu.edu", "aff_unique_abbr": "KU;NAVER;CMU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;1", "aff_country_unique": "South Korea;United States" }, { "id": "8vT0f6x1BY", "title": "Going Further: Flatness at the Rescue of Early Stopping for Adversarial Example Transferability", "track": "main", "status": "Reject", "tldr": "", "abstract": "Transferability is the property of adversarial examples to be misclassified by other models than the surrogate model for which they were crafted. Previous research has shown that early stopping the training of the surrogate model substantially increases transferability. A common hypothesis to explain this is that deep neural networks (DNNs) first learn robust features, which are more generic, thus a better surrogate. Then, at later epochs, DNNs learn non-robust features, which are more brittle, hence worst surrogate. We demonstrate that the reasons why early stopping improves transferability lie in the side effects it has on the learning dynamics of the model. We first show that early stopping benefits the transferability of non-robust features. Then, we establish links between transferability and the exploration of the loss landscape in the parameter space, on which early stopping has an inherent effect. More precisely, we observe that transferability peaks when the learning rate decays, which is also the time at which the sharpness of the loss significantly drops. \nThis leads us to evaluate the training of surrogate models with seven minimizers that minimize both loss value and loss sharpness. One of such optimizers, SAM always improves over early stopping (by up to 28.8 percentage points). We also uncover that the strong regularization induced by SAM with large flat neighborhoods is tightly linked to transferability. 
Finally, the best sharpness-aware minimizers are competitive with other training techniques, and complementary to other types of transferability techniques.", "keywords": "adversarial examples;transferability;sharpness;loss landscape;early stopping", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Martin Gubri;Maxime Cordy;YVES LE TRAON", "authorids": "~Martin_Gubri1;~Maxime_Cordy1;~YVES_LE_TRAON1", "gender": "M;M;M", "homepage": "https://gubri.eu;https://maxcordy.github.io/;https://wwwfr.uni.lu/snt/people/yves_le_traon", "dblp": "213/7879;73/10839.html;95/5206", "google_scholar": "Jt4OYwMAAAAJ;sRXHjkIAAAAJ;DmGlmNEAAAAJ", "orcid": "0000-0001-6744-6662;0000-0001-8312-1358;", "linkedin": ";;", "or_profile": "~Martin_Gubri1;~Maxime_Cordy1;~YVES_LE_TRAON1", "aff": "Parameter Lab;University of Luxemburg;", "aff_domain": "parameterlab.de;uni.lu;", "position": "Principal Researcher;Researcher;", "bibtex": "@misc{\ngubri2024going,\ntitle={Going Further: Flatness at the Rescue of Early Stopping for Adversarial Example Transferability},\nauthor={Martin Gubri and Maxime Cordy and YVES LE TRAON},\nyear={2024},\nurl={https://openreview.net/forum?id=8vT0f6x1BY}\n}", "github": "", "project": "", "reviewers": "2E6M;hxCY;4sAy;5DVg", "site": "https://openreview.net/forum?id=8vT0f6x1BY", "pdf_size": 769398, "rating": "3;3;5;6", "confidence": "4;5;4;4", "soundness": "2;1;3;3", "contribution": "2;2;3;3", "presentation": "1;3;4;3", "wc_summary": "201;108;134;95", "wc_strengths": "29;117;53;65", "wc_weaknesses": "351;467;619;318", "wc_questions": "168;15;75;5", "wc_review": "749;707;881;483", "wc_reply_reviewers": "0;0;30;0", "wc_reply_authors": "429;378;347;204", "reply_reviewers": "0;0;1;0", "reply_authors": "1;1;1;1", "rating_avg": [ 4.25, 1.299038105676658 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 2.25, 0.82915619758885 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.75, 1.0897247358851685 ], "wc_summary_avg": [ 134.5, 40.88092464707715 ], "wc_strengths_avg": [ 66.0, 32.17141588429082 ], "wc_weaknesses_avg": [ 438.75, 117.86512418862503 ], "wc_questions_avg": [ 65.75, 64.82042502174758 ], "wc_review_avg": [ 705.0, 143.35271186831451 ], "wc_reply_reviewers_avg": [ 7.5, 12.99038105676658 ], "wc_reply_authors_avg": [ 339.5, 83.52993475395512 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.5555555555555555, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=13291102371347036259&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "aff_unique_index": "0;1", "aff_unique_norm": "Parameter Lab;University of Luxembourg", "aff_unique_dep": ";", "aff_unique_url": ";https://wwwen.uniluxembourg.lu", "aff_unique_abbr": ";Uni Lu", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "1", "aff_country_unique": ";Luxembourg" }, { "id": "8w6FzR68DS", "title": "PriViT: Vision Transformers for Fast Private Inference", "track": "main", "status": "Reject", "tldr": "", "abstract": "The Vision Transformer (ViT) architecture has emerged as the backbone of choice for state-of-the-art deep models for computer vision applications. However, ViTs are ill-suited for private inference using secure multi-party computation (MPC) protocols, due to the large number of non-polynomial operations (self-attention, feed-forward rectifiers, layer normalization). 
We propose PriViT, a gradient-based algorithm to selectively Taylorize nonlinearities in ViTs while maintaining their prediction accuracy. Our algorithm is conceptually simple, easy to implement, and achieves improved performance over existing approaches for designing MPC-friendly transformer architectures in terms of achieving the Pareto frontier in latency-accuracy. We confirm these improvements via experiments on several standard image classification tasks.", "keywords": "private inference;transformers;secure multi-party communication", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/77397e0854eaf94604242cbe06f4a72ccb6b3b17.pdf", "author": "Naren Dhyani;Jianqiao Cambridge Mo;Minsu Cho;Ameya Joshi;Siddharth Garg;Brandon Reagen;Chinmay Hegde", "authorids": "~Naren_Dhyani1;~Jianqiao_Cambridge_Mo1;~Minsu_Cho2;~Ameya_Joshi2;~Siddharth_Garg1;~Brandon_Reagen1;~Chinmay_Hegde1", "gender": "M;M;M;M;M;M;M", "homepage": ";http://engineering.nyu.edu/people/siddharth-garg/;https://brandonreagen.com/;https://chinmayhegde.github.io/;https://ameya005.github.io;https://engineering.nyu.edu/student/jianqiao-cambridge-mo;", "dblp": ";94/3807;135/8203;39/2056;148/8731;260/4034;", "google_scholar": ";https://scholar.google.com.tw/citations?user=Yf8OqQQAAAAJ;cO2uYoAAAAAJ;eJAV17IAAAAJ;jZgsp_sAAAAJ;rydgKnMAAAAJ;1pcqgUYAAAAJ", "orcid": ";;;;;0000-0001-9533-8183;", "linkedin": "naren-dhyani/;;;;;jianqiao-cambridge-mo/;", "or_profile": "~Naren_Dhyani1;~Siddharth_Garg1;~Brandon_Reagen1;~Chinmay_Hegde1;~Ameya_A_Joshi1;~Jianqiao_Mo1;~Minsu_Cho3", "aff": ";New York University;New York University;New York University;InstaDeep;New York University;Samsung", "aff_domain": ";nyu.edu;nyu.edu;nyu.edu;instadeep.com;nyu.edu;samsung.com", "position": ";Associate Professor;Professor;Associate Professor;Researcher;PhD student;Researcher", "bibtex": "@misc{\ndhyani2024privit,\ntitle={PriViT: Vision Transformers for Fast Private Inference},\nauthor={Naren Dhyani and Jianqiao Cambridge Mo and Minsu Cho and Ameya Joshi and Siddharth Garg and Brandon Reagen and Chinmay Hegde},\nyear={2024},\nurl={https://openreview.net/forum?id=8w6FzR68DS}\n}", "github": "", "project": "", "reviewers": "pfyb;HTX8;y916;BazG", "site": "https://openreview.net/forum?id=8w6FzR68DS", "pdf_size": 686634, "rating": "5;5;5;6", "confidence": "3;2;3;3", "soundness": "3;2;2;3", "contribution": "2;2;2;3", "presentation": "2;3;2;2", "wc_summary": "68;55;25;81", "wc_strengths": "27;38;20;39", "wc_weaknesses": "23;15;80;405", "wc_questions": "413;51;11;16", "wc_review": "531;159;136;541", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "685;285;438;458", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 5.25, 0.4330127018922193 ], "confidence_avg": [ 2.75, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 57.25, 20.765054779605084 ], "wc_strengths_avg": [ 31.0, 7.905694150420948 ], "wc_weaknesses_avg": [ 130.75, 160.3096612809097 ], "wc_questions_avg": [ 122.75, 168.28305767367075 ], "wc_review_avg": [ 341.75, 194.45227563595137 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 466.5, 142.8014355670138 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": 0.3333333333333333, "gs_citation": 4, "gs_cited_by_link": 
"https://scholar.google.com/scholar?cites=5350038279028032370&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 3, "aff_unique_index": "0;0;0;1;0;2", "aff_unique_norm": "New York University;InstaDeep;Samsung", "aff_unique_dep": ";;Samsung", "aff_unique_url": "https://www.nyu.edu;https://www.instadeep.com;https://www.samsung.com", "aff_unique_abbr": "NYU;InstaDeep;Samsung", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;1;0;2", "aff_country_unique": "United States;United Kingdom;South Korea" }, { "id": "8wFNfTxM6i", "title": "LegoNet: Piecing Together and Breaking Apart Sub-Networks for Scalable Multi-task Learning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Despite considerable progress in general-purpose vision models, most efforts focus on designing a new unified structure that can handle different types of input and supervision. In contrast, we believe each vision task requires its specific designed module to use different forms of perception. For example, a feature pyramid network is commonly used in segmentation but not in classification. We present LegoNet, a general Multi-Task Learning (MTL) framework that is assembled with many small sub-networks from different vision tasks, similar to how Lego pieces can be pieced together into larger structures. By leveraging this property, LegoNet can borrow design elements from single-task models and combine them to create a scalable multi-task model. We demonstrate its efficiency on mainstream vision datasets such as ImageNet, COCO, and ADE20K, and show it achieves comparable results to state-of-the-art single-task models. Moreover, like a Lego creation capable of dynamically piecing together or breaking apart pieces, our model exhibits scalability in both its model capacity and adaptability to a multitude of tasks. It can remove sub-networks and decompose into high-performing components for efficient adaptation, or add sub-networks for learning new tasks in a continuous learning scenario. On downstream tasks, it can be fine-tuned with fewer training parameters, fewer model parameters, and even transformed to a low computation shape. 
These functions can be controlled and combined to meet various demands of downstream applications.", "keywords": "multi-task learning; continuous learning; efficient adaptation", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "/attachment/874e946be23562ebbaa2ee3abab93bd90e5941ff.pdf", "author": "Zitian Chen;Mingyu Ding;Yikang Shen;Wei Zhan;Erik Learned-Miller;Chuang Gan", "authorids": "~Zitian_Chen1;~Mingyu_Ding1;~Yikang_Shen1;~Wei_Zhan2;~Erik_Learned-Miller2;~Chuang_Gan1", "gender": "M;M;M;;;M", "homepage": "http://chenzt.net/;https://dingmyu.github.io/;;;;http://people.csail.mit.edu/ganchuang/", "dblp": "218/6728;188/5243;152/8226;;;139/6993", "google_scholar": "n6rhKWQAAAAJ;w4yTWwoAAAAJ;qff5rRYAAAAJ;;;PTeSCbIAAAAJ", "orcid": ";0000-0001-6556-8359;;;;", "linkedin": ";dingmyu/;;;;", "or_profile": "~Zitian_Chen1;~Mingyu_Ding1;~Yikang_Shen1;~Wei_Zhan2;~Erik_Learned-Miller2;~Chuang_Gan1", "aff": "University of Massachusetts, Amherst;University of California, Berkeley;International Business Machines;;;University of Massachusetts at Amherst", "aff_domain": "umass.edu;berkeley.edu;ibm.com;;;umass.edu", "position": "PhD student;Postdoc;Researcher;;;Assistant Professor", "bibtex": "@misc{\nchen2024legonet,\ntitle={LegoNet: Piecing Together and Breaking Apart Sub-Networks for Scalable Multi-task Learning},\nauthor={Zitian Chen and Mingyu Ding and Yikang Shen and Wei Zhan and Erik Learned-Miller and Chuang Gan},\nyear={2024},\nurl={https://openreview.net/forum?id=8wFNfTxM6i}\n}", "github": "", "project": "", "reviewers": "MPaF;pEdg;thbj", "site": "https://openreview.net/forum?id=8wFNfTxM6i", "pdf_size": 3383459, "rating": "5;5;8", "confidence": "5;4;4", "soundness": "2;3;3", "contribution": "2;2;3", "presentation": "3;3;3", "wc_summary": "91;126;102", "wc_strengths": "88;55;44", "wc_weaknesses": "237;346;140", "wc_questions": "59;2;383", "wc_review": "475;529;669", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 6.0, 1.4142135623730951 ], "confidence_avg": [ 4.333333333333333, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 106.33333333333333, 14.613540144521982 ], "wc_strengths_avg": [ 62.333333333333336, 18.696404883173543 ], "wc_weaknesses_avg": [ 241.0, 84.14669730100324 ], "wc_questions_avg": [ 148.0, 167.7915373312969 ], "wc_review_avg": [ 557.6666666666666, 81.75301557469031 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 3, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.5, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:MjM1bo8Q1VcJ:scholar.google.com/&scioq=LegoNet:+Piecing+Together+and+Breaking+Apart+Sub-Networks+for+Scalable+Multi-task+Learning&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1;2;0", "aff_unique_norm": "University of Massachusetts Amherst;University of California, Berkeley;International Business Machines Corporation", "aff_unique_dep": ";;", "aff_unique_url": "https://www.umass.edu;https://www.berkeley.edu;https://www.ibm.com", "aff_unique_abbr": "UMass Amherst;UC Berkeley;IBM", "aff_campus_unique_index": "0;1;0", "aff_campus_unique": "Amherst;Berkeley;", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": 
"United States" }, { "title": "MUSTARD: Mastering Uniform Synthesis of Theorem and Proof Data", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19310", "id": "8xliOUg9EW", "author_site": "Yinya Huang, Xiaohan Lin, Zhengying Liu, Qingxing Cao, Huajian Xin, Haiming Wang, Zhenguo Li, Linqi Song, Xiaodan Liang", "tldr": "", "abstract": "Recent large language models (LLMs) have witnessed significant advancement in various tasks, including mathematical reasoning and theorem proving. As these two tasks require strict and formal multi-step inference, they are appealing domains for exploring the reasoning ability of LLMs but still face important challenges. Previous studies such as Chain-of-Thought (CoT) have revealed the effectiveness of intermediate steps guidance. However, such step-wise annotation requires heavy labor, leading to insufficient training steps for current benchmarks. To fill this gap, this work introduces MUSTARD, a data generation framework that masters uniform synthesis of theorem and proof data of high quality and diversity. MUSTARD synthesizes data in three stages: (1) It samples a few mathematical concept seeds as the problem category. (2) Then, it prompts a generative language model with the sampled concepts to obtain both the problems and their step-wise formal solutions. (3) Lastly, the framework utilizes a proof assistant (e.g., Lean Prover) to filter the valid proofs. With the proposed MUSTARD, we present a theorem-and-proof benchmark MUSTARDSAUCE with 5,866 valid data points. Each data point contains an informal statement, an informal proof, and a translated formal proof that passes the prover validation. We perform extensive analysis and demonstrate that MUSTARD generates validated high-quality step-by-step data. We further apply the MUSTARDSAUCE for fine-tuning smaller language models. The fine-tuned Llama 2-7B achieves a 15.41% average relative performance gain in automated theorem proving, and 8.18% in math word problems. 
Codes and data are available at https://github.com/Eleanor-H/MUSTARD.", "keywords": "theorem proving;math word problem;mathematical reasoning;benchmark", "primary_area": "datasets and benchmarks", "supplementary_material": "/attachment/d03852344e1e4ab8a88a1ab90ae3d42a901c6322.zip", "author": "Yinya Huang;Xiaohan Lin;Zhengying Liu;Qingxing Cao;Huajian Xin;Haiming Wang;Zhenguo Li;Linqi Song;Xiaodan Liang", "authorids": "~Yinya_Huang1;~Xiaohan_Lin2;~Zhengying_Liu2;~Qingxing_Cao1;~Huajian_Xin1;~Haiming_Wang1;~Zhenguo_Li1;~Linqi_Song1;~Xiaodan_Liang2", "gender": ";M;M;M;M;M;M;M;F", "homepage": "https://eleanor-h.github.io/;https://xiaohlim.github.io/;;;https://xinhuajian.wordpress.com/;;http://www.ee.columbia.edu/~zgli/;https://sites.google.com/site/aisquaredlab/;https://www.sysu-hcp.net/", "dblp": "282/1562;;241/1782;149/7615;356/3551;97/604;23/6479;137/7963.html;", "google_scholar": "dWStaRIAAAAJ;;http:// DFme0joAAAAJ;flOBrd8AAAAJ;E5M9x8wAAAAJ;zDPqP6AAAAAJ;XboZC1AAAAAJ;UcGN3MoAAAAJ;voxznZAAAAAJ", "orcid": "0000-0002-0686-0832;;;;;;;0000-0003-2756-4984;", "linkedin": ";;;;;;;;", "or_profile": "~Yinya_Huang1;~Xiaohan_Lin2;~Zhengying_Liu2;~Qingxing_Cao1;~Huajian_Xin1;~Haiming_Wang1;~Zhenguo_Li1;~Linqi_Song1;~Xiaodan_Liang2", "aff": "City University of Hong Kong;SUN YAT-SEN UNIVERSITY;Huawei Technologies Ltd.;SUN YAT-SEN UNIVERSITY, Tsinghua University;University of Edinburgh, University of Edinburgh;SUN YAT-SEN UNIVERSITY;Huawei Noah's Ark Lab;City University of Hong Kong;SUN YAT-SEN UNIVERSITY", "aff_domain": "cityu.edu.hk;sysu.edu.cn;huawei.com;sysu.edu.cn;ed.ac.uk;sysu.edu.cn;huawei.com;cityu.edu.hk;sysu.edu.cn", "position": "Postdoc;MS student;Researcher;Postdoc;PhD student;PhD student;Principal Researcher;Assistant Professor;Associate Professor", "bibtex": "@inproceedings{\nhuang2024mustard,\ntitle={{MUSTARD}: Mastering Uniform Synthesis of Theorem and Proof Data},\nauthor={Yinya Huang and Xiaohan Lin and Zhengying Liu and Qingxing Cao and Huajian Xin and Haiming Wang and Zhenguo Li and Linqi Song and Xiaodan Liang},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=8xliOUg9EW}\n}", "github": "", "project": "", "reviewers": "9Wae;Mb77;LURb", "pdf_size": 2708190, "rating": "6;8;8", "confidence": "4;4;4", "soundness": "3;4;3", "contribution": "2;3;3", "presentation": "3;3;3", "wc_summary": "58;62;139", "wc_strengths": "137;90;48", "wc_weaknesses": "341;34;41", "wc_questions": "48;21;81", "wc_review": "584;207;309", "wc_reply_reviewers": "34;13;79", "wc_reply_authors": "3110;1393;1246", "reply_reviewers": "1;1;1", "reply_authors": "8;3;4", "rating_avg": [ 7.333333333333333, 0.9428090415820634 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 3.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 86.33333333333333, 37.27674282385138 ], "wc_strengths_avg": [ 91.66666666666667, 36.353205574688396 ], "wc_weaknesses_avg": [ 138.66666666666666, 143.09980976771269 ], "wc_questions_avg": [ 50.0, 24.535688292770594 ], "wc_review_avg": [ 366.6666666666667, 159.2196246977391 ], "wc_reply_reviewers_avg": [ 42.0, 27.53179979587241 ], "wc_reply_authors_avg": [ 1916.3333333333333, 846.1805691195914 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 5.0, 2.160246899469287 ], "replies_avg": [ 26, 0 ], "authors#_avg": [ 9, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 26, "gs_cited_by_link": 
"https://scholar.google.com/scholar?cites=16858387062816034025&as_sdt=5,24&sciodt=0,24&hl=en", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=8xliOUg9EW", "pdf": "https://openreview.net/pdf?id=8xliOUg9EW", "email": "cityu.edu.hk;sysu.edu.cn;huawei.com;sysu.edu.cn;ed.ac.uk;sysu.edu.cn;huawei.com;cityu.edu.hk;sysu.edu.cn", "author_num": 9, "aff_unique_index": "0;1;2;1;3;1;2;0;1", "aff_unique_norm": "City University of Hong Kong;Sun Yat-sen University;Huawei;University of Edinburgh", "aff_unique_dep": ";;Huawei Technologies;", "aff_unique_url": "https://www.cityu.edu.hk;http://www.sysu.edu.cn;https://www.huawei.com;https://www.ed.ac.uk", "aff_unique_abbr": "CityU;SYSU;Huawei;Edinburgh", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Hong Kong SAR;", "aff_country_unique_index": "0;0;0;0;1;0;0;0;0", "aff_country_unique": "China;United Kingdom" }, { "id": "8y5vlBuRll", "title": "Efficient Action Robust Reinforcement Learning with Probabilistic Policy Execution Uncertainty", "track": "main", "status": "Reject", "tldr": "", "abstract": "Robust reinforcement learning (RL) aims to find a policy that optimizes the worst-case performance in the face of uncertainties. In this paper, we focus on action robust RL with the probabilistic policy execution uncertainty, in which, instead of always carrying out the action specified by the policy, the agent will take the action specified by the policy with probability $1-\\rho$ and an alternative adversarial action with probability $\\rho$. We establish the existence of an optimal policy on the action robust MDPs with probabilistic policy execution uncertainty and provide the action robust Bellman optimality equation for its solution. Furthermore, we develop Action Robust Reinforcement Learning with Certificates (ARRLC) algorithm that achieves minimax optimal regret and sample complexity. 
Furthermore, we conduct numerical experiments to validate our approach's robustness, demonstrating that ARRLC outperforms non-robust RL algorithms and converges faster than the robust TD algorithm in the presence of action perturbations.", "keywords": "Robust Reinforcement Learning;Sample Complexity", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/520f7198cec22e28b38e1179fd69d77d07cf004e.zip", "author": "Guanlin Liu;Zhihan Zhou;Han Liu;Lifeng Lai", "authorids": "~Guanlin_Liu1;~Zhihan_Zhou1;~Han_Liu4;~Lifeng_Lai1", "gender": "M;M;;", "homepage": ";http://zhihan1996.github.io/;;", "dblp": "224/9954;226/5688-1.html;;12/4889", "google_scholar": "a7eYJk4AAAAJ;bNerBT8AAAAJ;;gOhaCfUAAAAJ", "orcid": "0000-0002-0595-9398;;;", "linkedin": ";zhihan-zhou-6a057716b/;;", "or_profile": "~Guanlin_Liu1;~Zhihan_Zhou1;~Han_Liu4;~Lifeng_Lai1", "aff": "University of California, Davis;Northwestern University;Northwestern University;University of California, Davis", "aff_domain": "ucdavis.edu;u.northwestern.edu;u.northwestern.edu;ucdavis.edu", "position": "PhD student;PhD student;Associate Professor;Full Professor", "bibtex": "@misc{\nliu2024efficient,\ntitle={Efficient Action Robust Reinforcement Learning with Probabilistic Policy Execution Uncertainty},\nauthor={Guanlin Liu and Zhihan Zhou and Han Liu and Lifeng Lai},\nyear={2024},\nurl={https://openreview.net/forum?id=8y5vlBuRll}\n}", "github": "", "project": "", "reviewers": "wBWc;N6KC;if62", "site": "https://openreview.net/forum?id=8y5vlBuRll", "pdf_size": 3264942, "rating": "5;6;6", "confidence": "4;5;4", "soundness": "2;3;3", "contribution": "2;1;2", "presentation": "1;3;2", "wc_summary": "97;19;82", "wc_strengths": "35;34;36", "wc_weaknesses": "338;227;145", "wc_questions": "137;1;9", "wc_review": "607;281;272", "wc_reply_reviewers": "0;82;16", "wc_reply_authors": "1004;642;693", "reply_reviewers": "0;1;1", "reply_authors": "3;3;2", "rating_avg": [ 5.666666666666667, 0.4714045207910317 ], "confidence_avg": [ 4.333333333333333, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 1.6666666666666667, 0.4714045207910317 ], "presentation_avg": [ 2.0, 0.816496580927726 ], "wc_summary_avg": [ 66.0, 33.793490497431605 ], "wc_strengths_avg": [ 35.0, 0.816496580927726 ], "wc_weaknesses_avg": [ 236.66666666666666, 79.08785550821875 ], "wc_questions_avg": [ 49.0, 62.31104770958892 ], "wc_review_avg": [ 386.6666666666667, 155.84251309860505 ], "wc_reply_reviewers_avg": [ 32.666666666666664, 35.490217744549774 ], "wc_reply_authors_avg": [ 779.6666666666666, 159.98819400887749 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 2.6666666666666665, 0.4714045207910317 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.4999999999999999, "gs_citation": 4, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6122834642764614269&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "aff_unique_index": "0;1;1;0", "aff_unique_norm": "University of California, Davis;Northwestern University", "aff_unique_dep": ";", "aff_unique_url": "https://www.ucdavis.edu;https://www.northwestern.edu", "aff_unique_abbr": "UC Davis;NU", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Davis;", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "id": "8zJevzvk64", "title": "Schrodinger Bridge to Bridge Generative Diffusion Method to Off-Policy Evaluation", "track": "main", "status": "Reject", 
"tldr": "", "abstract": "The problem of off-policy evaluation (OPE) in reinforcement learning (RL), which evaluates a given policy using data collected from a different behavior policy, plays an important role in many real-world applications. The OPE under the model of episodic non-stationary finite-horizon Markov decision process (MDP) has been widely studied. However, the general model-free importance sampling (IS) methods suffer from the curse of horizon and dimensionality, while the improved marginal importance sampling (MIS) can only be restrained to the case where the state space $\\mathcal{S}$ is sufficiently small. The model-based methods often have limited scope of application. To find a widely-applicable OPE algorithm when $\\mathcal{S}$ is continuous and high-dimensional that avoids the curse of horizon and dimensionality, which means the error of the estimator grows exponentially with the number of horizon $H$ and the dimension $d$ of the state space $\\mathcal{S}$, we apply the diffusion Schr\"odinger bridge generative model to construct a model-based estimator (CDSB estimator). Moreover, we established the statistical rate of the estimation error of the value function with a polynomial rate of $O(H^2\\sqrt{d})$, which, to the best of our knowledge, is one of the first theoretical rate results on applying Schr\"odinger bridge to reinforcement learning. This breaks the restraint of the complexity of the state space for OPE under MDP with large horizon and can be applied to various real-life decision problems with continuous setting, which is shown in our simulation using our method in continuous, high-dimensional and long-horizon RL environments and its comparison with other existing algorithms.", "keywords": "off-policy evaluation;Schrodinger bridge problem;diffusion model;generative model", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/8e88ec1313fa2926b2f3fa36bf607b8ec296ccbb.pdf", "author": "Yucong Lin;Liyuan Xu;Haoqun Cao;Hongyi Yuan;Junwei Lu", "authorids": "~Yucong_Lin2;~Liyuan_Xu2;~Haoqun_Cao1;~Hongyi_Yuan1;~Junwei_Lu1", "gender": "M;F;M;M;M", "homepage": ";https://mails.tsinghua.edu.cn;https://kencao2007.github.io/;;https://junwei-lu.github.io/", "dblp": ";;;308/0909;", "google_scholar": "https://scholar.google.com.hk/citations?hl=zh-CN;;;FG3O4i8AAAAJ;", "orcid": "0000-0002-9039-0318;;;;", "linkedin": ";;;;", "or_profile": "~Yucong_Lin2;~Liyuan_Xu2;~Haoqun_Cao1;~Hongyi_Yuan1;~Junwei_Lu1", "aff": "Beijing Institute of Technology;Tsinghua University;Renmin University of China;Tsinghua University;Harvard University", "aff_domain": "bit.edu.cn;tsinghua.edu.cn;ruc.edu.cn;tsinghua.edu.cn;harvard.edu", "position": "Postdoc;Undergrad student;Undergrad student;PhD student;Assistant Professor", "bibtex": "@misc{\nlin2024schrodinger,\ntitle={Schrodinger Bridge to Bridge Generative Diffusion Method to Off-Policy Evaluation},\nauthor={Yucong Lin and Liyuan Xu and Haoqun Cao and Hongyi Yuan and Junwei Lu},\nyear={2024},\nurl={https://openreview.net/forum?id=8zJevzvk64}\n}", "github": "", "project": "", "reviewers": "p1r4;VmGz;CNAs;ijeG", "site": "https://openreview.net/forum?id=8zJevzvk64", "pdf_size": 371040, "rating": "3;3;3;5", "confidence": "4;3;3;2", "soundness": "2;3;2;3", "contribution": "1;1;1;2", "presentation": "2;2;2;2", "wc_summary": "72;87;47;59", "wc_strengths": "92;22;21;37", "wc_weaknesses": "512;35;318;110", "wc_questions": "16;350;275;163", "wc_review": "692;494;661;369", "wc_reply_reviewers": "0;127;0;0", "wc_reply_authors": 
"323;761;593;203", "reply_reviewers": "0;1;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 3.5, 0.8660254037844386 ], "confidence_avg": [ 3.0, 0.7071067811865476 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 1.25, 0.4330127018922193 ], "presentation_avg": [ 2.0, 0.0 ], "wc_summary_avg": [ 66.25, 14.889173919328098 ], "wc_strengths_avg": [ 43.0, 28.991378028648448 ], "wc_weaknesses_avg": [ 243.75, 186.37110156888593 ], "wc_questions_avg": [ 201.0, 125.84315634948132 ], "wc_review_avg": [ 554.0, 130.68856109086212 ], "wc_reply_reviewers_avg": [ 31.75, 54.99261314031185 ], "wc_reply_authors_avg": [ 470.0, 219.49259668608414 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.816496580927726, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:vna5OldSG5IJ:scholar.google.com/&scioq=Schrodinger+Bridge+to+Bridge+Generative+Diffusion+Method+to+Off-Policy+Evaluation&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1;2;1;3", "aff_unique_norm": "Beijing Institute of Technology;Tsinghua University;Renmin University of China;Harvard University", "aff_unique_dep": ";;;", "aff_unique_url": "http://www.bit.edu.cn/;https://www.tsinghua.edu.cn;http://www.ruc.edu.cn;https://www.harvard.edu", "aff_unique_abbr": "BIT;THU;RUC;Harvard", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;1", "aff_country_unique": "China;United States" }, { "id": "90QOM1xB88", "title": "Improved order analysis and design of exponential integrator for diffusion models sampling", "track": "main", "status": "Reject", "tldr": "", "abstract": "Efficient differential equation solvers have significantly reduced the sampling time of diffusion models (DMs) while retaining high sampling quality. Among these solvers, exponential integrators (EI) have gained prominence by demonstrating state-of-the-art performance. However, existing high-order EI-based sampling algorithms rely on degenerate EI solvers, resulting in inferior error bounds and reduced accuracy in contrast to the theoretically anticipated results under optimal settings. This situation makes the sampling quality extremely vulnerable to seemingly innocuous design choices such as timestep schedules. For example, an inefficient timestep scheduler might necessitate twice the number of steps to achieve a quality comparable to that obtained through carefully optimized timesteps. To address this issue, we reevaluate the design of high-order differential solvers for DMs. Through a thorough order analysis, we reveal that the degeneration of existing high-order EI solvers can be attributed to the absence of essential order conditions. By reformulating the differential equations in DMs and capitalizing on the theory of exponential integrators, we propose refined EI solvers that fulfill all the order conditions, which we designate as Refined Exponential Solver (RES). Utilizing these improved solvers, RES exhibits more favorable error bounds theoretically and achieves superior sampling efficiency and stability in practical applications. 
For instance, a simple switch from the single-step DPM-Solver++ to our order-satisfied numerical scheme when NFE$=9$, results in a reduction of numerical defects by 25.2 and FID improvement of 25.4 (16.77 vs 12.51) on a pre-trained ImageNet diffusion model.", "keywords": "diffusion model;order analysis;fast sampling", "primary_area": "generative models", "supplementary_material": "", "author": "Qinsheng Zhang;Jiaming Song;Yongxin Chen", "authorids": "~Qinsheng_Zhang1;~Jiaming_Song1;~Yongxin_Chen1", "gender": "M;M;M", "homepage": "https://qsh-zh.github.io/;http://tsong.me;https://yongxin.ae.gatech.edu/", "dblp": ";173/5104;", "google_scholar": ";;X8BYiV4AAAAJ", "orcid": ";;", "linkedin": ";jiamings/;", "or_profile": "~Qinsheng_Zhang1;~Jiaming_Song1;~Yongxin_Chen1", "aff": "Georgia Institute of Technology;Luma AI;Georgia Institute of Technology", "aff_domain": "gatech.edu;lumalabs.ai;gatech.edu", "position": "PhD student;Chief Scientist;Associate Professor", "bibtex": "@misc{\nzhang2024improved,\ntitle={Improved order analysis and design of exponential integrator for diffusion models sampling},\nauthor={Qinsheng Zhang and Jiaming Song and Yongxin Chen},\nyear={2024},\nurl={https://openreview.net/forum?id=90QOM1xB88}\n}", "github": "", "project": "", "reviewers": "XmiM;xZkC;kkMa", "site": "https://openreview.net/forum?id=90QOM1xB88", "pdf_size": 12230407, "rating": "3;6;6", "confidence": "4;4;2", "soundness": "3;3;3", "contribution": "1;3;3", "presentation": "2;2;3", "wc_summary": "83;34;51", "wc_strengths": "63;76;47", "wc_weaknesses": "416;81;63", "wc_questions": "37;177;15", "wc_review": "599;368;176", "wc_reply_reviewers": "246;42;0", "wc_reply_authors": "1180;586;399", "reply_reviewers": "1;1;0", "reply_authors": "3;2;2", "rating_avg": [ 5.0, 1.4142135623730951 ], "confidence_avg": [ 3.3333333333333335, 0.9428090415820634 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.3333333333333335, 0.9428090415820634 ], "presentation_avg": [ 2.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 56.0, 20.314198646923455 ], "wc_strengths_avg": [ 62.0, 11.86029791643813 ], "wc_weaknesses_avg": [ 186.66666666666666, 162.3295687448497 ], "wc_questions_avg": [ 76.33333333333333, 71.74646719912803 ], "wc_review_avg": [ 381.0, 172.9335132355785 ], "wc_reply_reviewers_avg": [ 96.0, 107.44300814850634 ], "wc_reply_authors_avg": [ 721.6666666666666, 332.9607918192304 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 2.3333333333333335, 0.4714045207910317 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.5000000000000001, "gs_citation": 11, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=8888918704360335549&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "aff_unique_index": "0;1;0", "aff_unique_norm": "Georgia Institute of Technology;Luma AI", "aff_unique_dep": ";", "aff_unique_url": "https://www.gatech.edu;https://www.luma.ai", "aff_unique_abbr": "Georgia Tech;Luma AI", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "title": "Learning Flexible Body Collision Dynamics with Hierarchical Contact Mesh Transformer", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19309", "id": "90yw2uM6J5", "author_site": "Youn-Yeol Yu, Jeongwhan Choi, Woojin Cho, Kookjin Lee, Nayong Kim, Kiseok Chang, ChangSeung Woo, ILHO KIM, SeokWoo Lee, Joon Young Yang, SOOYOUNG YOON, Noseong Park", "tldr": "", 
"abstract": "Recently, many mesh-based graph neural network (GNN) models have been proposed for modeling complex high-dimensional physical systems. Remarkable achievements have been made in significantly reducing the solving time compared to traditional numerical solvers. These methods are typically designed to i) reduce the computational cost in solving physical dynamics and/or ii) propose techniques to enhance the solution accuracy in fluid and rigid body dynamics. However, it remains under-explored whether they are effective in addressing the challenges of flexible body dynamics, where instantaneous collisions occur within a very short timeframe. In this paper, we present Hierarchical Contact Mesh Transformer (HCMT), which uses hierarchical mesh structures and can learn long-range dependencies (occurred by collisions) among spatially distant positions of a body --- two close positions in a higher-level mesh correspond to two distant positions in a lower-level mesh. HCMT enables long-range interactions, and the hierarchical mesh structure quickly propagates collision effects to faraway positions. To this end, it consists of a contact mesh Transformer and a hierarchical mesh Transformer (CMT and HMT, respectively). Lastly, we propose a flexible body dynamics dataset, consisting of trajectories that reflect experimental settings frequently used in the display industry for product designs. We also compare the performance of several baselines using well-known benchmark datasets. Our results show that HCMT provides significant performance improvements over existing methods. Our code is available at https://github.com/yuyudeep/hcmt.", "keywords": "graph transformer;physics-based simulation;mesh;collision;flexible dynamics", "primary_area": "applications to physical sciences (physics, chemistry, biology, etc.)", "supplementary_material": "", "author": "Youn-Yeol Yu;Jeongwhan Choi;Woojin Cho;Kookjin Lee;Nayong Kim;Kiseok Chang;ChangSeung Woo;ILHO KIM;SeokWoo Lee;Joon Young Yang;SOOYOUNG YOON;Noseong Park", "authorids": "~Youn-Yeol_Yu1;~Jeongwhan_Choi1;~Woojin_Cho1;~Kookjin_Lee1;~Nayong_Kim1;~Kiseok_Chang1;~ChangSeung_Woo1;~ILHO_KIM1;~SeokWoo_Lee1;~Joon_Young_Yang1;~SOOYOUNG_YOON1;~Noseong_Park1", "gender": "M;M;M;M;M;M;M;M;M;M;M;", "homepage": "https://sites.google.com/view/npark/home?authuser=0;https://www.jeongwhanchoi.com;https://woojin-cho.github.io/;https://scholar.google.com/citations?hl=en&user=KL89hVQAAAAJ&view_op=list_works;;;https://www.lgdisplay.com/;;https://www.lgdisplay.com;https://www.lgdisplay.com;https://lgdisplay.com;", "dblp": ";39/11215-2;;122/5103;;;;;;;;", "google_scholar": ";3MNElkYAAAAJ;cqIj5tQAAAAJ;https://scholar.google.com/citations?hl=en;;TmbYdlgAAAAJ;;;;;;", "orcid": ";0000-0002-6530-2662;;;;;;;;;;", "linkedin": ";jeongwhanchoi/;woojin-cho-02b905264/;;gh-k-30ba80218/;kiseok-chang-b0869349/?originalSubdomain=kr;;ilho-kim-918093129/?originalSubdomain=kr;;;;", "or_profile": "~Youn-Yeol_Yu1;~Jeongwhan_Choi1;~Woojin_Cho1;~Kookjin_Lee1;~Nayong_Kim1;~Kiseok_Chang1;~ChangSeung_Woo1;~ILHO_KIM1;~SeokWoo_Lee1;~Joon_Young_Yang1;~SOOYOUNG_YOON1;~Noseong_Park1", "aff": "LG Display;Yonsei University;Yonsei University;Arizona State University;LG Display;LG Display;;LG Display Co., Ltd.;LG Display;LG Display;LG Display;", "aff_domain": "lgdisplay.com;yonsei.ac.kr;yonsei.ac.kr;asu.edu;lgdisplay.com;lgdisplay.com;;lgdisplay.com;lgdisplay.com;lgdisplay.com;lgdisplay.com;", "position": "Researcher;PhD student;MS student;Assistant Professor;Researcher;Researcher;;Researcher;Principal 
Researcher;Principal Researcher;Principal Researcher;", "bibtex": "@inproceedings{\nyu2024learning,\ntitle={Learning Flexible Body Collision Dynamics with Hierarchical Contact Mesh Transformer},\nauthor={Youn-Yeol Yu and Jeongwhan Choi and Woojin Cho and Kookjin Lee and Nayong Kim and Kiseok Chang and ChangSeung Woo and ILHO KIM and SeokWoo Lee and Joon Young Yang and SOOYOUNG YOON and Noseong Park},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=90yw2uM6J5}\n}", "github": "", "project": "", "reviewers": "gSaT;zh4D;J9Rp;CgKu", "pdf_size": 14173895, "rating": "6;6;6;6", "confidence": "4;2;3;3", "soundness": "3;2;3;3", "contribution": "3;3;3;3", "presentation": "3;3;3;3", "wc_summary": "114;39;76;69", "wc_strengths": "201;102;84;76", "wc_weaknesses": "639;90;77;2", "wc_questions": "579;417;41;16", "wc_review": "1533;648;278;163", "wc_reply_reviewers": "0;34;0;0", "wc_reply_authors": "3495;1250;602;290", "reply_reviewers": "0;1;0;0", "reply_authors": "6;3;3;2", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 3.0, 0.7071067811865476 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 74.5, 26.706740722147284 ], "wc_strengths_avg": [ 115.75, 50.11175011910879 ], "wc_weaknesses_avg": [ 202.0, 254.5279945310535 ], "wc_questions_avg": [ 263.25, 241.79782360476284 ], "wc_review_avg": [ 655.5, 537.3837083500019 ], "wc_reply_reviewers_avg": [ 8.5, 14.722431864335457 ], "wc_reply_authors_avg": [ 1409.25, 1253.0050628389336 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 3.5, 1.5 ], "replies_avg": [ 23, 0 ], "authors#_avg": [ 12, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 9, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=13358364848196757569&as_sdt=400005&sciodt=0,14&hl=en", "gs_version_total": 8, "openreview": "https://openreview.net/forum?id=90yw2uM6J5", "pdf": "https://openreview.net/pdf?id=90yw2uM6J5", "email": "lgdisplay.com;yonsei.ac.kr;yonsei.ac.kr;asu.edu;lgdisplay.com;lgdisplay.com;;lgdisplay.com;lgdisplay.com;lgdisplay.com;lgdisplay.com;", "author_num": 12, "aff_unique_index": "0;1;1;2;0;0;0;0;0;0", "aff_unique_norm": "LG;Yonsei University;Arizona State University", "aff_unique_dep": "LG Display;;", "aff_unique_url": "https://www.lgdisplay.com;https://www.yonsei.ac.kr;https://www.asu.edu", "aff_unique_abbr": "LG Display;Yonsei;ASU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;1;0;0;0;0;0;0", "aff_country_unique": "South Korea;United States" }, { "id": "91DFSjAva8", "title": "SERA: Sample Efficient Reward Augmentation in offline-to-online Reinforcement Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "A prospective application of offline reinforcement learning (RL) involves initializing a pre-trained policy using existing static datasets for subsequent online fine-tuning. However, direct fine-tuning of the offline pre-trained policy often results in sub-optimal performance. A primary reason is that offline conservative methods diminish the agent's capability of exploration, thereby impacting online fine-tuning performance. To enhance exploration during online fine-tuning and thus enhance the overall online fine-tuning performance, we introduce a generalized reward augmentation framework called Sample Efficient Reward Augmentation (SERA). 
SERA aims to improve the performance of online fine-tuning by designing intrinsic rewards that encourage the agent to explore. Specifically, it implicitly implements State Marginal Matching (SMM) and penalizes out-of-distribution (OOD) state actions, thus encouraging agents to cover the target state density, and achieving better online fine-tuning results. Additionally, SERA can be effortlessly plugged into various RL algorithms to improve online fine-tuning and ensure sustained asymptotic improvement, showing the versatility as well as the effectiveness of SERA. Moreover, extensive experimental results demonstrate that, on offline-to-online problems, SERA consistently and effectively enhances the performance of various offline algorithms.", "keywords": "Reinforcement Learning;Offline-to-Online RL", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/608d32bda01ddc656658dcf526ed2b5d07c812ed.pdf", "author": "Ziqi Zhang;Xiao Xiong;Zifeng Zhuang;Jinxin Liu;Donglin Wang", "authorids": "~Ziqi_Zhang7;~Xiao_Xiong2;~Zifeng_Zhuang1;~Jinxin_Liu1;~Donglin_Wang1", "gender": ";F;M;;M", "homepage": ";https://github.com/SherryHanyu;;;https://milab.westlake.edu.cn/", "dblp": ";;276/5034;;", "google_scholar": ";;;;https://scholar.google.ca/citations?user=-fo6wdwAAAAJ", "orcid": ";;;;0000-0002-8188-3735", "linkedin": ";;;;", "or_profile": "~Ziqi_Zhang7;~Xiao_Xiong2;~Zifeng_Zhuang1;~Jinxin_Liu1;~Donglin_Wang1", "aff": ";University of Cambridge;Zhejiang University;;Westlake University", "aff_domain": ";cam.ac.uk;zju.edu.cn;;westlake.edu.cn", "position": ";MS student;PhD student;;Associate Professor", "bibtex": "@misc{\nzhang2024sera,\ntitle={{SERA}: Sample Efficient Reward Augmentation in offline-to-online Reinforcement Learning},\nauthor={Ziqi Zhang and Xiao Xiong and Zifeng Zhuang and Jinxin Liu and Donglin Wang},\nyear={2024},\nurl={https://openreview.net/forum?id=91DFSjAva8}\n}", "github": "", "project": "", "reviewers": "sGsS;NgYG;zoZX;pDE4", "site": "https://openreview.net/forum?id=91DFSjAva8", "pdf_size": 2039765, "rating": "3;5;5;6", "confidence": "5;3;4;4", "soundness": "2;2;2;3", "contribution": "2;2;2;3", "presentation": "1;2;1;3", "wc_summary": "40;29;61;78", "wc_strengths": "13;12;22;80", "wc_weaknesses": "4;590;341;384", "wc_questions": "468;2;46;3", "wc_review": "525;633;470;545", "wc_reply_reviewers": "0;98;0;26", "wc_reply_authors": "1053;3110;627;710", "reply_reviewers": "0;2;0;1", "reply_authors": "4;9;3;2", "rating_avg": [ 4.75, 1.0897247358851685 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 1.75, 0.82915619758885 ], "wc_summary_avg": [ 52.0, 18.907670401189037 ], "wc_strengths_avg": [ 31.75, 28.12805538959279 ], "wc_weaknesses_avg": [ 329.75, 210.3049868643157 ], "wc_questions_avg": [ 129.75, 196.09484312444323 ], "wc_review_avg": [ 543.25, 58.64458628040614 ], "wc_reply_reviewers_avg": [ 31.0, 40.11234224026316 ], "wc_reply_authors_avg": [ 1375.0, 1014.3517634430375 ], "reply_reviewers_avg": [ 0.75, 0.82915619758885 ], "reply_authors_avg": [ 4.5, 2.692582403567252 ], "replies_avg": [ 28, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.6488856845230502, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=7660073471667830530&as_sdt=5,34&sciodt=0,34&hl=en", "gs_version_total": 2, "aff_unique_index": "0;1;2", "aff_unique_norm": "University of Cambridge;Zhejiang University;Westlake
University", "aff_unique_dep": ";;", "aff_unique_url": "https://www.cam.ac.uk;https://www.zju.edu.cn;https://www.westlake.edu.cn", "aff_unique_abbr": "Cambridge;ZJU;WU", "aff_campus_unique_index": "0", "aff_campus_unique": "Cambridge;", "aff_country_unique_index": "0;1;1", "aff_country_unique": "United Kingdom;China" }, { "title": "On gauge freedom, conservativity and intrinsic dimensionality estimation in diffusion models", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19308", "id": "92KV9xAMhF", "author_site": "Christian Horvat, Jean-Pascal Pfister", "tldr": "", "abstract": "Diffusion models are generative models that have recently demonstrated impressive performances in terms of sampling quality and density estimation in high dimensions. They rely on a forward continuous diffusion process and a backward continuous denoising process, which can be described by a time-dependent vector field and is used as a generative model. In the original formulation of the diffusion model, this vector field is assumed to be the score function (i.e. it is the gradient of the log-probability at a given time in the diffusion process). Curiously, on the practical side, most studies on diffusion models implement this vector field as a neural network function and do not constrain it be the gradient of some energy function (that is, most studies do not constrain the vector field to be conservative). Even though some studies investigated empirically whether such a constraint will lead to a performance gain, they lead to contradicting results and failed to provide analytical results. Here, we provide three analytical results regarding the extent of the modeling freedom of this vector field. {Firstly, we propose a novel decomposition of vector fields into a conservative component and an orthogonal component which satisfies a given (gauge) freedom. Secondly, from this orthogonal decomposition, we show that exact density estimation and exact sampling is achieved when the conservative component is exactly equals to the true score and therefore conservativity is neither necessary nor sufficient to obtain exact density estimation and exact sampling. 
Finally, we show that when it comes to inferring local information of the data manifold, constraining the vector field to be conservative is desirable.", "keywords": "gauge freedom;conservativity;intrinsic dimensionality estimation;diffusion models;explainable AI;theory", "primary_area": "generative models", "supplementary_material": "/attachment/c6a9ea8a3844959d87cafb5e0e69155b41c43a2d.pdf", "author": "Christian Horvat;Jean-Pascal Pfister", "authorids": "~Christian_Horvat1;~Jean-Pascal_Pfister1", "gender": "M;M", "homepage": "https://physio.unibe.ch/~pfister/group/;https://physio.unibe.ch/~pfister/group/", "dblp": "293/8018;33/921", "google_scholar": "LpRirZAAAAAJ;https://scholar.google.co.uk/citations?user=mzUYoLgAAAAJ", "orcid": ";0000-0002-1847-3389", "linkedin": ";jean-pascal-pfister-840a7a1/", "or_profile": "~Christian_Horvat1;~Jean-Pascal_Pfister1", "aff": "Theoretical Neuroscience;Department of Physiology, Universit\u00e4t Bern", "aff_domain": "unibe.ch;unibe.ch", "position": "Postdoc;Assistant Professor", "bibtex": "@inproceedings{\nhorvat2024on,\ntitle={On gauge freedom, conservativity and intrinsic dimensionality estimation in diffusion models},\nauthor={Christian Horvat and Jean-Pascal Pfister},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=92KV9xAMhF}\n}", "github": "", "project": "", "reviewers": "ovjk;pZCv;h3ie;KRsj", "pdf_size": 5143768, "rating": "5;6;8;8", "confidence": "4;3;5;4", "soundness": "3;2;4;2", "contribution": "2;2;3;2", "presentation": "2;2;4;3", "wc_summary": "131;194;65;105", "wc_strengths": "45;56;61;58", "wc_weaknesses": "51;297;515;172", "wc_questions": "375;191;380;133", "wc_review": "602;738;1021;468", "wc_reply_reviewers": "0;124;14;167", "wc_reply_authors": "288;583;87;156", "reply_reviewers": "0;2;1;1", "reply_authors": "1;3;1;1", "rating_avg": [ 6.75, 1.299038105676658 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.75, 0.82915619758885 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.82915619758885 ], "wc_summary_avg": [ 123.75, 46.87949978402073 ], "wc_strengths_avg": [ 55.0, 6.041522986797286 ], "wc_weaknesses_avg": [ 258.75, 171.61930981098834 ], "wc_questions_avg": [ 269.75, 109.69816543589049 ], "wc_review_avg": [ 707.25, 204.75763111542386 ], "wc_reply_reviewers_avg": [ 76.25, 71.07170674748144 ], "wc_reply_authors_avg": [ 278.5, 190.05854361222492 ], "reply_reviewers_avg": [ 1.0, 0.7071067811865476 ], "reply_authors_avg": [ 1.5, 0.8660254037844386 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.5443310539518174, "gs_citation": 9, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=8157807008404479797&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=92KV9xAMhF", "pdf": "https://openreview.net/pdf?id=92KV9xAMhF", "email": "unibe.ch;unibe.ch", "author_num": 2, "aff_unique_index": "0;1", "aff_unique_norm": "Theoretical Neuroscience;University of Bern", "aff_unique_dep": "Neuroscience Department;Department of Physiology", "aff_unique_url": ";https://www.unibe.ch", "aff_unique_abbr": ";UniBE", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "1", "aff_country_unique": ";Switzerland" }, { "title": "SPDER: Semiperiodic Damping-Enabled Object Representation", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19307", "id": "92btneN9Wm",
"author_site": "Kathan Shah, Chawin Sitawarin", "tldr": "", "abstract": "We present a neural network architecture designed to naturally learn a positional embedding and overcome the spectral bias towards lower frequencies faced by conventional implicit neural representation networks. Our proposed architecture, SPDER, is a simple MLP that uses an activation function composed of a sinusoidal multiplied by a sublinear function, called the damping function. The sinusoidal enables the network to automatically learn the positional embedding of an input coordinate while the damping passes on the actual coordinate value by preventing it from being projected down to within a finite range of values. Our results indicate that SPDERs speed up training by 10 times and converge to losses 1,500 to 50,000 times lower than that of the state-of-the-art for image representation. SPDER is also state-of-the-art in audio representation. The superior representation capability allows SPDER to also excel on multiple downstream tasks such as image super-resolution and video frame interpolation. We provide intuition as to why SPDER significantly improves fitting compared to that of other INR methods while requiring no hyperparameter tuning or preprocessing. See code at https://github.com/katop1234/SPDER.", "keywords": "Implicit neural representations;spectral bias;computer vision;neural network architectures;activations;image representation;edge detection", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/8939af26ae9c398e386ecddf5fad22e5efa128f5.zip", "author": "Kathan Shah;Chawin Sitawarin", "authorids": "~Kathan_Shah1;~Chawin_Sitawarin1", "gender": "M;M", "homepage": ";https://chawins.github.io/", "dblp": ";211/7105", "google_scholar": "xRpZ_sgAAAAJ;https://scholar.google.com/citations?hl=en", "orcid": ";0000-0002-4949-9661", "linkedin": "kathans/;chawins/", "or_profile": "~Kathan_Shah1;~Chawin_Sitawarin1", "aff": "University of California, Berkeley;University of California, Berkeley", "aff_domain": "berkeley.edu;berkeley.edu", "position": "Undergrad student;PhD student", "bibtex": "@inproceedings{\nshah2024spder,\ntitle={{SPDER}: Semiperiodic Damping-Enabled Object Representation},\nauthor={Kathan Shah and Chawin Sitawarin},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=92btneN9Wm}\n}", "github": "", "project": "", "reviewers": "TKxh;V9Ce;9hcy", "pdf_size": 4004295, "rating": "5;6;8", "confidence": "4;4;3", "soundness": "2;2;3", "contribution": "3;3;2", "presentation": "4;3;3", "wc_summary": "98;97;49", "wc_strengths": "134;44;76", "wc_weaknesses": "302;20;155", "wc_questions": "257;28;43", "wc_review": "791;189;323", "wc_reply_reviewers": "0;0;6", "wc_reply_authors": "582;183;558", "reply_reviewers": "0;0;1", "reply_authors": "1;1;1", "rating_avg": [ 6.333333333333333, 1.247219128924647 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 3.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 81.33333333333333, 22.866763848189994 ], "wc_strengths_avg": [ 84.66666666666667, 37.249906785863985 ], "wc_weaknesses_avg": [ 159.0, 115.16075720487426 ], "wc_questions_avg": [ 109.33333333333333, 104.5955172185798 ], "wc_review_avg": [ 434.3333333333333, 258.0663136138117 ], 
"wc_reply_reviewers_avg": [ 2.0, 2.8284271247461903 ], "wc_reply_authors_avg": [ 441.0, 182.69646958822165 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 9, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.944911182523068, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12155969879033561286&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=92btneN9Wm", "pdf": "https://openreview.net/pdf?id=92btneN9Wm", "email": "berkeley.edu;berkeley.edu", "author_num": 2, "aff_unique_index": "0;0", "aff_unique_norm": "University of California, Berkeley", "aff_unique_dep": "", "aff_unique_url": "https://www.berkeley.edu", "aff_unique_abbr": "UC Berkeley", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Berkeley", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "id": "92yrETgM6G", "title": "Calibration Attack: A Framework For Adversarial Attacks Targeting Calibration", "track": "main", "status": "Reject", "tldr": "", "abstract": "We introduce a new framework of adversarial attacks, named calibration attacks, in which the attacks are generated and organized to trap victim models to be miscalibrated without altering their original accuracy, hence seriously endangering the trustworthiness of the models and any decision-making based on their confidence scores. Specifically, we identify four novel forms of calibration attacks: underconfidence attacks, overconfidence attacks, maximum miscalibration attacks, and random confidence attacks, in both the black-box and white-box setups. We then test these new attacks on typical victim models with comprehensive datasets, demonstrating that even with a relatively low number of queries, the attacks can create significant calibration mistakes. We further provide detailed analyses to understand different aspects of calibration attacks. 
Building on that, we investigate the effectiveness of widely used adversarial defences and calibration methods against these types of attacks, which then inspires us to devise two novel defences against such calibration attacks.", "keywords": "robustness;calibration;deep learning;image classification;adversarial", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "Stephen Obadinma;Xiaodan Zhu;Hongyu Guo", "authorids": "~Stephen_Obadinma1;~Xiaodan_Zhu1;~Hongyu_Guo1", "gender": "M;M;M", "homepage": ";http://www.xiaodanzhu.com;https://hongyuharryguo.github.io/", "dblp": "271/8187;93/310.html;", "google_scholar": "https://scholar.google.ca/citations?user=bRbQBNsAAAAJ;https://scholar.google.ca/citations?user=a6MYnuUAAAAJ;https://scholar.google.ca/citations?user=bZUqlakAAAAJ", "orcid": ";0000-0003-3856-3696;", "linkedin": ";xiaodan-zhu-066833101/?originalSubdomain=ca;harry-h-y-guo-a582087/", "or_profile": "~Stephen_Obadinma1;~Xiaodan_Zhu1;~Hongyu_Guo1", "aff": "Queen's University;Queen's University;National Research Council Canada", "aff_domain": "queensu.ca;queensu.ca;nrc-cnrc.gc.ca", "position": "PhD student;Associate Professor;Senior Research Officer", "bibtex": "@misc{\nobadinma2024calibration,\ntitle={Calibration Attack: A Framework For Adversarial Attacks Targeting Calibration},\nauthor={Stephen Obadinma and Xiaodan Zhu and Hongyu Guo},\nyear={2024},\nurl={https://openreview.net/forum?id=92yrETgM6G}\n}", "github": "", "project": "", "reviewers": "YLZS;BDLx;PTEC;LAwv", "site": "https://openreview.net/forum?id=92yrETgM6G", "pdf_size": 2622314, "rating": "1;5;5;5", "confidence": "3;3;3;4", "soundness": "3;4;3;3", "contribution": "1;3;2;2", "presentation": "1;2;3;3", "wc_summary": "112;121;106;62", "wc_strengths": "97;30;96;64", "wc_weaknesses": "476;3;168;144", "wc_questions": "178;243;65;46", "wc_review": "863;397;435;316", "wc_reply_reviewers": "247;0;0;0", "wc_reply_authors": "603;151;490;295", "reply_reviewers": "1;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 4.0, 1.7320508075688772 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 2.25, 0.82915619758885 ], "wc_summary_avg": [ 100.25, 22.71976012197312 ], "wc_strengths_avg": [ 71.75, 27.517040175135115 ], "wc_weaknesses_avg": [ 197.75, 172.57226747076137 ], "wc_questions_avg": [ 133.0, 81.11411714368838 ], "wc_review_avg": [ 502.75, 212.3845274496238 ], "wc_reply_reviewers_avg": [ 61.75, 106.95413736737817 ], "wc_reply_authors_avg": [ 384.75, 174.2159220622501 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.3333333333333333, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=13536272327202876115&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 0, "aff_unique_index": "0;0;1", "aff_unique_norm": "Queen's University;National Research Council Canada", "aff_unique_dep": ";", "aff_unique_url": "https://www.queensu.ca;https://www.nrc-cnrc.gc.ca", "aff_unique_abbr": "Queen's;NRC-CNRC", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "Canada" }, { "title": "Hybrid Internal Model: Learning Agile Legged Locomotion with Simulated Robot Response", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19306", "id": 
"93LoCyww8o", "author_site": "Junfeng Long, ZiRui Wang, Quanyi Li, Liu Cao, Jiawei Gao, Jiangmiao Pang", "tldr": "", "abstract": "Robust locomotion control depends on accurate state estimations. However, the sensors of most legged robots can only provide partial and noisy observations, making the estimation particularly challenging, especially for external states like terrain frictions and elevation maps. Inspired by the classical Internal Model Control principle, we consider these external states as disturbances and introduce Hybrid Internal Model (HIM) to estimate them according to the response of the robot. The response, which we refer to as the hybrid internal embedding, contains the robot\u2019s explicit velocity and implicit stability representation, corresponding to two primary goals for locomotion tasks: explicitly tracking velocity and implicitly maintaining stability. We use contrastive learning to optimize the embedding to be close to the robot\u2019s successor state, in which the response is naturally embedded. HIM has several appealing benefits: It only needs the robot\u2019s proprioceptions, i.e., those from joint encoders and IMU as observations. It innovatively maintains consistent observations between simulation reference and reality that avoids information loss in mimicking learning. It exploits batch-level information that is more robust to noises and keeps better sample efficiency. It only requires 1 hour of training on an RTX 4090 to enable a quadruped robot to traverse any terrain under any disturbances. A wealth of real-world experiments demonstrates its agility, even in high-difficulty tasks and cases never occurred during the training process, revealing remarkable open-world generalizability.", "keywords": "Reinforcement Learning;Quadrupedal Locomotion;Internal Model", "primary_area": "applications to robotics, autonomy, planning", "supplementary_material": "", "author": "Junfeng Long;ZiRui Wang;Quanyi Li;Liu Cao;Jiawei Gao;Jiangmiao Pang", "authorids": "~Junfeng_Long1;~ZiRui_Wang8;~Quanyi_Li1;~Liu_Cao1;~Jiawei_Gao1;~Jiangmiao_Pang1", "gender": "M;M;M;M;M;M", "homepage": "https://junfeng-long.github.io/;https://quanyili.github.io;https://github.com/xiaohu-art;https://gao-jiawei.com/;https://oceanpang.github.io/;https://github.com/Wongziseoi", "dblp": "343/2990;270/7691;;124/9335-4;231/7630;", "google_scholar": "olmfqBEAAAAJ;Ty49X3UAAAAJ;;NJxUNrcAAAAJ;https://scholar.google.com/citations?authuser=0;https://scholar.google.com/citations?hl=zh-CN", "orcid": "0000-0001-7047-4963;;;;0000-0002-6711-9319;", "linkedin": ";https://www.linkedin.com/mwlite/in/quanyi-li-2b7985183;;;;", "or_profile": "~Junfeng_Long1;~Quanyi_Li1;~Liu_Cao1;~Jiawei_Gao1;~Jiangmiao_Pang1;~ZiRui_Wang4", "aff": "Shanghai AI Laboratory;University of Edinburgh;Tsinghua University;Tsinghua University;Shanghai AI Laboratory ;Shanghai Artificial Intelligence Laboratory", "aff_domain": "pjlab.org.cn;ed.ac.uk;tsinghua.edu.cn;tsinghua.edu.cn;pjlab.org.cn;pjlab.org.cn", "position": "Researcher;MS student;Undergrad student;Undergrad student;Research Scientist;Intern", "bibtex": "@inproceedings{\nlong2024hybrid,\ntitle={Hybrid Internal Model: Learning Agile Legged Locomotion with Simulated Robot Response},\nauthor={Junfeng Long and ZiRui Wang and Quanyi Li and Liu Cao and Jiawei Gao and Jiangmiao Pang},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=93LoCyww8o}\n}", "github": "", "project": "", "reviewers": "9L23;FQfg;SBNA;Yqja", 
"pdf_size": 8357957, "rating": "5;6;6;8", "confidence": "5;3;4;4", "soundness": "1;3;3;3", "contribution": "2;3;2;3", "presentation": "1;2;2;3", "wc_summary": "56;67;93;35", "wc_strengths": "48;103;34;15", "wc_weaknesses": "284;67;140;54", "wc_questions": "78;81;11;101", "wc_review": "466;318;278;205", "wc_reply_reviewers": "30;0;12;10", "wc_reply_authors": "2790;353;1921;393", "reply_reviewers": "1;0;1;1", "reply_authors": "6;3;6;2", "rating_avg": [ 6.25, 1.0897247358851685 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.5, 0.8660254037844386 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.0, 0.7071067811865476 ], "wc_summary_avg": [ 62.75, 20.90902915010642 ], "wc_strengths_avg": [ 50.0, 32.76430985081175 ], "wc_weaknesses_avg": [ 136.25, 91.38483189238792 ], "wc_questions_avg": [ 67.75, 33.9365216249397 ], "wc_review_avg": [ 316.75, 95.21915511072339 ], "wc_reply_reviewers_avg": [ 13.0, 10.816653826391969 ], "wc_reply_authors_avg": [ 1364.25, 1037.8688199864182 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 4.25, 1.7853571071357126 ], "replies_avg": [ 28, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.3244428422615251, "gs_citation": 21, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=16640877501129933135&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=93LoCyww8o", "pdf": "https://openreview.net/pdf?id=93LoCyww8o", "email": "pjlab.org.cn;ed.ac.uk;tsinghua.edu.cn;tsinghua.edu.cn;pjlab.org.cn;pjlab.org.cn", "author_num": 6, "aff_unique_index": "0;1;2;2;0;3", "aff_unique_norm": "Shanghai AI Laboratory;University of Edinburgh;Tsinghua University;Shanghai Artificial Intelligence Laboratory", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.shanghai-ai-lab.com;https://www.ed.ac.uk;https://www.tsinghua.edu.cn;http://www.shailab.org/", "aff_unique_abbr": "SAIL;Edinburgh;THU;Shanghai AI Lab", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;0;0;0;0", "aff_country_unique": "China;United Kingdom" }, { "id": "94FKDbtTqO", "title": "Rethinking the bert-like pretraining for dna sequences", "track": "main", "status": "Reject", "tldr": "", "abstract": "With the success of large-scale pretraining in NLP, there is an increasing trend of applying it to the domain of life sciences. In particular, pretraining methods based on DNA sequences have garnered growing attention due to their potential to capture generic information about genes. However, existing pretraining methods for DNA sequences largely rely on direct adoptions of BERT pretraining from NLP, lacking a comprehensive understanding and a specifically tailored approach. To address this research gap, we first conducted a series of exploratory experiments and gained several insightful observations: 1) In the fine-tuning phase of downstream tasks, when using K-mer overlapping tokenization instead of K-mer non-overlapping tokenization, both overlapping and non-overlapping pretraining weights show consistent performance improvement.\n2) During the pre-training process, using K-mer overlapping tokenization quickly produces clear K-mer embeddings and reduces the loss to a very low level, while using K-mer non-overlapping tokenization results in less distinct embeddings and continuously decreases the loss. 
3) Using overlapping tokenization causes the self-attention in the intermediate layers of pre-trained models to tend to overly focus on certain tokens, reflecting that these layers are not adequately optimized. In summary, overlapping tokenization can benefit the fine-tuning of downstream tasks but leads to inadequate pretraining with fast convergence. To unleash the pretraining potential, we introduce a novel approach called RandomMask, which gradually increases the task difficulty of BERT-like pretraining by continuously expanding its mask boundary, forcing the model to learn more knowledge. RandomMask is simple but effective, achieving top-tier performance across 26 datasets spanning 7 downstream tasks. For example, RandomMask achieves a staggering 65.83\\% in Matthew's correlation coefficient for epigenetic mark prediction, which is a groundbreaking increase of 14.02\\% over the baseline and a remarkable 4.82\\% improvement over the SOTA results.", "keywords": "Pretrained;DNA;Large Language Model", "primary_area": "applications to physical sciences (physics, chemistry, biology, etc.)", "supplementary_material": "/attachment/4d7404012286f7bdac17ee876cdeec6b8ef75a04.pdf", "author": "chaoqi liang;Weiqiang Bai;Lifeng Qiao;Yuchen Ren;Jianle Sun;Peng Ye;Hongliang Yan;Xinzhu Ma;Wangmeng Zuo;Wanli Ouyang", "authorids": "~chaoqi_liang1;~Weiqiang_Bai1;~Lifeng_Qiao1;~Yuchen_Ren1;~Jianle_Sun1;~Peng_Ye4;~Hongliang_Yan1;~Xinzhu_Ma1;~Wangmeng_Zuo3;~Wanli_Ouyang1", "gender": "M;;M;;M;M;M;M;M;", "homepage": "https://github.com/ChaoqiLiang;;https://github.com/qiaoqiaoLF;;https://sjl-sjtu.github.io/;;;https://github.com/xinzhuma;;", "dblp": "320/0293;;55/10318;;307/2312;53/930-6;03/8409;191/3902;93/2671;", "google_scholar": "r1yke4EAAAAJ;;;;sRFyIxAAAAAJ;UEZZP5QAAAAJ;Obo7-bIAAAAJ;8PuKa_8AAAAJ;rUOpCEYAAAAJ;", "orcid": ";;;;0000-0002-0001-0992;0000-0002-8486-7562;;;0000-0002-3330-783X;", "linkedin": ";;;;;;;;;", "or_profile": "~chaoqi_liang1;~Weiqiang_Bai1;~Lifeng_Qiao1;~Yuchen_Ren1;~Jianle_Sun1;~Peng_Ye4;~Hongliang_Yan1;~Xinzhu_Ma1;~Wangmeng_Zuo3;~Wanli_Ouyang1", "aff": "Harbin Institute of Technology;;Shanghai Jiaotong University;;Shanghai Jiaotong University;Fudan University;Shanghai Artificial Intelligence Lab;The Chinese University of Hong Kong;Harbin Institute of Technology;", "aff_domain": "hit.edu.cn;;sjtu.edu.cn;;sjtu.edu.cn;fudan.edu.cn;pjlab.org.cn;cuhk.edu.hk;hit.edu.cn;", "position": "PhD student;;Undergrad student;;MS student;PhD student;Postdoc;Postdoc;Full Professor;", "bibtex": "@misc{\nliang2024rethinking,\ntitle={Rethinking the bert-like pretraining for dna sequences},\nauthor={chaoqi liang and Weiqiang Bai and Lifeng Qiao and Yuchen Ren and Jianle Sun and Peng Ye and Hongliang Yan and Xinzhu Ma and Wangmeng Zuo and Wanli Ouyang},\nyear={2024},\nurl={https://openreview.net/forum?id=94FKDbtTqO}\n}", "github": "", "project": "", "reviewers": "g7iT;kyqC;45WA;SHyo", "site": "https://openreview.net/forum?id=94FKDbtTqO", "pdf_size": 1883340, "rating": "3;6;6;6", "confidence": "3;3;3;4", "soundness": "3;2;4;2", "contribution": "3;2;3;3", "presentation": "2;2;3;3", "wc_summary": "300;59;97;178", "wc_strengths": "50;6;142;68", "wc_weaknesses": "382;137;166;30", "wc_questions": "3;3;57;56", "wc_review": "735;205;462;332", "wc_reply_reviewers": "128;0;18;0", "wc_reply_authors": "1697;920;1181;945", "reply_reviewers": "1;0;1;0", "reply_authors": "4;2;3;2", "rating_avg": [ 5.25, 1.299038105676658 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.82915619758885 ], 
"contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 158.5, 92.31061694084815 ], "wc_strengths_avg": [ 66.5, 49.07901792008475 ], "wc_weaknesses_avg": [ 178.75, 127.81113996831418 ], "wc_questions_avg": [ 29.75, 26.75233634656981 ], "wc_review_avg": [ 433.5, 196.3600010185374 ], "wc_reply_reviewers_avg": [ 36.5, 53.33619783974107 ], "wc_reply_authors_avg": [ 1185.75, 312.2429943169262 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 2.75, 0.82915619758885 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 10, 0 ], "corr_rating_confidence": 0.3333333333333333, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:awX9quWX0vYJ:scholar.google.com/&scioq=Rethinking+the+bert-like+pretraining+for+dna+sequences&hl=en&as_sdt=0,44", "gs_version_total": 0, "aff_unique_index": "0;1;1;2;3;4;0", "aff_unique_norm": "Harbin Institute of Technology;Shanghai Jiao Tong University;Fudan University;Shanghai Artificial Intelligence Lab;Chinese University of Hong Kong", "aff_unique_dep": ";;;;", "aff_unique_url": "http://www.hit.edu.cn/;https://www.sjtu.edu.cn;https://www.fudan.edu.cn;https://www.shailab.org;https://www.cuhk.edu.hk", "aff_unique_abbr": "HIT;SJTU;Fudan;Shanghai AI Lab;CUHK", "aff_campus_unique_index": "0;2;0", "aff_campus_unique": "Harbin;;Hong Kong SAR", "aff_country_unique_index": "0;0;0;0;0;0;0", "aff_country_unique": "China" }, { "id": "9528xxcT7h", "title": "Two Heads are Better than One: Towards Better Adversarial Robustness by Combining Transduction and Rejection", "track": "main", "status": "Reject", "tldr": "", "abstract": "Both transduction and rejection have emerged as important techniques for defending against adversarial perturbations. A recent work by Tram\u00e8r showed that, in the rejection-only case (no transduction), a strong rejection-solution can be turned into a strong (but computationally inefficient) non-rejection solution. This detector-to-classifier reduction has been mostly applied to give evidence that certain claims of strong selective-model solutions are susceptible, leaving the benefits of rejection unclear. On the other hand, a recent work by Goldwasser et al. showed that rejection combined with transduction can give provable guarantees (for certain problems) that cannot be achieved otherwise. Nevertheless, under recent strong adversarial attacks (GMSA, which has been shown to be much more effective than AutoAttack against transduction), Goldwasser et al.'s work was shown to have low performance in a practical deep-learning setting. In this paper, we take a step towards realizing the promise of transduction+rejection in more realistic scenarios. Theoretically, we show that a novel application of Tram\u00e8r's classifier-to-detector technique in the transductive setting can give significantly improved sample-complexity for robust generalization. While our theoretical construction is computationally inefficient, it guides us to identify an efficient transductive algorithm to learn a selective model. 
Extensive experiments using state of the art attacks (AutoAttack, GMSA) show that our solutions provide significantly better robust accuracy.", "keywords": "Adversarial robustness;Transductive machine learning;Rejection;Selective classification", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/756840c278f6b75cb543649e00bba7f20708cd4c.zip", "author": "Nils Palumbo;Yang Guo;Xi Wu;Jiefeng Chen;Yingyu Liang;Somesh Jha", "authorids": "~Nils_Palumbo1;~Yang_Guo4;~Xi_Wu1;~Jiefeng_Chen2;~Yingyu_Liang1;~Somesh_Jha1", "gender": ";M;M;M;;M", "homepage": ";;http://andrewxiwu.github.io/;https://jfc43.github.io/;;", "dblp": "258/3557;;37/4465-1;199/3381;;j/SomeshJha", "google_scholar": "vXBD3Q8AAAAJ;BbQQEPcAAAAJ;OmmxazMAAAAJ;5mOfQfAAAAAJ;;BaI7l8QAAAAJ", "orcid": ";;;;;", "linkedin": ";;;jiefeng-chen-aa1769122/;;", "or_profile": "~Nils_Palumbo1;~Yang_Guo4;~Xi_Wu1;~Jiefeng_Chen2;~Yingyu_Liang1;~Somesh_Jha1", "aff": "University of Wisconsin - Madison;;Google;Amazon;;Department of Computer Science, University of Wisconsin, Madison", "aff_domain": "wisc.edu;;google.com;amazon.com;;cs.wisc.edu", "position": "PhD student;;Software Engineer;Applied Scientist;;Full Professor", "bibtex": "@misc{\npalumbo2024two,\ntitle={Two Heads are Better than One: Towards Better Adversarial Robustness by Combining Transduction and Rejection},\nauthor={Nils Palumbo and Yang Guo and Xi Wu and Jiefeng Chen and Yingyu Liang and Somesh Jha},\nyear={2024},\nurl={https://openreview.net/forum?id=9528xxcT7h}\n}", "github": "", "project": "", "reviewers": "xAQ7;XrZg;qXLN;kR75", "site": "https://openreview.net/forum?id=9528xxcT7h", "pdf_size": 2247755, "rating": "6;6;6;8", "confidence": "3;4;3;4", "soundness": "3;3;3;3", "contribution": "3;3;2;3", "presentation": "3;3;3;3", "wc_summary": "94;224;95;75", "wc_strengths": "113;55;48;57", "wc_weaknesses": "255;201;119;148", "wc_questions": "71;5;24;5", "wc_review": "533;485;286;285", "wc_reply_reviewers": "0;0;0;12", "wc_reply_authors": "575;360;473;444", "reply_reviewers": "0;0;0;1", "reply_authors": "1;1;1;2", "rating_avg": [ 6.5, 0.8660254037844386 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 122.0, 59.42642509860407 ], "wc_strengths_avg": [ 68.25, 26.05163142684158 ], "wc_weaknesses_avg": [ 180.75, 51.982569193913456 ], "wc_questions_avg": [ 26.25, 26.975683494584526 ], "wc_review_avg": [ 397.25, 113.0317986232193 ], "wc_reply_reviewers_avg": [ 3.0, 5.196152422706632 ], "wc_reply_authors_avg": [ 463.0, 76.834237160266 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.5773502691896257, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:Tq19TOg1zpQJ:scholar.google.com/&scioq=Two+Heads+are+Better+than+One:+Towards+Better+Adversarial+Robustness+by+Combining+Transduction+and+Rejection&hl=en&as_sdt=0,21", "gs_version_total": 3, "aff_unique_index": "0;1;2;0", "aff_unique_norm": "University of Wisconsin-Madison;Google;Amazon", "aff_unique_dep": ";Google;Amazon.com, Inc.", "aff_unique_url": "https://www.wisc.edu;https://www.google.com;https://www.amazon.com", "aff_unique_abbr": "UW-Madison;Google;Amazon", "aff_campus_unique_index": "0;1;0", "aff_campus_unique": "Madison;Mountain View;", "aff_country_unique_index": "0;0;0;0", 
"aff_country_unique": "United States" }, { "id": "95ObXevgHx", "title": "The Temporal Structure of Language Processing in the Human Brain Corresponds to The Layered Hierarchy of Deep Language Models", "track": "main", "status": "Reject", "tldr": "", "abstract": "Deep Language Models (DLMs) provide a novel computational paradigm for understanding the mechanisms of natural language processing in the human brain. Unlike traditional psycholinguistic models, DLMs use layered sequences of continuous numerical vectors to represent words and context, allowing a plethora of emerging applications such as human-like text generation. \nIn this paper we show evidence that the layered hierarchy of DLMs may be used to model the temporal dynamics of language comprehension in the brain by demonstrating a strong correlation between DLM layer depth and \nthe time at which layers are most predictive of the human brain.\nOur ability to temporally resolve individual layers benefits from our use of electrocorticography (ECoG) data, which has a much higher temporal resolution than noninvasive methods like fMRI. Using ECoG, we record neural activity from participants listening to a 30-minute narrative while also feeding the same narrative to a high-performing DLM (GPT2-XL). We then extract contextual embeddings from the different layers of the DLM and use linear encoding models to predict neural activity. We first focus on the Inferior Frontal Gyrus (IFG, or Broca's area) and then extend our model to track the increasing temporal receptive window along the linguistic processing hierarchy from auditory to syntactic and semantic areas. \nOur results reveal a connection between human language processing and DLMs, with the DLM's layer-by-layer accumulation of contextual information mirroring the timing of neural activity in high-order language areas.", "keywords": "natural language processing;NLP;neuroscience;cognitive science;deep language models;GPT2", "primary_area": "applications to neuroscience & cognitive science", "supplementary_material": "/attachment/a0c98662662e4a5c55ff3d4366101e06c2b94617.zip", "author": "Ariel Goldstein;Eric Ham;Mariano Schain;Samuel Nastase;Zaid Zada;Avigail Dabush;Bobbi Aubrey;Harshvardhan Gazula;Amir Feder;Werner K Doyle;Sasha Devore;Patricia Dugan;Daniel Friedman;Roi Reichart;Michael Brenner;Avinatan Hassidim;Orrin Devinsky;Adeen Flinker;Omer Levy;Uri Hasson", "authorids": "~Ariel_Goldstein1;~Eric_Ham1;~Mariano_Schain1;~Samuel_Nastase1;~Zaid_Zada1;~Avigail_Dabush1;~Bobbi_Aubrey1;~Harshvardhan_Gazula1;~Amir_Feder1;~Werner_K_Doyle1;~Sasha_Devore1;~Patricia_Dugan1;~Daniel_Friedman2;~Roi_Reichart1;~Michael_Brenner1;~Avinatan_Hassidim3;~Orrin_Devinsky1;~Adeen_Flinker1;~Omer_Levy1;~Uri_Hasson1", "gender": "M;M;;M;M;;;;;M;;F;M;M;;;M;M;M;M", "homepage": "https://www.deepcognitionlab.com/;;;https://snastase.github.io/;https://zaidzada.com;https://www.linkedin.com/in/avigail-dabush-grinstein-546a15226/;;;https://www.amirfeder.com/;http://neuroviewtech.com;https://med.nyu.edu/faculty/sasha-devore;https://nyulangone.org/doctors/1467789107/patricia-c-dugan;;https://roireichart.com/;https://brennergroup.seas.harvard.edu;;;https://flinkerlab.org;;https://hassonlab.princeton.edu/", "dblp": ";;;165/6494;;;;;214/3604;;;;73/1093;96/5429;;;;;117/4866;", "google_scholar": "p8hQgVuVOTgC;Ts4PsekAAAAJ;;tjLH8mQAAAAJ;RC_hwc0AAAAJ;;pryO0XYAAAAJ;;ERwoPLIAAAAJ;;;;CMIm2eUAAAAJ;https://scholar.google.co.il/citations?user=xXJIsh4AAAAJ;;;25Q74uMAAAAJ;Us1mDooAAAAJ;PZVd2h8AAAAJ;VRw8v4kAAAAJ", "orcid": 
";0009-0004-1453-7180;;0000-0001-7013-5275;0000-0002-3096-0059;;;;0000-0001-5472-1135;;;0000-0001-6199-1870;0000-0003-1068-1797;;;;;0000-0003-1247-1283;0000-0001-7300-8191;", "linkedin": ";eric-ham-1b10ab12a/;;;zzada/;;;;amir-feder-b65b7035/;;;;;roi-reichart-ba2a8a7/;;;;;;", "or_profile": "~Ariel_Goldstein1;~Eric_Ham1;~Mariano_Schain1;~Samuel_Nastase1;~Zaid_Zada1;~Avigail_Dabush1;~Bobbi_Aubrey1;~Harshvardhan_Gazula1;~Amir_Feder1;~Werner_K_Doyle1;~Sasha_Devore1;~Patricia_Dugan1;~Daniel_Friedman2;~Roi_Reichart1;~Michael_Brenner1;~Avinatan_Hassidim3;~Orrin_Devinsky1;~Adeen_Flinker1;~Omer_Levy1;~Uri_Hasson1", "aff": "Hebrew University of Jerusalem;Gladstone Institutes;;Princeton University;Princeton University;;Princeton University;;Google;New York University;NYU Langone;NYU Grossman School of Medicine;NYU Langone;Technion, Israel Institute of Technology;Harvard University;;;New York University;Tel Aviv University;", "aff_domain": "huji.ac.il;gladstone.ucsf.edu;;princeton.edu;princeton.edu;;princeton.edu;;google.com;nyu.edu;nyumc.org;nyulangone.org;nyumc.org;technion.ac.il;fas.harvard.edu;;;nyu.edu;tau.ac.il;", "position": "Assistant Professor;Researcher;;Postdoc;PhD student;;Researcher;;Researcher;Associate Professor;Associate Professor;Associate Professor;Full Professor;Associate Professor;Professor;;;Assistant Professor;Senior Lecturer;", "bibtex": "@misc{\ngoldstein2024the,\ntitle={The Temporal Structure of Language Processing in the Human Brain Corresponds to The Layered Hierarchy of Deep Language Models},\nauthor={Ariel Goldstein and Eric Ham and Mariano Schain and Samuel Nastase and Zaid Zada and Avigail Dabush and Bobbi Aubrey and Harshvardhan Gazula and Amir Feder and Werner K Doyle and Sasha Devore and Patricia Dugan and Daniel Friedman and Roi Reichart and Michael Brenner and Avinatan Hassidim and Orrin Devinsky and Adeen Flinker and Omer Levy and Uri Hasson},\nyear={2024},\nurl={https://openreview.net/forum?id=95ObXevgHx}\n}", "github": "", "project": "", "reviewers": "MbTk;4Wkk;r5Ne;4TH4;rNmu", "site": "https://openreview.net/forum?id=95ObXevgHx", "pdf_size": 18254906, "rating": "3;6;6;8;8", "confidence": "4;3;5;4;4", "soundness": "2;3;3;4;3", "contribution": "2;3;3;3;3", "presentation": "2;3;3;4;4", "wc_summary": "157;79;165;259;94", "wc_strengths": "25;85;189;99;77", "wc_weaknesses": "137;125;165;129;30", "wc_questions": "119;65;103;417;9", "wc_review": "438;354;622;904;210", "wc_reply_reviewers": "260;19;0;0;0", "wc_reply_authors": "1951;1079;1119;1514;739", "reply_reviewers": "1;1;0;0;0", "reply_authors": "4;3;2;2;2", "rating_avg": [ 6.2, 1.8330302779823362 ], "confidence_avg": [ 4.0, 0.6324555320336759 ], "soundness_avg": [ 3.0, 0.6324555320336759 ], "contribution_avg": [ 2.8, 0.39999999999999997 ], "presentation_avg": [ 3.2, 0.7483314773547882 ], "wc_summary_avg": [ 150.8, 63.76331233554292 ], "wc_strengths_avg": [ 95.0, 53.246596135339956 ], "wc_weaknesses_avg": [ 117.2, 45.783839943805496 ], "wc_questions_avg": [ 142.6, 142.33144417169382 ], "wc_review_avg": [ 505.6, 239.66777004845684 ], "wc_reply_reviewers_avg": [ 55.8, 102.36483771295687 ], "wc_reply_authors_avg": [ 1280.4, 415.69200136639625 ], "reply_reviewers_avg": [ 0.4, 0.48989794855663565 ], "reply_authors_avg": [ 2.6, 0.8 ], "replies_avg": [ 22, 0 ], "authors#_avg": [ 20, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 6, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12394723397824789272&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "aff_unique_index": "0;1;2;2;2;3;4;5;6;5;7;8;4;9", 
"aff_unique_norm": "Hebrew University of Jerusalem;Gladstone Institutes;Princeton University;Google;New York University;NYU Langone Health;New York University Grossman School of Medicine;Israel Institute of Technology;Harvard University;Tel Aviv University", "aff_unique_dep": ";;;Google;;;School of Medicine;;;", "aff_unique_url": "https://www.huji.ac.il;https://www.gladstone.org;https://www.princeton.edu;https://www.google.com;https://www.nyu.edu;https://nyulangone.org;https://med.nyu.edu;https://www.technion.ac.il/en/;https://www.harvard.edu;https://www.tau.ac.il", "aff_unique_abbr": "HUJI;;Princeton;Google;NYU;NYU Langone;NYU Grossman SOM;Technion;Harvard;TAU", "aff_campus_unique_index": "0;2;3", "aff_campus_unique": "Jerusalem;;Mountain View;New York", "aff_country_unique_index": "0;1;1;1;1;1;1;1;1;1;0;1;1;0", "aff_country_unique": "Israel;United States" }, { "id": "95joD3Yc5t", "title": "Generative Semantic Communication: Diffusion Models Beyond Bit Recovery", "track": "main", "status": "Reject", "tldr": "", "abstract": "Semantic communication is expected to be one of the cores of next-generation AI-based communications. One of the possibilities offered by semantic communication is the capability to regenerate, at the destination side, images or videos semantically equivalent to the transmitted ones, without necessarily recovering the transmitted sequence of bits. The current solutions still lack the ability to build complex scenes from the received partial information. Clearly, there is an unmet need to balance the effectiveness of generation methods and the complexity of the transmitted information, possibly taking into account the goal of communication. In this paper, we aim to bridge this gap by proposing a novel generative diffusion-guided framework for semantic communication that leverages the strong abilities of diffusion models in synthesizing multimedia content while preserving semantic features. Concurrently, we propose a novel strategy to make diffusion models resilient to corrupted conditioning data, avoiding that heavily noise-affected conditioning may mislead the generation process. We reduce bandwidth usage by sending highly-compressed semantic information only. Then, the diffusion model learns to synthesize semantic-consistent scenes from such semantic information.\nWe prove, through an in-depth assessment of multiple scenarios, that our method outperforms existing solutions in generating high-quality images with preserved semantic information even in cases where the received conditioning content is significantly degraded. 
More specifically, our results show that objects, locations, and depths are still recognizable even in the presence of extremely noisy conditions of the communication channel.", "keywords": "Semantic image synthesis;Diffusion models;Deep generative models;Semantic communication", "primary_area": "generative models", "supplementary_material": "/attachment/b8cdcaeebef29d66f185b12dc0c713cd06e7dbc1.zip", "author": "Eleonora Grassucci;Sergio Barbarossa;Danilo Comminiello", "authorids": "~Eleonora_Grassucci1;~Sergio_Barbarossa1;~Danilo_Comminiello1", "gender": "F;;M", "homepage": "https://sites.google.com/uniroma1.it/eleonoragrassucci/home-page;https://sites.google.com/a/uniroma1.it/sergiobarbarossa/;https://danilocomminiello.site.uniroma1.it/", "dblp": "275/6348;66/426;33/9433", "google_scholar": "https://scholar.google.it/citations?user=Jcv0TgQAAAAJ;https://scholar.google.it/citations?hl=it;https://scholar.google.it/citations?user=H3Y52cMAAAAJ", "orcid": "0000-0003-4626-4506;;0000-0003-4067-4504", "linkedin": ";;danilocomminiello/", "or_profile": "~Eleonora_Grassucci1;~Sergio_Barbarossa1;~Danilo_Comminiello1", "aff": "Sapienza University of Rome;University of Roma \"La Sapienza\";Sapienza University of Rome", "aff_domain": "uniroma1.it;uniroma1.it;uniroma1.it", "position": "Assistant Professor;Full Professor;Associate Professor", "bibtex": "@misc{\ngrassucci2024generative,\ntitle={Generative Semantic Communication: Diffusion Models Beyond Bit Recovery},\nauthor={Eleonora Grassucci and Sergio Barbarossa and Danilo Comminiello},\nyear={2024},\nurl={https://openreview.net/forum?id=95joD3Yc5t}\n}", "github": "", "project": "", "reviewers": "ckTn;4cUJ;q6SF;M1DV", "site": "https://openreview.net/forum?id=95joD3Yc5t", "pdf_size": 26810978, "rating": "3;5;5;6", "confidence": "2;3;4;3", "soundness": "2;3;2;3", "contribution": "2;2;3;3", "presentation": "3;2;3;3", "wc_summary": "82;65;48;101", "wc_strengths": "38;40;62;86", "wc_weaknesses": "146;179;164;136", "wc_questions": "34;2;23;63", "wc_review": "300;286;297;386", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "924;823;925;1348", "reply_reviewers": "0;0;0;0", "reply_authors": "4;3;4;4", "rating_avg": [ 4.75, 1.0897247358851685 ], "confidence_avg": [ 3.0, 0.7071067811865476 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 74.0, 19.685019685029527 ], "wc_strengths_avg": [ 56.5, 19.461500456028563 ], "wc_weaknesses_avg": [ 156.25, 16.528384676065595 ], "wc_questions_avg": [ 30.5, 22.005681084665387 ], "wc_review_avg": [ 317.25, 40.03357965508455 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 1005.0, 202.32029062849827 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 3.75, 0.4330127018922193 ], "replies_avg": [ 23, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.6488856845230502, "gs_citation": 66, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6442150188972160068&as_sdt=80005&sciodt=0,11&hl=en", "gs_version_total": 3, "aff_unique_index": "0;1;0", "aff_unique_norm": "Sapienza University of Rome;University of Rome La Sapienza", "aff_unique_dep": ";", "aff_unique_url": "https://www.uniroma1.it;https://www.uniroma1.it", "aff_unique_abbr": "Sapienza;La Sapienza", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Rome", "aff_country_unique_index": "0;0;0", "aff_country_unique": "Italy" }, { "id": "96UB3vQpAA", "title": "Fast Learning in Balanced Deep Spiking Neural Networks with Strong and Weak 
Synapses", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "The intricate neural dynamics of the cerebral cortex are often characterized in terms of the delicate balance between excitation and inhibition (E-I balance). While numerous studies have delved into its functional implications, one fundamental issue has remained unresolved -- namely, _the unstructured, random connections posed by E-I balance dynamics versus the necessity for structured neural connections to fulfill specific computational tasks_. This raises the crucial question: How can neural circuits reconcile these seemingly contradictory demands? Drawing inspirations from recent data in neuroscience, we propose a biologically grounded spiking neural network. This network incorporates two distinct sets of synaptic connections, one featuring strong synapses dedicated to maintaining the balance condition, and the other comprising weak synapses utilized for neural computation. Crucially, only the weak synapses undergo training, while the strong synapses remain fixed. Interestingly, we have discovered that this architecture not only resolves the structural conflicts, but also offers several compelling computational advantages. Firstly, the E-I balance dynamics mediated by strong synapses can closely mimic the function of normalization operations, effectively alleviating the internal covariate shift problem. Secondly, we have observed that weak synapses remain weak during training without any imposed constraints, thus preserving the balance condition established by the strong synapses. Lastly, the coexistence of strong and weak synapses allows for a seamless transition from the \"lazy\" learning regime, characterized by the primary training of readout weights, to the \"rich\" learning regime, marked by alterations in neural representations. 
We believe this study can shed light on how structured computations can coexist with unstructured E-I balance dynamics and offer novel perspectives on the computational advantages of E-I balance.", "keywords": "excitation-inhibition balance;spiking neural networks;brain-inspired;neuroscience", "primary_area": "applications to neuroscience & cognitive science", "supplementary_material": "", "author": "Xiaohan Lin;Chaoming Wang;Boxin Shi;Si Wu", "authorids": "~Xiaohan_Lin1;~Chaoming_Wang1;~Boxin_Shi3;~Si_Wu1", "gender": ";M;M;M", "homepage": ";https://brainpy.tech/;http://camera.pku.edu.cn;https://mgv.pku.edu.cn/english/people/lbd/soeeace/267528.htm", "dblp": ";;69/783;25/437-1", "google_scholar": ";;K1LjZxcAAAAJ;", "orcid": ";;0000-0001-6749-0364;", "linkedin": ";;;", "or_profile": "~Xiaohan_Lin1;~Chaoming_Wang1;~Boxin_Shi3;~Si_Wu1", "aff": ";;Peking University;Peking University", "aff_domain": ";;pku.edu.cn;pku.edu.cn", "position": ";;Assistant Professor;Full Professor", "bibtex": "@misc{\nlin2024fast,\ntitle={Fast Learning in Balanced Deep Spiking Neural Networks with Strong and Weak Synapses},\nauthor={Xiaohan Lin and Chaoming Wang and Boxin Shi and Si Wu},\nyear={2024},\nurl={https://openreview.net/forum?id=96UB3vQpAA}\n}", "github": "", "project": "", "reviewers": "W5kj;VbNy;aXEa;yPXB", "site": "https://openreview.net/forum?id=96UB3vQpAA", "pdf_size": 703402, "rating": "1;3;6;8", "confidence": "5;4;4;4", "soundness": "2;1;3;4", "contribution": "1;2;4;3", "presentation": "2;1;3;4", "wc_summary": "110;116;37;67", "wc_strengths": "36;23;45;89", "wc_weaknesses": "140;513;198;55", "wc_questions": "1;2;151;218", "wc_review": "287;654;431;429", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.5, 2.692582403567252 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 2.5, 1.118033988749895 ], "contribution_avg": [ 2.5, 1.118033988749895 ], "presentation_avg": [ 2.5, 1.118033988749895 ], "wc_summary_avg": [ 82.5, 32.361242250568814 ], "wc_strengths_avg": [ 48.25, 24.79289212657531 ], "wc_weaknesses_avg": [ 226.5, 173.05273762642415 ], "wc_questions_avg": [ 93.0, 94.5171942029597 ], "wc_review_avg": [ 450.25, 131.32664428820223 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.7504787743864564, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:oRMmFyWEFDMJ:scholar.google.com/&scioq=Fast+Learning+in+Balanced+Deep+Spiking+Neural+Networks+with+Strong+and+Weak+Synapses&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "Peking University", "aff_unique_dep": "", "aff_unique_url": "http://www.pku.edu.cn", "aff_unique_abbr": "Peking U", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "China" }, { "id": "96nX9xIIx2", "title": "Visual Prompting Upgrades Neural Network Sparsification: A Data-Model Perspective", "track": "main", "status": "Reject", "tldr": "", "abstract": "The rapid development of large-scale deep learning models questions the affordability of hardware platforms, which necessitates the pruning to reduce their computational and memory footprints. 
Sparse neural networks, as the product, have demonstrated numerous favorable benefits like low complexity, undamaged generalization, $\\textit{etc}$. Most of the prominent pruning strategies are invented from a $\\textit{model-centric}$ perspective, focusing on searching and preserving crucial weights by analyzing network topologies. However, the role of data and its interplay with model-centric pruning has remained relatively unexplored. In this research, we introduce a novel $\\textit{data-model co-design}$ perspective: to promote superior weight sparsity by learning important model topology and adequate input data in a synergetic manner. Specifically, customized $\\textbf{V}$isual $\\textbf{P}$rompts are mounted to upgrade neural $\\textbf{N}$etwork $\\textbf{s}$parsification in our proposed $\\textbf{\\texttt{VPNs}}$ framework. As a pioneering effort, this paper conducts systematic investigations about the impact of different visual prompts on model pruning and suggests an effective joint optimization approach. Extensive experiments with $3$ network architectures and $8$ datasets evidence the substantial performance improvements from $\\textbf{\\texttt{VPNs}}$ over existing state-of-the-art pruning algorithms. Furthermore, we find that subnetworks discovered by $\\textbf{\\texttt{VPNs}}$ from pre-trained models enjoy better transferability across diverse downstream scenarios. These insights shed light on new promising possibilities of data-model co-designs for vision model sparsification. Codes are in the supplement.", "keywords": "neural network sparsification;visual prompt", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/7b2339ecfd6931cea6805aafbe426323e33c3767.zip", "author": "Can Jin;Tianjin Huang;Yihua Zhang;Mykola Pechenizkiy;Sijia Liu;Shiwei Liu;Tianlong Chen", "authorids": "~Can_Jin1;~Tianjin_Huang1;~Yihua_Zhang1;~Mykola_Pechenizkiy1;~Sijia_Liu1;~Shiwei_Liu2;~Tianlong_Chen1", "gender": "M;M;M;M;M;M;M", "homepage": "https://jincan333.github.io/;https://research.tue.nl/nl/persons/tianjin-huang;https://yihua-zhang.com;http://www.win.tue.nl/~mpechen/;https://lsjxjtu.github.io/;https://shiweiliuiiiiiii.github.io/;https://tianlong-chen.github.io", "dblp": ";189/3972;;37/4649;128/6972-1;234/8697-3.html;", "google_scholar": "RK-8dz0AAAAJ;https://scholar.google.co.uk/citations?user=yFLmPsoAAAAJ;https://scholar.google.com/citations?hl=zh-CN;https://scholar.google.com.tw/citations?user=F0uFT_kAAAAJ;C7dO_UgAAAAJ;73IbXtsAAAAJ;LE3ctn0AAAAJ", "orcid": "0009-0007-3407-1658;;;0000-0003-4955-0743;;;0000-0001-7774-8197", "linkedin": ";;zhangyihua/;mpechen/;;;tianlong-chen-783862167/", "or_profile": "~Can_Jin1;~Tianjin_Huang1;~Yihua_Zhang1;~Mykola_Pechenizkiy1;~Sijia_Liu1;~Shiwei_Liu2;~Tianlong_Chen1", "aff": "Rutgers University;University of Exeter;Michigan State University;Eindhoven University of Technology;Michigan State University;University of Oxford;Harvard University", "aff_domain": "rutgers.edu;exeter.ac.uk;msu.edu;tue.nl;msu.edu;ox.ac.uk;harvard.edu", "position": "PhD student;Lecturer;PhD student;Full Professor;Assistant Professor;Postdoc;Postdoc", "bibtex": "@misc{\njin2024visual,\ntitle={Visual Prompting Upgrades Neural Network Sparsification: A Data-Model Perspective},\nauthor={Can Jin and Tianjin Huang and Yihua Zhang and Mykola Pechenizkiy and Sijia Liu and Shiwei Liu and Tianlong Chen},\nyear={2024},\nurl={https://openreview.net/forum?id=96nX9xIIx2}\n}", "github": "", "project": "", "reviewers": "eRqj;hiB3;sGzb;8b5d",
"site": "https://openreview.net/forum?id=96nX9xIIx2", "pdf_size": 4569192, "rating": "3;5;5;5", "confidence": "5;4;4;4", "soundness": "3;3;3;3", "contribution": "2;2;3;3", "presentation": "4;3;3;4", "wc_summary": "39;43;92;104", "wc_strengths": "24;40;40;83", "wc_weaknesses": "115;273;56;137", "wc_questions": "2;55;8;153", "wc_review": "180;411;196;477", "wc_reply_reviewers": "361;196;0;11", "wc_reply_authors": "2971;1947;1204;995", "reply_reviewers": "5;1;0;1", "reply_authors": "7;5;4;4", "rating_avg": [ 4.5, 0.8660254037844386 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.5, 0.5 ], "wc_summary_avg": [ 69.5, 28.848743473503312 ], "wc_strengths_avg": [ 46.75, 21.924586655168667 ], "wc_weaknesses_avg": [ 145.25, 79.48073665989766 ], "wc_questions_avg": [ 54.5, 60.45866356445534 ], "wc_review_avg": [ 316.0, 130.23248442688944 ], "wc_reply_reviewers_avg": [ 142.0, 148.49410762720518 ], "wc_reply_authors_avg": [ 1779.25, 773.6873964980947 ], "reply_reviewers_avg": [ 1.75, 1.920286436967152 ], "reply_authors_avg": [ 5.0, 1.224744871391589 ], "replies_avg": [ 34, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -1.0, "gs_citation": 29, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=654969446584179655&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 3, "aff_unique_index": "0;1;2;3;2;4;5", "aff_unique_norm": "Rutgers University;University of Exeter;Michigan State University;Eindhoven University of Technology;University of Oxford;Harvard University", "aff_unique_dep": ";;;;;", "aff_unique_url": "https://www.rutgers.edu;https://www.exeter.ac.uk;https://www.msu.edu;https://www.tue.nl;https://www.ox.ac.uk;https://www.harvard.edu", "aff_unique_abbr": "Rutgers;Exeter;MSU;TU/e;Oxford;Harvard", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;0;2;0;1;0", "aff_country_unique": "United States;United Kingdom;Netherlands" }, { "title": "Alt-Text with Context: Improving Accessibility for Images on Twitter", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19305", "id": "97Dl82avFs", "author_site": "Nikita Srivatsan, Sofia Samaniego, Omar Florez, Taylor Berg-Kirkpatrick", "tldr": "", "abstract": "In this work we present an approach for generating alternative text (or alt-text) descriptions for images shared on social media, specifically Twitter. More than just a special case of image captioning, alt-text is both more literally descriptive and context-specific. Also critically, images posted to Twitter are often accompanied by user-written text that despite not necessarily describing the image may provide useful context that if properly leveraged can be informative. We address this task with a multimodal model that conditions on both textual information from the associated social media post as well as visual signal from the image, and demonstrate that the utility of these two information sources stacks. We put forward a new dataset of 371k images paired with alt-text and tweets scraped from Twitter and evaluate on it across a variety of automated metrics as well as human evaluation. 
We show that our approach of conditioning on both tweet text and visual information significantly outperforms prior work, by more than 2x on BLEU@4.", "keywords": "alt-text;social media;twitter;clip;computer vision;image captioning;accessibility", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Nikita Srivatsan;Sofia Samaniego;Omar Florez;Taylor Berg-Kirkpatrick", "authorids": "~Nikita_Srivatsan1;~Sofia_Samaniego1;~Omar_Florez1;~Taylor_Berg-Kirkpatrick1", "gender": "F;F;M;M", "homepage": "https://www.cs.cmu.edu/~asrivats;;https://www.linkedin.com/in/omar-u-florez-35338015/;https://cseweb.ucsd.edu/~tberg/", "dblp": "227/3475.html;;;22/8160", "google_scholar": "Zbihne0AAAAJ;;;mN6_BKAAAAAJ", "orcid": ";;;", "linkedin": ";sofia-samaniego;omar-u-florez-35338015/;", "or_profile": "~Nikita_Srivatsan1;~Sofia_Samaniego1;~Omar_Florez1;~Taylor_Berg-Kirkpatrick1", "aff": "Carnegie Mellon University;Twitter;Twitter;University of California, San Diego", "aff_domain": "cmu.edu;twitter.com;twitter.com;ucsd.edu", "position": "PhD student;Researcher;Researcher;Associate Professor", "bibtex": "@inproceedings{\nsrivatsan2024alttext,\ntitle={Alt-Text with Context: Improving Accessibility for Images on Twitter},\nauthor={Nikita Srivatsan and Sofia Samaniego and Omar Florez and Taylor Berg-Kirkpatrick},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=97Dl82avFs}\n}", "github": "", "project": "", "reviewers": "2NmJ;1eBv;xHBk", "pdf_size": 2532532, "rating": "5;6;8", "confidence": "4;3;3", "soundness": "2;2;3", "contribution": "2;2;3", "presentation": "2;3;3", "wc_summary": "68;114;89", "wc_strengths": "186;164;24", "wc_weaknesses": "650;119;54", "wc_questions": "80;68;32", "wc_review": "984;465;199", "wc_reply_reviewers": "124;31;0", "wc_reply_authors": "821;362;403", "reply_reviewers": "1;1;0", "reply_authors": "1;1;1", "rating_avg": [ 6.333333333333333, 1.247219128924647 ], "confidence_avg": [ 3.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 90.33333333333333, 18.80307303489394 ], "wc_strengths_avg": [ 124.66666666666667, 71.74646719912803 ], "wc_weaknesses_avg": [ 274.3333333333333, 266.958590213705 ], "wc_questions_avg": [ 60.0, 20.396078054371138 ], "wc_review_avg": [ 549.3333333333334, 325.97580005611184 ], "wc_reply_reviewers_avg": [ 51.666666666666664, 52.689868307125444 ], "wc_reply_authors_avg": [ 528.6666666666666, 207.38745274378476 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 10, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.7559289460184545, "gs_citation": 5, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=4912397428830109366&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=97Dl82avFs", "pdf": "https://openreview.net/pdf?id=97Dl82avFs", "email": "cmu.edu;twitter.com;twitter.com;ucsd.edu", "author_num": 4, "aff_unique_index": "0;1;1;2", "aff_unique_norm": "Carnegie Mellon University;Twitter, Inc.;University of California, San Diego", "aff_unique_dep": ";;", "aff_unique_url": "https://www.cmu.edu;https://twitter.com;https://www.ucsd.edu", "aff_unique_abbr": 
"CMU;Twitter;UCSD", "aff_campus_unique_index": "1", "aff_campus_unique": ";San Diego", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "id": "98g9NdJPxm", "title": "Theoretically Understanding Data Reconstruction Leakage in Federated Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "Federated learning is an emerging collaborative learning paradigm that aims to protect data privacy. Unfortunately, recent works show that federated learning algorithms are vulnerable to data reconstruction attacks, and a series of follow-up works are proposed to enhance the attack effectiveness. However, existing works lack of a theoretical understanding on to what extent the devices' data can be reconstructed and the effectiveness of these attacks cannot be compared theoretically. To address it, we propose a theoretical framework to understand data reconstruction attacks to FL. Our framework involves bounding the data reconstruction error and an attack's error bound reflects its inherent attack effectiveness. Under the framework, we can theoretically compare the effectiveness of existing attacks. For instance, our experimental results on multiple datasets validate that the iDLG data reconstruction attack inherently outperforms the DLG attack.", "keywords": "Privacy leakage;model reconstruction attacks;federated learning", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "Zifan Wang;Binghui Zhang;Meng Pang;Yuan Hong;Binghui Wang", "authorids": "~Zifan_Wang5;~Binghui_Zhang1;~Meng_Pang1;~Yuan_Hong1;~Binghui_Wang2", "gender": "M;M;M;M;M", "homepage": ";;;https://yhongcs.github.io/;https://wangbinghui.net", "dblp": ";;172/9447.html;79/5433-1;123/7149", "google_scholar": ";;;KJuZW2wAAAAJ;SoOztcEAAAAJ", "orcid": ";;;;0000-0001-5616-060X", "linkedin": "zifan-wang-2bb067173;binghui-zhang-68b20a108;;;", "or_profile": "~Zifan_Wang5;~Binghui_Zhang1;~Meng_Pang1;~Yuan_Hong1;~Binghui_Wang2", "aff": "University of Georgia;Illinois Institute of Technology;Nanchang University;University of Connecticut;Illinois Institute of Technology", "aff_domain": "uga.edu;iit.edu;ncu.edu.cn;uconn.edu;iit.edu", "position": "PhD student;PhD student;Associate Professor;Associate Professor;Assistant Professor", "bibtex": "@misc{\nwang2024theoretically,\ntitle={Theoretically Understanding Data Reconstruction Leakage in Federated Learning},\nauthor={Zifan Wang and Binghui Zhang and Meng Pang and Yuan Hong and Binghui Wang},\nyear={2024},\nurl={https://openreview.net/forum?id=98g9NdJPxm}\n}", "github": "", "project": "", "reviewers": "kviX;sB6V;3bse", "site": "https://openreview.net/forum?id=98g9NdJPxm", "pdf_size": 1840938, "rating": "3;5;5", "confidence": "4;5;4", "soundness": "2;2;2", "contribution": "1;3;3", "presentation": "3;3;3", "wc_summary": "48;134;72", "wc_strengths": "47;48;33", "wc_weaknesses": "161;1346;105", "wc_questions": "5;483;4", "wc_review": "261;2011;214", "wc_reply_reviewers": "33;1370;0", "wc_reply_authors": "362;2383;182", "reply_reviewers": "1;2;0", "reply_authors": "1;4;1", "rating_avg": [ 4.333333333333333, 0.9428090415820634 ], "confidence_avg": [ 4.333333333333333, 0.4714045207910317 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 2.3333333333333335, 0.9428090415820634 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 84.66666666666667, 36.23380864453651 ], "wc_strengths_avg": [ 42.666666666666664, 6.847546194724712 ], "wc_weaknesses_avg": [ 537.3333333333334, 572.2705265480265 
], "wc_questions_avg": [ 164.0, 225.56743263748572 ], "wc_review_avg": [ 828.6666666666666, 836.2560745502674 ], "wc_reply_reviewers_avg": [ 467.6666666666667, 638.188234161538 ], "wc_reply_authors_avg": [ 975.6666666666666, 997.8444545897701 ], "reply_reviewers_avg": [ 1.0, 0.816496580927726 ], "reply_authors_avg": [ 2.0, 1.4142135623730951 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.4999999999999999, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:5WBXkpXVnnAJ:scholar.google.com/&scioq=Theoretically+Understanding+Data+Reconstruction+Leakage+in+Federated+Learning&hl=en&as_sdt=0,3", "gs_version_total": 0, "aff_unique_index": "0;1;2;3;1", "aff_unique_norm": "University of Georgia;Illinois Institute of Technology;Nanchang University;University of Connecticut", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.uga.edu;https://www.iit.edu;https://www.ncu.edu.cn;https://www.uconn.edu", "aff_unique_abbr": "UGA;IIT;NCU;UConn", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;1;0;0", "aff_country_unique": "United States;China" }, { "id": "992eLydH8G", "title": "Do Pre-trained Transformers Really Learn In-context by Gradient Descent?", "track": "main", "status": "Reject", "tldr": "", "abstract": "Is In-Context Learning (ICL) implicitly equivalent to Gradient Descent (GD)? Several recent works draw analogies between the dynamics of GD and the emergent behavior of ICL in large language models. However, these works make assumptions far from the realistic natural language setting in which language models are trained. Such discrepancies between theory and practice, therefore necessitate further investigation to validate their applicability in reality.\n\nWe start by highlighting the weaknesses in prior works that construct Transformer weights to simulate gradient descent. Their experiments with training Transformers on ICL objective, inconsistencies in the order-sensitivity of ICL and GD, sparsity of the constructed weights, and sensitivity to parameter changes are some examples of a mismatch from the real-world setting. \n\nFurthermore, we probe and compare the ICL vs. GD hypothesis in a natural setting. We conduct comprehensive empirical analyses on language models pre-trained on natural data (LLaMa-7B). Our comparisons on various performance metrics highlight the inconsistent behavior of ICL and GD as a function of various factors such as datasets, models, and number of demonstrations. \nWe observe that ICL and GD adapt the output distribution of language models differently. 
These results indicate that the equivalence between ICL and GD is an open hypothesis, requires nuanced considerations and calls for further studies.", "keywords": "In-context learning;gradient descent;large language models", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Lingfeng Shen;Aayush Mishra;Daniel Khashabi", "authorids": "~Lingfeng_Shen1;~Aayush_Mishra1;~Daniel_Khashabi2", "gender": "M;M;M", "homepage": ";https://aamixsh.github.io;http://danielkhashabi.com/", "dblp": "240/5490.html;263/3200;71/10515", "google_scholar": "PoSTdLAAAAAJ;https://scholar.google.com/citations?hl=en;pK2kQvgAAAAJ", "orcid": ";;", "linkedin": ";aamixsh/;", "or_profile": "~Lingfeng_Shen1;~Aayush_Mishra1;~Daniel_Khashabi2", "aff": "Johns Hopkins University;Adobe Systems;Johns Hopkins University", "aff_domain": "jh.edu;adobe.com;jhu.edu", "position": "MS student;Intern;Assistant Professor", "bibtex": "@misc{\nshen2024do,\ntitle={Do Pre-trained Transformers Really Learn In-context by Gradient Descent?},\nauthor={Lingfeng Shen and Aayush Mishra and Daniel Khashabi},\nyear={2024},\nurl={https://openreview.net/forum?id=992eLydH8G}\n}", "github": "", "project": "", "reviewers": "pVVn;GeTu;ivcd;uBmS", "site": "https://openreview.net/forum?id=992eLydH8G", "pdf_size": 3321649, "rating": "3;5;6;6", "confidence": "3;2;4;4", "soundness": "2;2;3;3", "contribution": "2;2;2;3", "presentation": "2;2;4;3", "wc_summary": "124;77;72;102", "wc_strengths": "53;42;97;85", "wc_weaknesses": "334;69;526;570", "wc_questions": "80;87;8;127", "wc_review": "591;275;703;884", "wc_reply_reviewers": "0;18;259;485", "wc_reply_authors": "592;552;1956;1504", "reply_reviewers": "0;1;2;2", "reply_authors": "3;3;5;4", "rating_avg": [ 5.0, 1.224744871391589 ], "confidence_avg": [ 3.25, 0.82915619758885 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.82915619758885 ], "wc_summary_avg": [ 93.75, 20.837166314064877 ], "wc_strengths_avg": [ 69.25, 22.498611068241523 ], "wc_weaknesses_avg": [ 374.75, 197.57451126094176 ], "wc_questions_avg": [ 75.5, 42.8981351576033 ], "wc_review_avg": [ 613.25, 221.51114531779209 ], "wc_reply_reviewers_avg": [ 190.5, 198.41181920440124 ], "wc_reply_authors_avg": [ 1151.0, 600.815279432872 ], "reply_reviewers_avg": [ 1.25, 0.82915619758885 ], "reply_authors_avg": [ 3.75, 0.82915619758885 ], "replies_avg": [ 29, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.4923659639173309, "gs_citation": -1, "gs_cited_by_link": "", "gs_version_total": -1, "aff_unique_index": "0;1;0", "aff_unique_norm": "Johns Hopkins University;Adobe", "aff_unique_dep": ";Adobe Systems Incorporated", "aff_unique_url": "https://www.jhu.edu;https://www.adobe.com", "aff_unique_abbr": "JHU;Adobe", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "99hq9VMkbg", "title": "Fisher-aware Quantization for DETR Detectors with Critical-category Objectives", "track": "main", "status": "Reject", "tldr": "", "abstract": "The impact of quantization on the overall performance of deep learning models is a well-studied problem. However, understanding and overcoming its effects on a more fine-grained level is still lacking, especially for harder tasks such as object detection with both classification and regression objectives. This work identifies the performance for a subset of task-critical categories, i.e. 
the critical-category performance, as a crucial yet largely overlooked fine-grained objective for detection tasks. We analyze the impact of quantization at the category-level granularity, and propose methods to improve performance for the critical categories. Specifically, we find that certain critical categories have a higher sensitivity to quantization, and have inferior generalization after quantization-aware training (QAT). To explain this, we provide theoretical and empirical links between their performance gaps and the corresponding loss landscapes with the Fisher information framework. Using this evidence, we propose a Fisher-aware mixed-precision quantization scheme, and a Fisher-trace regularization for the QAT on the critical-category loss landscape. The proposed methods improve critical-category performance metrics of the quantized transformer-based DETR detectors. When compared to the conventional quantization objective, our Fisher-aware quantization scheme shows up to 0.9% mAP increase on COCO dataset. A further 0.5% mAP improvement is achieved for selected critical categories with the proposed Fisher-trace regularization.", "keywords": "Quantization;Detection Transformers;Fisher information;Finegrained performance", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/ad7138b4d3092f260e9ab8730f1a0b1e1bb44b6c.zip", "author": "Huanrui Yang;Yafeng Huang;Zhen Dong;Yizhao Zhang;Denis A Gudovskiy;Tomoyuki Okuno;Yohei Nakata;Yuan Du;Kurt Keutzer;Shanghang Zhang", "authorids": "~Huanrui_Yang1;~Yafeng_Huang1;~Zhen_Dong3;~Yizhao_Zhang2;~Denis_A_Gudovskiy1;~Tomoyuki_Okuno1;~Yohei_Nakata1;~Yuan_Du2;~Kurt_Keutzer1;~Shanghang_Zhang4", "gender": "M;;M;M;M;M;M;M;M;F", "homepage": "https://sites.google.com/view/huanrui-yang;https://github.com/AiyaYF;https://dong-zhen.com/;https://www.linkedin.com/in/zachary-zhang-874390221/;https://gudovskiy.github.io/;;;https://ese.nju.edu.cn/dy_en/list.htm;https://people.eecs.berkeley.edu/~keutzer/;https://www.shanghangzhang.com/", "dblp": "221/2845;;;;136/4981;;27/8364.html;26/8831;k/KurtKeutzer.html;95/11531", "google_scholar": "bjNCUt8AAAAJ;;czxMUzcAAAAJ;;03qjEm0AAAAJ;https://scholar.google.co.jp/citations?user=E7BhgRsAAAAJ;MA5f-rYAAAAJ;zyu8Qy4AAAAJ;ID9QePIAAAAJ;voqw10cAAAAJ", "orcid": ";;;;0000-0002-6829-6667;;0009-0006-9838-1367;0000-0002-5316-619X;0000-0003-3868-8501;", "linkedin": ";;zhen-dong/;;gudovskiy;;;;kurtkeutzer/;", "or_profile": "~Huanrui_Yang1;~Yafeng_Huang1;~Zhen_Dong3;~Yizhao_Zhang2;~Denis_A_Gudovskiy1;~Tomoyuki_Okuno1;~Yohei_Nakata1;~Yuan_Du2;~Kurt_Keutzer1;~Shanghang_Zhang1", "aff": "University of California, Berkeley;Nanjing University;Nexusflow.ai Inc;University of California, Berkeley;Panasonic Corp;Panasonic Holdings Corporation;Panasonic;Nanjing University;University of California, Berkeley;Peking University", "aff_domain": "berkeley.edu;nju.edu.cn;nexusflow.ai;berkeley.edu;panasonic.com;panasonic.com;us.panasonic.com;nju.edu.cn;berkeley.edu;pku.edu.cn", "position": "Postdoc;MS student;Principal Researcher;Undergrad student;Senior Researcher;Researcher;Researcher;Associate Professor;Full Professor;Assistant Professor", "bibtex": "@misc{\nyang2024fisheraware,\ntitle={Fisher-aware Quantization for {DETR} Detectors with Critical-category Objectives},\nauthor={Huanrui Yang and Yafeng Huang and Zhen Dong and Yizhao Zhang and Denis A Gudovskiy and Tomoyuki Okuno and Yohei Nakata and Yuan Du and Kurt Keutzer and Shanghang 
Zhang},\nyear={2024},\nurl={https://openreview.net/forum?id=99hq9VMkbg}\n}", "github": "", "project": "", "reviewers": "DjvC;ka68;WkhP", "site": "https://openreview.net/forum?id=99hq9VMkbg", "pdf_size": 5925157, "rating": "6;6;6", "confidence": "3;3;2", "soundness": "2;3;3", "contribution": "2;3;3", "presentation": "3;3;3", "wc_summary": "44;90;30", "wc_strengths": "21;16;65", "wc_weaknesses": "5;16;13", "wc_questions": "313;78;2", "wc_review": "383;200;110", "wc_reply_reviewers": "256;57;0", "wc_reply_authors": "913;353;319", "reply_reviewers": "2;2;0", "reply_authors": "3;1;1", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 2.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 54.666666666666664, 25.629843715654783 ], "wc_strengths_avg": [ 34.0, 22.015146301277824 ], "wc_weaknesses_avg": [ 11.333333333333334, 4.642796092394707 ], "wc_questions_avg": [ 131.0, 132.38076396012627 ], "wc_review_avg": [ 231.0, 113.58697108383514 ], "wc_reply_reviewers_avg": [ 104.33333333333333, 109.74009699689941 ], "wc_reply_authors_avg": [ 528.3333333333334, 272.35434435471905 ], "reply_reviewers_avg": [ 1.3333333333333333, 0.9428090415820634 ], "reply_authors_avg": [ 1.6666666666666667, 0.9428090415820634 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 10, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:5zA5k8TYbMkJ:scholar.google.com/&scioq=Fisher-aware+Quantization+for+DETR+Detectors+with+Critical-category+Objectives&hl=en&as_sdt=0,44", "gs_version_total": 4, "aff_unique_index": "0;1;2;0;3;4;3;1;0;5", "aff_unique_norm": "University of California, Berkeley;Nanjing University;Nexusflow.ai;Panasonic Corporation;Panasonic Holdings Corporation;Peking University", "aff_unique_dep": ";;;;;", "aff_unique_url": "https://www.berkeley.edu;https://www.nju.edu.cn;https://www.nexusflow.ai;https://www.panasonic.com;https://www.panasonic.com/global;http://www.pku.edu.cn", "aff_unique_abbr": "UC Berkeley;Nanjing U;Nexusflow.ai;Panasonic;PHC;Peking U", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Berkeley;", "aff_country_unique_index": "0;1;0;0;2;2;2;1;0;1", "aff_country_unique": "United States;China;Japan" }, { "title": "Learning Decentralized Partially Observable Mean Field Control for Artificial Collective Behavior", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19304", "id": "99tKiMVJhY", "author_site": "Kai Cui, Sascha Hauck, Christian Fabian, Heinz Koeppl", "tldr": "", "abstract": "Recent reinforcement learning (RL) methods have achieved success in various domains. However, multi-agent RL (MARL) remains a challenge in terms of decentralization, partial observability and scalability to many agents. Meanwhile, collective behavior requires resolution of the aforementioned challenges, and remains of importance to many state-of-the-art applications such as active matter physics, self-organizing systems, opinion dynamics, and biological or robotic swarms. Here, MARL via mean field control (MFC) offers a potential solution to scalability, but fails to consider decentralized and partially observable systems. 
In this paper, we enable decentralized behavior of agents under partial information by proposing novel models for decentralized partially observable MFC (Dec-POMFC), a broad class of problems with permutation-invariant agents allowing for reduction to tractable single-agent Markov decision processes (MDP) with single-agent RL solution. We provide rigorous theoretical results, including a dynamic programming principle, together with optimality guarantees for Dec-POMFC solutions applied to finite swarms of interest. Algorithmically, we propose Dec-POMFC-based policy gradient methods for MARL via centralized training and decentralized execution, together with policy gradient approximation guarantees. In addition, we improve upon state-of-the-art histogram-based MFC by kernel methods, which is of separate interest also for fully observable MFC. We evaluate numerically on representative collective behavior tasks such as adapted Kuramoto and Vicsek swarming models, being on par with state-of-the-art MARL. Overall, our framework takes a step towards RL-based engineering of artificial collective behavior via MFC.", "keywords": "Mean Field Control;Multi-Agent Reinforcement Learning;Partial Observability;Collective Behavior", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Kai Cui;Sascha H. Hauck;Christian Fabian;Heinz Koeppl", "authorids": "~Kai_Cui3;~Sascha_H._Hauck1;~Christian_Fabian1;~Heinz_Koeppl1", "gender": ";;M;M", "homepage": ";;https://www.bcs.tu-darmstadt.de/team_sos/fabianchristian.en.jsp;", "dblp": ";;85/10135-1;41/6084", "google_scholar": ";;https://scholar.google.de/citations?user=hYtlGkMAAAAJ;https://scholar.google.de/citations?user=WaPW80kAAAAJ", "orcid": ";;0000-0003-4239-3861;", "linkedin": ";;https://de.linkedin.com/in/-christian-fabian;", "or_profile": "~Kai_Cui3;~Sascha_H._Hauck1;~Christian_Fabian1;~Heinz_Koeppl1", "aff": ";;Technische Universit\u00e4t Darmstadt;TU Darmstadt", "aff_domain": ";;tu-darmstadt.de;tu-darmstadt.de", "position": ";;PhD student;Full Professor", "bibtex": "@inproceedings{\ncui2024learning,\ntitle={Learning Decentralized Partially Observable Mean Field Control for Artificial Collective Behavior},\nauthor={Kai Cui and Sascha H. 
Hauck and Christian Fabian and Heinz Koeppl},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=99tKiMVJhY}\n}", "github": "", "project": "", "reviewers": "gUVQ;xiBU;PQjP", "pdf_size": 6688687, "rating": "5;6;8", "confidence": "2;2;3", "soundness": "2;3;3", "contribution": "2;3;3", "presentation": "2;3;3", "wc_summary": "39;49;45", "wc_strengths": "6;37;12", "wc_weaknesses": "133;79;21", "wc_questions": "59;73;43", "wc_review": "237;238;121", "wc_reply_reviewers": "119;0;0", "wc_reply_authors": "751;637;205", "reply_reviewers": "1;0;0", "reply_authors": "1;1;1", "rating_avg": [ 6.333333333333333, 1.247219128924647 ], "confidence_avg": [ 2.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 44.333333333333336, 4.109609335312651 ], "wc_strengths_avg": [ 18.333333333333332, 13.424687043734847 ], "wc_weaknesses_avg": [ 77.66666666666667, 45.73352769637999 ], "wc_questions_avg": [ 58.333333333333336, 12.256517540566822 ], "wc_review_avg": [ 198.66666666666666, 54.92014404771916 ], "wc_reply_reviewers_avg": [ 39.666666666666664, 56.09713797413277 ], "wc_reply_authors_avg": [ 531.0, 235.16802503741872 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 10, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.944911182523068, "gs_citation": 9, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14916352646919480751&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 8, "openreview": "https://openreview.net/forum?id=99tKiMVJhY", "pdf": "https://openreview.net/pdf?id=99tKiMVJhY", "email": ";;tu-darmstadt.de;tu-darmstadt.de", "author_num": 4, "aff_unique_index": "0;0", "aff_unique_norm": "Technische Universit\u00e4t Darmstadt", "aff_unique_dep": "", "aff_unique_url": "https://www.tu-darmstadt.de", "aff_unique_abbr": "TUD", "aff_campus_unique_index": "1", "aff_campus_unique": ";Darmstadt", "aff_country_unique_index": "0;0", "aff_country_unique": "Germany" }, { "id": "9AnR2z7iNL", "title": "DivKnowQA: Verifying the Reasoning Ability of LLM Through Open-Domain Question Answering Over Knowledge Base and Text", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Open-domain complex question answering often breaks down a multi-hop question into single-hop questions, leveraging external knowledge for solutions. Current practices show a pronounced preference for unstructured texts, such as Wikipedia, often overlooking the potential of structured knowledge sources, such as WikiData. Additionally, while existing research has employed external tools to enhance the Large Language Model(LLM)\u2019s capabilities, many tests have been conducted in artificial or toy scenarios. We argue that open-domain complex question answering presents a realistic and intricate challenge for LLM, necessitating the integration of external tools, including retrieval systems and knowledge base engines. In this paper, we present a new benchmark DIVKNOWQA to assess the LLMs\u2019 reasoning skills and tool compatibility. Comprising 940 human-annotated intricate questions, DIVKNOWQA mandates both structured and unstructured knowledge for comprehensive answers. 
The subpar performance of prevailing SOTA methods, such as DSP and REACT, on our benchmark demonstrates its challenge. Moreover, we introduce our method DETLLM, which incorporates a symbolic language generation tool and a retrieval toolbox, pioneering a new approach to address this challenge. Our data and code will be released", "keywords": "Benchmark;Question Answering;LLM;Retrieval", "primary_area": "datasets and benchmarks", "supplementary_material": "", "author": "Wenting Zhao;Ye Liu;Tong Niu;Yao Wan;Philip S. Yu;Shafiq Joty;Yingbo Zhou;Semih Yavuz", "authorids": "~Wenting_Zhao4;~Ye_Liu4;~Tong_Niu1;~Yao_Wan2;~Philip_S._Yu1;~Shafiq_Joty1;~Yingbo_Zhou1;~Semih_Yavuz1", "gender": "F;M;M;M;M;;M;F", "homepage": ";;http://wanyao.me;https://cs.uic.edu/profiles/philip-yu/;https://raihanjoty.github.io/;;;", "dblp": "96/2615-6;;167/0275.html;y/PhilipSYu;62/2078;72/8614;;41/10049-6.html", "google_scholar": "QMKD6YMAAAAJ;rrMtKR4AAAAJ;c3MtqtMAAAAJ;D0lL1r0AAAAJ;hR249csAAAAJ;H_6RQ7oAAAAJ;krh3p8AAAAAJ;aySy_OMAAAAJ", "orcid": ";;0000-0001-6937-4180;0000-0002-3491-5968;;;;", "linkedin": ";;;;;yingbozhou/;semih-yavuz-4303518b;", "or_profile": "~Ye_Liu4;~Tong_Niu1;~Yao_Wan2;~Philip_S._Yu1;~Shafiq_Joty1;~Yingbo_Zhou1;~Semih_Yavuz2;~Wenting_Zhao5", "aff": "SalesForce.com;Salesforce AI Research;Huazhong University of Science and Technology;University of Illinois Chicago;SalesForce.com;Salesforce Research;SalesForce.com;University of Illinois at Chicago", "aff_domain": "salesforce.com;salesforce.com;hust.edu.cn;uic.edu;salesforce.com;salesforce.com;salesforce.com;uic.edu", "position": "Researcher;Research Scientist;Assistant Professor;Full Professor;Principal Researcher;Research Scientist;Research Scientist;PhD student", "bibtex": "@misc{\nzhao2024divknowqa,\ntitle={DivKnow{QA}: Verifying the Reasoning Ability of {LLM} Through Open-Domain Question Answering Over Knowledge Base and Text},\nauthor={Wenting Zhao and Ye Liu and Tong Niu and Yao Wan and Philip S. 
Yu and Shafiq Joty and Yingbo Zhou and Semih Yavuz},\nyear={2024},\nurl={https://openreview.net/forum?id=9AnR2z7iNL}\n}", "github": "", "project": "", "reviewers": "r9Z6;dqDr;7HFZ", "site": "https://openreview.net/forum?id=9AnR2z7iNL", "pdf_size": 909077, "rating": "3;5;5", "confidence": "4;3;4", "soundness": "2;3;2", "contribution": "2;2;2", "presentation": "2;3;2", "wc_summary": "105;78;300", "wc_strengths": "86;28;200", "wc_weaknesses": "206;88;308", "wc_questions": "42;46;19", "wc_review": "439;240;827", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "647;417;1098", "reply_reviewers": "0;0;0", "reply_authors": "1;1;2", "rating_avg": [ 4.333333333333333, 0.9428090415820634 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 161.0, 98.90399385262458 ], "wc_strengths_avg": [ 104.66666666666667, 71.44850515503379 ], "wc_weaknesses_avg": [ 200.66666666666666, 89.89376446055026 ], "wc_questions_avg": [ 35.666666666666664, 11.897712198383164 ], "wc_review_avg": [ 502.0, 243.74713673531974 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 720.6666666666666, 282.8548901625865 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.3333333333333333, 0.4714045207910317 ], "replies_avg": [ 7, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": -0.49999999999999983, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:QuMYRhh8zrcJ:scholar.google.com/&scioq=DivKnowQA:+Verifying+the+Reasoning+Ability+of+LLM+Through+Open-Domain+Question+Answering+Over+Knowledge+Base+and+Text&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;0;1;2;0;0;0;2", "aff_unique_norm": "Salesforce;Huazhong University of Science and Technology;University of Illinois at Chicago", "aff_unique_dep": ";;", "aff_unique_url": "https://www.salesforce.com;http://www.hust.edu.cn;https://www.uic.edu", "aff_unique_abbr": "Salesforce;HUST;UIC", "aff_campus_unique_index": "1;1", "aff_campus_unique": ";Chicago", "aff_country_unique_index": "0;0;1;0;0;0;0;0", "aff_country_unique": "United States;China" }, { "id": "9BERij4Gbv", "title": "Guided Evolution with Binary Discriminators for ML Program Search", "track": "main", "status": "Reject", "tldr": "", "abstract": "How to automatically design better machine learning programs is an open problem within AutoML. While evolution has been a popular tool to search for better ML programs, using learning itself to guide the search has been less successful and less understood on harder problems but has the promise to dramatically increase the speed and final performance of the optimization process. We propose guiding evolution with a binary discriminator, trained online to distinguish which program is better given a pair of programs. The discriminator selects better programs without having to perform a costly evaluation and thus speeds up the convergence of evolution. Our method can encode a wide variety of ML components including symbolic optimizers, neural architectures, RL loss functions, and symbolic regression equations with the same directed acyclic graph representation.
By combining this representation with modern GNNs and an adaptive mutation strategy, we demonstrate our method can speed up evolution across a set of diverse problems including a 3.7x speedup on the symbolic search for ML optimizers and a 4x speedup for RL loss functions.", "keywords": "automl;evolution;program search", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/cd95578fe2161440c052fbb679f124667b06e639.pdf", "author": "John D Co-Reyes;Yingjie Miao;George Tucker;Aleksandra Faust;Esteban Real", "authorids": "~John_D_Co-Reyes1;~Yingjie_Miao1;~George_Tucker1;~Aleksandra_Faust1;~Esteban_Real1", "gender": "M;;M;F;M", "homepage": ";;https://sites.google.com/view/gjt;http://www.afaust.info;https://www.estebanreal.com/", "dblp": "198/1129;22/10043;135/5748;135/8420;156/0082", "google_scholar": ";ScqM05wAAAAJ;-gJkPHIAAAAJ;RK72t68AAAAJ;ipTsozQAAAAJ", "orcid": ";;;0000-0002-3268-8685;", "linkedin": ";yingjiemiao/;;aleksandrafaust;", "or_profile": "~John_D_Co-Reyes1;~Yingjie_Miao1;~George_Tucker1;~Aleksandra_Faust1;~Esteban_Real1", "aff": ";Google DeepMind;Google Brain;Google Brain;Google", "aff_domain": ";google.com;google.com;google.com;google.com", "position": ";Software Engineer;Research Scientist;Principal Researcher;Engineer/Researcher", "bibtex": "@misc{\nco-reyes2024guided,\ntitle={Guided Evolution with Binary Discriminators for {ML} Program Search},\nauthor={John D Co-Reyes and Yingjie Miao and George Tucker and Aleksandra Faust and Esteban Real},\nyear={2024},\nurl={https://openreview.net/forum?id=9BERij4Gbv}\n}", "github": "", "project": "", "reviewers": "qo6q;3xvf;Mfci", "site": "https://openreview.net/forum?id=9BERij4Gbv", "pdf_size": 1084741, "rating": "3;5;8", "confidence": "4;4;4", "soundness": "1;3;4", "contribution": "1;2;3", "presentation": "3;3;3", "wc_summary": "43;82;176", "wc_strengths": "7;134;214", "wc_weaknesses": "31;298;211", "wc_questions": "2;2;300", "wc_review": "83;516;901", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;356;0", "reply_reviewers": "0;0;0", "reply_authors": "0;1;0", "rating_avg": [ 5.333333333333333, 2.0548046676563256 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.6666666666666665, 1.247219128924647 ], "contribution_avg": [ 2.0, 0.816496580927726 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 100.33333333333333, 55.82313339666829 ], "wc_strengths_avg": [ 118.33333333333333, 85.23040667638647 ], "wc_weaknesses_avg": [ 180.0, 111.18453129819814 ], "wc_questions_avg": [ 101.33333333333333, 140.47854719572743 ], "wc_review_avg": [ 500.0, 334.13869375854495 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 118.66666666666667, 167.82000940160728 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0.3333333333333333, 0.4714045207910317 ], "replies_avg": [ 6, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=8820123988891993038&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "Google", "aff_unique_dep": "Google DeepMind", "aff_unique_url": "https://deepmind.com", "aff_unique_abbr": "DeepMind", "aff_campus_unique_index": "1;1;1", "aff_campus_unique": ";Mountain View", "aff_country_unique_index": "0;1;1;1", "aff_country_unique": "United Kingdom;United States" }, { "title": "Multi-granularity Correspondence Learning from Long-term Noisy Videos", "status": "Oral", "track": "main", "site": 
"https://iclr.cc/virtual/2024/poster/19303", "id": "9Cu8MRmhq2", "author_site": "Yijie Lin, Jie Zhang, Zhenyu Huang, Jia Liu, zujie wen, Xi Peng", "tldr": "", "abstract": "Existing video-language studies mainly focus on learning short video clips, leaving long-term temporal dependencies rarely explored due to over-high computational cost of modeling long videos. To address this issue, one feasible solution is learning the correspondence between video clips and captions, which however inevitably encounters the multi-granularity noisy correspondence (MNC) problem. To be specific, MNC refers to the clip-caption misalignment (coarse-grained) and frame-word misalignment (fine-grained), hindering temporal learning and video understanding. In this paper, we propose NOise Robust Temporal Optimal traNsport (Norton) that addresses MNC in a unified optimal transport (OT) framework. In brief, Norton employs video-paragraph and clip-caption contrastive losses to capture long-term dependencies based on OT. To address coarse-grained misalignment in video-paragraph contrast, Norton filters out the irrelevant clips and captions through an alignable prompt bucket and realigns asynchronous clip-caption pairs based on transport distance. To address the fine-grained misalignment, Norton incorporates a soft-maximum operator to identify crucial words and key frames. Additionally, Norton exploits the potential faulty negative samples in clip-caption contrast by rectifying the alignment target with OT assignment to ensure precise temporal modeling. Extensive experiments on video retrieval, videoQA, and action segmentation verify the effectiveness of our method. \nCode is available at https://lin-yijie.github.io/projects/Norton.", "keywords": "Video-language pre-training;Noisy correspondence", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Yijie Lin;Jie Zhang;Zhenyu Huang;Jia Liu;zujie wen;Xi Peng", "authorids": "~Yijie_Lin1;~Jie_Zhang42;~Zhenyu_Huang1;~Jia_Liu4;~zujie_wen1;~Xi_Peng3", "gender": ";F;M;M;M;M", "homepage": "https://lin-yijie.github.io;;https://hi-zhenyu.github.io/;;;http://www.pengxi.me", "dblp": "02/9654-1.html;84/6889-60;181/2445-5;;260/0351;18/931-1", "google_scholar": "https://scholar.google.com.hk/citations?user=KXKVYHsAAAAJ;;0mdxlb8AAAAJ;https://scholar.google.com/citations?hl=zh-CN;vsZ4dK8AAAAJ;bw9FOHAAAAAJ", "orcid": "0000-0003-1746-295X;0000-0001-6331-4005;0000-0003-4161-9427;;;", "linkedin": ";;;;;", "or_profile": "~Yijie_Lin1;~Jie_Zhang42;~Zhenyu_Huang1;~Jia_Liu4;~zujie_wen1;~Xi_Peng2", "aff": "Sichuan University;;Alibaba Group;Ant Group;Ant Group;Sichuan University", "aff_domain": "scu.edu.cn;;antgroup.com;antgroup.com;antgroup.com;scu.edu.cn", "position": "PhD student;;Researcher;Principal Researcher;Researcher;Full Professor", "bibtex": "@inproceedings{\nlin2024multigranularity,\ntitle={Multi-granularity Correspondence Learning from Long-term Noisy Videos},\nauthor={Yijie Lin and Jie Zhang and Zhenyu Huang and Jia Liu and zujie wen and Xi Peng},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=9Cu8MRmhq2}\n}", "github": "", "project": "", "reviewers": "83JB;pP85;TtfV;UrFs", "pdf_size": 1235445, "rating": "8;8;8;8", "confidence": "5;5;4;3", "soundness": "4;4;4;3", "contribution": "4;4;4;3", "presentation": "4;4;4;3", "wc_summary": "100;151;127;111", "wc_strengths": "169;208;174;168", "wc_weaknesses": 
"114;185;189;138", "wc_questions": "137;14;61;185", "wc_review": "520;558;551;602", "wc_reply_reviewers": "0;0;0;24", "wc_reply_authors": "957;928;1278;926", "reply_reviewers": "0;0;0;1", "reply_authors": "2;2;2;3", "rating_avg": [ 8.0, 0.0 ], "confidence_avg": [ 4.25, 0.82915619758885 ], "soundness_avg": [ 3.75, 0.4330127018922193 ], "contribution_avg": [ 3.75, 0.4330127018922193 ], "presentation_avg": [ 3.75, 0.4330127018922193 ], "wc_summary_avg": [ 122.25, 19.17517926904466 ], "wc_strengths_avg": [ 179.75, 16.467771555374455 ], "wc_weaknesses_avg": [ 156.5, 31.68990375498165 ], "wc_questions_avg": [ 99.25, 66.16031665583229 ], "wc_review_avg": [ 557.75, 29.277764600460877 ], "wc_reply_reviewers_avg": [ 6.0, 10.392304845413264 ], "wc_reply_authors_avg": [ 1022.25, 148.1660808012414 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 2.25, 0.4330127018922193 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 20, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=7985543970551262066&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=9Cu8MRmhq2", "pdf": "https://openreview.net/pdf?id=9Cu8MRmhq2", "email": "scu.edu.cn;;antgroup.com;antgroup.com;antgroup.com;scu.edu.cn", "author_num": 6, "aff_unique_index": "0;1;2;2;0", "aff_unique_norm": "Sichuan University;Alibaba Group;Ant Group", "aff_unique_dep": ";;", "aff_unique_url": "https://www.scu.edu.cn;https://www.alibaba.com;https://www.antgroup.com", "aff_unique_abbr": "SCU;Alibaba;Ant Group", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "China" }, { "title": "Elucidating the design space of classifier-guided diffusion generation", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19302", "id": "9DXXMXnIGm", "author_site": "Jiajun Ma, Tianyang Hu, Wenjia Wang, Jiacheng Sun", "tldr": "", "abstract": "Guidance in conditional diffusion generation is of great importance for sample quality and controllability. \nHowever, existing guidance schemes are to be desired. \nOn one hand, mainstream methods such as classifier guidance and classifier-free guidance both require extra training with labeled data, which is time-consuming and unable to adapt to new conditions.\nOn the other hand, training-free methods such as universal guidance, though more flexible, have yet to demonstrate comparable performance. \nIn this work, through a comprehensive investigation into the design space, we show that it is possible to achieve significant performance improvements over existing guidance schemes by leveraging off-the-shelf classifiers in a training-free fashion, enjoying the best of both worlds. \nEmploying calibration as a general guideline, we propose several pre-conditioning techniques to better exploit pretrained off-the-shelf classifiers for guiding diffusion generation. 
\nExtensive experiments on ImageNet validate our proposed method, showing that state-of-the-art (SOTA) diffusion models (DDPM, EDM, DiT) can be further improved (up to 20\\%) using off-the-shelf classifiers with barely any extra computational cost.\nWith the proliferation of publicly available pretrained classifiers, our proposed approach has great potential and can be readily scaled up to text-to-image generation tasks.", "keywords": "conditional diffusion sampling;classifier guidance", "primary_area": "generative models", "supplementary_material": "/attachment/a77119b5f7e1cdcb60a31b0cda3fac0bd2d35a99.pdf", "author": "Jiajun Ma;Tianyang Hu;Wenjia Wang;Jiacheng Sun", "authorids": "~Jiajun_Ma1;~Tianyang_Hu1;~Wenjia_Wang2;~Jiacheng_Sun1", "gender": "M;M;M;M", "homepage": ";https://hu-tianyang.github.io/;https://www.wenjia-w.com/;", "dblp": ";170/2551;;165/5350", "google_scholar": ";mlA_3r0AAAAJ;EKS1sO0AAAAJ;", "orcid": ";;;", "linkedin": "https://www.linkedin.cn/incareer/in/ACoAABNx8OQBL99vmEOUUrE18c5XwhVpsxhEGu0;;;https://www.linkedin.cn/incareer/in/jiacheng-sun-ab622b131", "or_profile": "~Jiajun_Ma1;~Tianyang_Hu1;~Wenjia_Wang2;~Jiacheng_Sun1", "aff": "Hong Kong University of Science and Technology;Huawei Noah's Ark Lab;HKUST (GZ);Huawei Noah's Ark Lab", "aff_domain": "ust.hk;huawei.com;hkust-gz.edu.cn;huawei.com", "position": "PhD student;Researcher;Assistant Professor;Senior Researcher", "bibtex": "@inproceedings{\nma2024elucidating,\ntitle={Elucidating the design space of classifier-guided diffusion generation},\nauthor={Jiajun Ma and Tianyang Hu and Wenjia Wang and Jiacheng Sun},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=9DXXMXnIGm}\n}", "github": "", "project": "", "reviewers": "VZ9L;rssc;wqgP;r6Zr;6jri", "pdf_size": 4818476, "rating": "5;5;6;6;8", "confidence": "5;4;5;3;5", "soundness": "3;2;3;2;4", "contribution": "3;2;3;3;3", "presentation": "3;2;3;2;3", "wc_summary": "78;60;43;68;116", "wc_strengths": "93;33;46;48;114", "wc_weaknesses": "157;232;493;286;257", "wc_questions": "60;2;29;169;69", "wc_review": "388;327;611;571;556", "wc_reply_reviewers": "66;32;0;372;52", "wc_reply_authors": "680;691;1641;1695;1085", "reply_reviewers": "1;1;0;4;1", "reply_authors": "1;1;4;3;2", "rating_avg": [ 6.0, 1.0954451150103321 ], "confidence_avg": [ 4.4, 0.8 ], "soundness_avg": [ 2.8, 0.7483314773547882 ], "contribution_avg": [ 2.8, 0.39999999999999997 ], "presentation_avg": [ 2.6, 0.4898979485566356 ], "wc_summary_avg": [ 73.0, 24.363907732545698 ], "wc_strengths_avg": [ 66.8, 31.121696611849426 ], "wc_weaknesses_avg": [ 285.0, 112.4651056995013 ], "wc_questions_avg": [ 65.8, 56.77816481711962 ], "wc_review_avg": [ 490.6, 111.82951309918147 ], "wc_reply_reviewers_avg": [ 104.4, 135.6253663589522 ], "wc_reply_authors_avg": [ 1158.4, 441.26164573867055 ], "reply_reviewers_avg": [ 1.4, 1.3564659966250536 ], "reply_authors_avg": [ 2.2, 1.16619037896906 ], "replies_avg": [ 27, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.22821773229381925, "gs_citation": 10, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=17380173202151892858&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=9DXXMXnIGm", "pdf": "https://openreview.net/pdf?id=9DXXMXnIGm", "email": "ust.hk;huawei.com;hkust-gz.edu.cn;huawei.com", "author_num": 4, "aff_unique_index": "0;1;0;1", "aff_unique_norm": "Hong Kong University of Science and Technology;Huawei", "aff_unique_dep": 
";Noah's Ark Lab", "aff_unique_url": "https://www.ust.hk;https://www.huawei.com", "aff_unique_abbr": "HKUST;Huawei", "aff_campus_unique_index": "0;2", "aff_campus_unique": "Hong Kong SAR;;Guangzhou", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "China" }, { "title": "ED-NeRF: Efficient Text-Guided Editing of 3D Scene With Latent Space NeRF", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19301", "id": "9DvDRTTdlu", "author_site": "Jangho Park, Gihyun Kwon, Jong Chul YE", "tldr": "", "abstract": "Recently, there has been a significant advancement in text-to-image diffusion models, leading to groundbreaking performance in 2D image generation. These advancements have been extended to 3D models, enabling the generation of novel 3D objects from textual descriptions. This has evolved into NeRF editing methods, which allow the manipulation of existing 3D objects through textual conditioning. However, existing NeRF editing techniques have faced limitations in their performance due to slow training speeds and the use of loss functions that do not adequately consider editing. To address this, here we present a novel 3D NeRF editing approach dubbed ED-NeRF by successfully embedding real-world scenes into the latent space of the latent diffusion model (LDM) through a unique refinement layer. This approach enables us to obtain a NeRF backbone that is not only faster but also more amenable to editing compared to traditional image space NeRF editing. Furthermore, we propose an improved loss function tailored for editing by migrating the delta denoising score (DDS) distillation loss, originally used in 2D image editing to the three-dimensional domain. This novel loss function surpasses the well-known score distillation sampling (SDS) loss in terms of suitability for editing purposes. 
Our experimental results demonstrate that ED-NeRF achieves faster editing speed while producing improved output quality compared to state-of-the-art 3D editing models.", "keywords": "NeRF;Diffusion model;3D scene editing", "primary_area": "generative models", "supplementary_material": "/attachment/2c94c50c0d663aed124b968c3da8d7c433667995.zip", "author": "JangHo Park;Gihyun Kwon;Jong Chul Ye", "authorids": "~JangHo_Park2;~Gihyun_Kwon1;~Jong_Chul_Ye1", "gender": "M;M;M", "homepage": "https://sites.google.com/view/janghopark/;https://sites.google.com/view/gihyunkwon;https://bispl.weebly.com/", "dblp": "154/0659;241/7060;15/5613", "google_scholar": ";yexbg8gAAAAJ;HNMjoNEAAAAJ", "orcid": ";;", "linkedin": ";gihyun-kwon-b4665a233/;", "or_profile": "~JangHo_Park2;~Gihyun_Kwon1;~Jong_Chul_Ye1", "aff": "Korea Advanced Institute of Science & Technology;Korea Advanced Institute of Science & Technology;Korea Advanced Institute of Science & Technology", "aff_domain": "kaist.ac.kr;kaist.ac.kr;kaist.ac.kr", "position": "MS student;PhD student;Full Professor", "bibtex": "@inproceedings{\npark2024ednerf,\ntitle={{ED}-Ne{RF}: Efficient Text-Guided Editing of 3D Scene With Latent Space Ne{RF}},\nauthor={JangHo Park and Gihyun Kwon and Jong Chul Ye},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=9DvDRTTdlu}\n}", "github": "", "project": "", "reviewers": "rsnk;EEVN;kJsR;mMij", "pdf_size": 25650691, "rating": "5;5;6;6", "confidence": "5;4;3;3", "soundness": "2;3;3;4", "contribution": "2;2;2;3", "presentation": "3;3;3;2", "wc_summary": "137;67;70;107", "wc_strengths": "164;26;17;182", "wc_weaknesses": "141;229;118;133", "wc_questions": "146;32;12;137", "wc_review": "588;354;217;559", "wc_reply_reviewers": "0;0;0;12", "wc_reply_authors": "1113;921;386;678", "reply_reviewers": "0;0;0;1", "reply_authors": "4;3;3;3", "rating_avg": [ 5.5, 0.5 ], "confidence_avg": [ 3.75, 0.82915619758885 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 95.25, 28.795615985771168 ], "wc_strengths_avg": [ 97.25, 76.08342460746624 ], "wc_weaknesses_avg": [ 155.25, 43.37265843823733 ], "wc_questions_avg": [ 81.75, 60.25103733546834 ], "wc_review_avg": [ 429.5, 152.27360243981883 ], "wc_reply_reviewers_avg": [ 3.0, 5.196152422706632 ], "wc_reply_authors_avg": [ 774.5, 272.1621759172277 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 3.25, 0.4330127018922193 ], "replies_avg": [ 21, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.9045340337332909, "gs_citation": 34, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=4230739473308506611&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=9DvDRTTdlu", "pdf": "https://openreview.net/pdf?id=9DvDRTTdlu", "email": "kaist.ac.kr;kaist.ac.kr;kaist.ac.kr", "author_num": 3, "aff_unique_index": "0;0;0", "aff_unique_norm": "Korea Advanced Institute of Science and Technology", "aff_unique_dep": "", "aff_unique_url": "https://www.kaist.ac.kr", "aff_unique_abbr": "KAIST", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "South Korea" }, { "id": "9Ebi1euQZQ", "title": "HallE-Switch: Rethinking and Controlling Object Existence Hallucinations in Large Vision-Language Models for Detailed Caption", "track": "main", "status": "Reject", "tldr": 
"", "abstract": "Current large vision-language models (LVLMs) achieve remarkable progress, yet there remains significant uncertainty regarding their ability to accurately apprehend visual details, that is, in performing detailed captioning. To address this, we introduce \\textit{CCEval}, a GPT-4 assisted evaluation method tailored for detailed captioning. Interestingly, while LVLMs demonstrate minimal object existence hallucination in existing VQA benchmarks, our proposed evaluation reveals continued susceptibility to such hallucinations. In this paper, we make the first attempt to investigate and attribute such hallucinations, including image resolution, the language decoder size, and instruction data amount, quality, granularity. Our findings underscore the unwarranted inference when the language description includes details at a finer object granularity than what the vision module can ground or verify, thus inducing hallucination. To control such hallucinations, we further attribute the reliability of captioning to contextual knowledge (involving only contextually grounded objects) and parametric knowledge (containing inferred objects by the model). Thus, we introduce $\\textit{HallE-Switch}$, a controllable LVLM in terms of $\\textbf{Hall}$ucination in object $\\textbf{E}$xistence. HallE-Switch can condition the captioning to shift between (i) exclusively depicting contextual knowledge for grounded objects and (ii) blending it with parametric knowledge to imagine inferred objects. Our method reduces hallucination by 44\\% compared to LLaVA$_{7B}$ and maintains the same object coverage.", "keywords": "vision-language;large vision-language models;object hallucination", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/19243247ff574c8808b01f9ba639e85fbbe1320c.pdf", "author": "Bohan Zhai;Shijia Yang;Xiangchen Zhao;Chenfeng Xu;Sheng Shen;Dongdi Zhao;Kurt Keutzer;Manling Li;Tan Yan;Xiangjun Fan", "authorids": "~Bohan_Zhai1;~Shijia_Yang1;~Xiangchen_Zhao1;~Chenfeng_Xu1;~Sheng_Shen2;~Dongdi_Zhao1;~Kurt_Keutzer1;~Manling_Li1;~Tan_Yan2;~Xiangjun_Fan1", "gender": "M;F;M;M;M;M;F;M;M;M", "homepage": ";;;;https://sincerass.github.io;https://people.eecs.berkeley.edu/~keutzer/;https://limanling.github.io/;http://www.google.com;;https://github.com/YoPatapon", "dblp": ";;;65/1881;138/5764-1.html;k/KurtKeutzer.html;178/3620;;;", "google_scholar": "TAbgR14AAAAJ;;https://scholar.google.com/citations?hl=en;RpqvaTUAAAAJ;https://scholar.google.com/citations?hl=en;ID9QePIAAAAJ;6U4SXnUAAAAJ;;;", "orcid": ";;;0000-0002-4941-6985;;0000-0003-3868-8501;;;;", "linkedin": ";bronya-shijia-yang-762927193/;;;sheng-s-ab198a174/;kurtkeutzer/;;;xiangjun-max-fan-7984b12b/;", "or_profile": "~Bohan_Zhai1;~Shijia_Yang1;~Xiangchen_Zhao1;~Chenfeng_Xu1;~Sheng_Shen2;~Kurt_Keutzer1;~Manling_Li1;~Tan_Yan2;~Xiangjun_Fan1;~Dongdi_Zhao2", "aff": "Bytedance;Stanford University;Bytedance;University of California, Berkeley;University of California, Berkeley;University of California, Berkeley;Stanford University;;ByteDance Inc.;Bytedance", "aff_domain": "bytedance.com;stanford.edu;bytedance.com;berkeley.edu;berkeley.edu;berkeley.edu;stanford.edu;;bytedance.com;bytedance.com", "position": "Researcher;MS student;Researcher;PhD student;PhD student;Full Professor;Postdoc;;Machine Learning Engineer;Researcher", "bibtex": "@misc{\nzhai2024halleswitch,\ntitle={HallE-Switch: Rethinking and Controlling Object Existence Hallucinations in Large Vision-Language 
Models for Detailed Caption},\nauthor={Bohan Zhai and Shijia Yang and Xiangchen Zhao and Chenfeng Xu and Sheng Shen and Dongdi Zhao and Kurt Keutzer and Manling Li and Tan Yan and Xiangjun Fan},\nyear={2024},\nurl={https://openreview.net/forum?id=9Ebi1euQZQ}\n}", "github": "", "project": "", "reviewers": "PjV9;DU9c;6XKb;ZWbF", "site": "https://openreview.net/forum?id=9Ebi1euQZQ", "pdf_size": 841003, "rating": "3;5;6;8", "confidence": "4;5;4;4", "soundness": "3;2;3;3", "contribution": "2;2;4;3", "presentation": "3;2;3;3", "wc_summary": "170;46;75;234", "wc_strengths": "64;52;44;15", "wc_weaknesses": "86;290;88;19", "wc_questions": "14;20;168;1", "wc_review": "334;408;375;269", "wc_reply_reviewers": "0;0;27;0", "wc_reply_authors": "504;788;1186;73", "reply_reviewers": "0;0;1;0", "reply_authors": "1;2;2;1", "rating_avg": [ 5.5, 1.8027756377319946 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.82915619758885 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 131.25, 74.9845817485168 ], "wc_strengths_avg": [ 43.75, 18.06066167115701 ], "wc_weaknesses_avg": [ 120.75, 101.58586269752303 ], "wc_questions_avg": [ 50.75, 68.04180700128414 ], "wc_review_avg": [ 346.5, 51.8579791353269 ], "wc_reply_reviewers_avg": [ 6.75, 11.691342951089922 ], "wc_reply_authors_avg": [ 637.75, 406.19722734159575 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 10, 0 ], "corr_rating_confidence": -0.16012815380508713, "gs_citation": 56, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=9614788549598911123&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 0, "aff_unique_index": "0;1;0;2;2;2;1;0;0", "aff_unique_norm": "ByteDance;Stanford University;University of California, Berkeley", "aff_unique_dep": ";;", "aff_unique_url": "https://www.bytedance.com;https://www.stanford.edu;https://www.berkeley.edu", "aff_unique_abbr": "Bytedance;Stanford;UC Berkeley", "aff_campus_unique_index": "1;2;2;2;1", "aff_campus_unique": ";Stanford;Berkeley", "aff_country_unique_index": "0;1;0;1;1;1;1;0;0", "aff_country_unique": "China;United States" }, { "id": "9F0xInGNBF", "title": "VIDEOPROMPTER: AN ENSEMBLE OF FOUNDATIONAL MODELS FOR ZERO-SHOT VIDEO UNDERSTANDING", "track": "main", "status": "Reject", "tldr": "", "abstract": "Vision-language models (VLMs) classify the query video by calculating a similarity score between the visual features and text-based class label representations.\nRecently, large language models (LLMs) have been used to enrich the text-based\nclass labels by enhancing the descriptiveness of the class names. However, these\nimprovements are restricted to the text-based classifier only, and the query visual\nfeatures are not considered. In this paper, we propose a framework which combines pre-trained discriminative VLMs with pre-trained generative video-to-text\nand text-to-text models. We introduce two key modifications to the standard zero-shot setting. First, we propose language-guided visual feature enhancement and\nemploy a video-to-text model to convert the query video to its descriptive form.\nThe resulting descriptions contain vital visual cues of the query video, such as\nwhat objects are present and their spatio-temporal interactions. These descriptive cues provide additional semantic knowledge to VLMs to enhance their zero-shot performance. 
Second, we propose video-specific prompts to LLMs to generate more meaningful descriptions to enrich class label representations. Specifically, we introduce prompt techniques to create a Tree Hierarchy of Categories for\nclass names, offering a higher-level action context for additional visual cues, We\ndemonstrate the effectiveness of our approach in video understanding across three\ndifferent zero-shot settings: 1) video action recognition, 2) video-to-text and text-to-video retrieval, and 3) time-sensitive video tasks. Consistent improvements\nacross multiple benchmarks and with various VLMs demonstrate the effectiveness of our proposed framework. Our code will be made publicly available.", "keywords": "Video-Language models;LLM;Video Understanding;Zero-shot", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Adeel Yousaf;Muzammal Naseer;Salman Khan;Fahad Khan;Mubarak Shah", "authorids": "~Adeel_Yousaf1;~Muzammal_Naseer1;~Salman_Khan4;~Fahad_Khan1;~Mubarak_Shah3", "gender": "M;M;M;M;M", "homepage": "https://www.crcv.ucf.edu/people/students/phd-students/;https://muzammal-naseer.com/;https://salman-h-khan.github.io/;https://sites.google.com/view/fahadkhans/home;https://www.crcv.ucf.edu/person/mubarak-shah/", "dblp": "217/1167;;32/11535-1;05/8618;s/MubarakShah", "google_scholar": "VpLbThoAAAAJ;https://scholar.google.ch/citations?user=tM9xKA8AAAAJ;https://scholar.google.es/citations?user=M59O9lkAAAAJ;zvaeYnUAAAAJ;https://scholar.google.com.tw/citations?user=p8gsO3gAAAAJ", "orcid": "0000-0003-0275-903X;0000-0001-7663-7161;0000-0002-9502-1749;;0000-0002-8216-1128", "linkedin": "adeel-yousaf-aa58b71a8/;muzammalnaseer/;;;mubarak-shah-b6aa68213/", "or_profile": "~Adeel_Yousaf1;~Muzammal_Naseer1;~Salman_Khan4;~Fahad_Khan1;~Mubarak_Shah3", "aff": "University of Central Florida;Mohamed bin Zayed University of Artificial Intelligence;Australian National University;Link\u00f6ping University;University of Central Florida", "aff_domain": "ucf.edu;mbzuai.ac.ae;anu.edu.au;liu.se;ucf.edu", "position": "PhD student;Researcher;Lecturer;Associate Professor;Full Professor", "bibtex": "@misc{\nyousaf2024videoprompter,\ntitle={{VIDEOPROMPTER}: {AN} {ENSEMBLE} {OF} {FOUNDATIONAL} {MODELS} {FOR} {ZERO}-{SHOT} {VIDEO} {UNDERSTANDING}},\nauthor={Adeel Yousaf and Muzammal Naseer and Salman Khan and Fahad Khan and Mubarak Shah},\nyear={2024},\nurl={https://openreview.net/forum?id=9F0xInGNBF}\n}", "github": "", "project": "", "reviewers": "FnrC;1vg9;8fLg;ypLm", "site": "https://openreview.net/forum?id=9F0xInGNBF", "pdf_size": 1069920, "rating": "5;5;5;6", "confidence": "4;4;3;5", "soundness": "3;2;3;3", "contribution": "2;2;3;3", "presentation": "3;3;2;4", "wc_summary": "57;174;57;46", "wc_strengths": "90;38;38;59", "wc_weaknesses": "113;263;155;99", "wc_questions": "11;8;14;2", "wc_review": "271;483;264;206", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "563;730;633;611", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 5.25, 0.4330127018922193 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 83.5, 52.44282601080914 ], "wc_strengths_avg": [ 56.25, 21.288200957337846 ], "wc_weaknesses_avg": [ 157.5, 64.30202174115523 ], "wc_questions_avg": [ 8.75, 4.437059837324712 ], "wc_review_avg": [ 306.0, 105.25920387310556 ], "wc_reply_reviewers_avg": [ 0, 
0 ], "wc_reply_authors_avg": [ 634.25, 60.80039062374517 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.816496580927726, "gs_citation": 4, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=9194318577035266866&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "aff_unique_index": "0;1;2;3;0", "aff_unique_norm": "University of Central Florida;Mohamed bin Zayed University of Artificial Intelligence;Australian National University;Link\u00f6ping University", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.ucf.edu;https://mbzuai.ac.ae;https://www.anu.edu.au;https://www.liu.se", "aff_unique_abbr": "UCF;MBZUAI;ANU;LiU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;2;3;0", "aff_country_unique": "United States;United Arab Emirates;Australia;Sweden" }, { "id": "9FXGX00iMF", "title": "BWS: Best Window Selection Based on Sample Scores for Data Pruning across Broad Ranges", "track": "main", "status": "Reject", "tldr": "", "abstract": "Data subset selection aims to find a smaller yet informative subset of a large dataset that can approximate the full-dataset training, addressing challenges associated with training neural networks on large-scale datasets. However, existing methods tend to specialize in either high or low selection ratio regimes, lacking a universal approach that consistently achieves competitive performance across a broad range of selection ratios. We introduce a universal and efficient data subset selection method, Best Window Selection (BWS), by proposing a method to choose the best window subset from samples ordered based on their difficulty scores. This approach offers flexibility by allowing the choice of window intervals that span from easy to difficult samples. Furthermore, we provide an efficient mechanism for selecting the best window subset by evaluating its quality using kernel ridge regression. 
Our experimental results demonstrate the superior performance of BWS compared to other baselines across a broad range of selection ratios over datasets, including CIFAR-10/100 and ImageNet, and the scenarios involving training from random initialization or fine-tuning of pre-trained models.", "keywords": "Data subset selection;data pruning;data-efficient learning", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/e0f31acbdace2895754365d4e7cb78ab4eb4bd25.zip", "author": "Hoyong Choi;Nohyun Ki;Hye Won Chung", "authorids": "~Hoyong_Choi1;~Nohyun_Ki1;~Hye_Won_Chung2", "gender": "M;F;M", "homepage": ";https://iids.kaist.ac.kr/;https://iids.kaist.ac.kr/people", "dblp": ";https://dblp.uni-trier.de/pers/hd/c/Chung:Hye_Won;", "google_scholar": ";;", "orcid": ";;", "linkedin": "%ED%98%B8%EC%9A%A9-%EC%B5%9C-67b9a919b/;;", "or_profile": "~Hoyong_Choi1;~Hye_Won_Chung2;~Ki_Nohyun1", "aff": "KAIST;Korea Advanced Institute of Science & Technology;KAIST, Korea Advanced Institute of Science & Technology", "aff_domain": "kaist.ac.kr;kaist.ac.kr;ee.kaist.ac.kr", "position": "PhD student;Associate Professor;PhD student", "bibtex": "@misc{\nchoi2024bws,\ntitle={{BWS}: Best Window Selection Based on Sample Scores for Data Pruning across Broad Ranges},\nauthor={Hoyong Choi and Nohyun Ki and Hye Won Chung},\nyear={2024},\nurl={https://openreview.net/forum?id=9FXGX00iMF}\n}", "github": "", "project": "", "reviewers": "BL3J;j18Y;LWro", "site": "https://openreview.net/forum?id=9FXGX00iMF", "pdf_size": 1927725, "rating": "5;5;6", "confidence": "4;3;4", "soundness": "2;3;3", "contribution": "2;2;3", "presentation": "3;3;3", "wc_summary": "74;72;104", "wc_strengths": "60;52;101", "wc_weaknesses": "89;86;70", "wc_questions": "90;5;4", "wc_review": "313;215;279", "wc_reply_reviewers": "186;0;9", "wc_reply_authors": "1861;1214;599", "reply_reviewers": "1;0;1", "reply_authors": "4;2;1", "rating_avg": [ 5.333333333333333, 0.4714045207910317 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 83.33333333333333, 14.636332266733433 ], "wc_strengths_avg": [ 71.0, 21.463146709340332 ], "wc_weaknesses_avg": [ 81.66666666666667, 8.339997335464536 ], "wc_questions_avg": [ 33.0, 40.307154038292836 ], "wc_review_avg": [ 269.0, 40.62839729384691 ], "wc_reply_reviewers_avg": [ 65.0, 85.63877626402656 ], "wc_reply_authors_avg": [ 1224.6666666666667, 515.264549096438 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 2.3333333333333335, 1.247219128924647 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.4999999999999999, "gs_citation": 4, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=18175229063289832276&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 8, "aff_unique_index": "0;0;0", "aff_unique_norm": "Korea Advanced Institute of Science and Technology", "aff_unique_dep": "", "aff_unique_url": "https://www.kaist.ac.kr", "aff_unique_abbr": "KAIST", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "South Korea" }, { "id": "9G2IVZIh4H", "title": "FedMef: Towards Memory-efficient Federated Dynamic Pruning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Federated learning (FL) promotes 
decentralized training while prioritizing data confidentiality. However, its application on resource-constrained devices is challenging due to the high demand for computation and memory resources for training deep learning models. Neural network pruning techniques, such as dynamic pruning, could enhance model efficiency, but directly adopting them in FL still poses substantial challenges, including post-pruning performance degradation, high activation memory, etc. To address these challenges, we propose FedMef, a novel and memory-efficient federated dynamic pruning framework. FedMef comprises two key components. First, we introduce the budget-aware extrusion that maintains pruning efficiency while preserving post-pruning performance by salvaging crucial information from parameters marked for pruning within a given budget. Second, we propose scaled activation pruning to effectively reduce activation memory, which is particularly beneficial for deploying FL to memory-limited devices. Extensive experiments\ndemonstrate the effectiveness of our proposed FedMef. In particular, it achieves a significant reduction of 28.5\\% in memory footprint compared to state-of-the-art methods while obtaining superior accuracy.", "keywords": "federated learning;memory efficient training;nerual network pruning", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Hong Huang;Weiming Zhuang;Chen Chen;Lingjuan Lyu", "authorids": "~Hong_Huang4;~Weiming_Zhuang1;~Chen_Chen20;~Lingjuan_Lyu1", "gender": "M;;M;F", "homepage": "https://little0o0.github.io/;https://weiming.me/;https://cc233.github.io/;https://sites.google.com/view/lingjuan-lyu", "dblp": ";274/0724;65/4423-43;178/9876", "google_scholar": "_E4FBygAAAAJ;lLuLAzEAAAAJ;;", "orcid": ";;0000-0001-7359-8515;", "linkedin": ";;;", "or_profile": "~Hong_Huang4;~Weiming_Zhuang1;~Chen_Chen20;~Lingjuan_Lyu1", "aff": "City University of Hong Kong;Sony Research;Sony AI;Sony", "aff_domain": "my.cityu.edu.hk;sony.com;sony.com;sony.com", "position": "PhD student;Researcher;Researcher;scientist", "bibtex": "@misc{\nhuang2024fedmef,\ntitle={FedMef: Towards Memory-efficient Federated Dynamic Pruning},\nauthor={Hong Huang and Weiming Zhuang and Chen Chen and Lingjuan Lyu},\nyear={2024},\nurl={https://openreview.net/forum?id=9G2IVZIh4H}\n}", "github": "", "project": "", "reviewers": "vuu4;Lm19;fyPU;pgar", "site": "https://openreview.net/forum?id=9G2IVZIh4H", "pdf_size": 1323869, "rating": "3;3;3;6", "confidence": "5;4;1;4", "soundness": "2;2;2;4", "contribution": "2;2;2;3", "presentation": "1;2;2;4", "wc_summary": "41;43;156;61", "wc_strengths": "39;27;127;66", "wc_weaknesses": "228;87;219;47", "wc_questions": "95;53;240;4", "wc_review": "403;210;742;178", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 3.75, 1.299038105676658 ], "confidence_avg": [ 3.5, 1.5 ], "soundness_avg": [ 2.5, 0.8660254037844386 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.25, 1.0897247358851685 ], "wc_summary_avg": [ 75.25, 47.26719263929264 ], "wc_strengths_avg": [ 64.75, 38.615896985568 ], "wc_weaknesses_avg": [ 145.25, 79.58132632722327 ], "wc_questions_avg": [ 98.0, 88.08234783428516 ], "wc_review_avg": [ 383.25, 224.29598190783534 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 4, 0 ], 
"corr_rating_confidence": 0.19245008972987526, "gs_citation": 6, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=9476448772804489695&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 7, "aff_unique_index": "0;1;1;2", "aff_unique_norm": "City University of Hong Kong;Sony;Sony Corporation", "aff_unique_dep": ";Research;", "aff_unique_url": "https://www.cityu.edu.hk;https://www.sony.com;https://www.sony.com", "aff_unique_abbr": "CityU;Sony;Sony", "aff_campus_unique_index": "0", "aff_campus_unique": "Hong Kong SAR;", "aff_country_unique_index": "0;1;1;1", "aff_country_unique": "China;Japan" }, { "id": "9GE0N1htnu", "title": "RINGER: Conformer Ensemble Generation of Macrocyclic Peptides with Sequence-Conditioned Internal Coordinate Diffusion", "track": "main", "status": "Reject", "tldr": "", "abstract": "Macrocyclic peptides are an emerging therapeutic modality, yet computational approaches for accurately sampling their diverse 3D ensembles remain challenging due to their conformational diversity and geometric constraints. Here, we introduce RINGER, a diffusion-based transformer model for conditional generation of macrocycle peptides based on redundant internal coordinates. RINGER provides fast backbone- and side-chain sampling while respecting key structural invariances of cyclic peptides. Through extensive benchmarking and analysis against gold-standard conformer ensembles of cyclic peptides generated with metadynamics, we demonstrate how RINGER generates both high-quality and diverse geometries at a fraction of the computational cost. Our work lays the foundation for improved sampling of cyclic geometries and the development of geometric learning methods for peptides.", "keywords": "molecular conformer generation;generative models;diffusion models;internal coordinates;peptides;macrocycles", "primary_area": "applications to physical sciences (physics, chemistry, biology, etc.)", "supplementary_material": "/attachment/8f122a22d995b8aceee8bbaba9c273b1be18626d.pdf", "author": "Colin A Grambow;Hayley Weir;Nathaniel Lee Diamant;Tommaso Biancalani;Gabriele Scalia;Kangway V. Chuang", "authorids": "~Colin_A_Grambow1;~Hayley_Weir1;~Nathaniel_Lee_Diamant1;~Tommaso_Biancalani1;~Gabriele_Scalia1;~Kangway_V._Chuang1", "gender": "M;F;;M;;M", "homepage": ";;;;;https://www.kangway.com", "dblp": "250/2439;;290/2075;;201/9258;279/6285", "google_scholar": "WfRi2K4AAAAJ;cMK68xcAAAAJ;;https://scholar.google.it/citations?user=s_qd9x0AAAAJ;MxeFvewAAAAJ;HThiDv8AAAAJ", "orcid": "0000-0002-2204-9046;0000-0002-1039-327X;0000-0002-1738-304X;;0000-0003-3305-9220;0000-0002-0652-8071", "linkedin": "cgrambow/;hayley-v-weir/;nathaniel-diamant-6b35b0106;;gabriele-scalia;", "or_profile": "~Colin_A_Grambow1;~Hayley_Weir1;~Nathaniel_Lee_Diamant1;~Tommaso_Biancalani1;~Gabriele_Scalia1;~Kangway_V_Chuang1", "aff": "Genentech;Genentech;genentech;Genentech;Genentech;Genentech Research and Early Development", "aff_domain": "gene.com;gene.com;gene.com;gene.com;gene.com;gene.com", "position": "Researcher;Researcher;Researcher;Director;Researcher;Researcher", "bibtex": "@misc{\ngrambow2024ringer,\ntitle={{RINGER}: Conformer Ensemble Generation of Macrocyclic Peptides with Sequence-Conditioned Internal Coordinate Diffusion},\nauthor={Colin A Grambow and Hayley Weir and Nathaniel Lee Diamant and Tommaso Biancalani and Gabriele Scalia and Kangway V. 
Chuang},\nyear={2024},\nurl={https://openreview.net/forum?id=9GE0N1htnu}\n}", "github": "", "project": "", "reviewers": "2uae;spjZ;PLmK;yeES", "site": "https://openreview.net/forum?id=9GE0N1htnu", "pdf_size": 4600321, "rating": "5;5;5;8", "confidence": "4;3;4;4", "soundness": "3;3;3;3", "contribution": "2;3;2;3", "presentation": "4;2;2;3", "wc_summary": "66;122;48;95", "wc_strengths": "81;36;71;132", "wc_weaknesses": "184;156;202;76", "wc_questions": "89;21;2;123", "wc_review": "420;335;323;426", "wc_reply_reviewers": "0;0;148;0", "wc_reply_authors": "1114;238;774;809", "reply_reviewers": "0;0;1;0", "reply_authors": "3;1;2;2", "rating_avg": [ 5.75, 1.299038105676658 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.75, 0.82915619758885 ], "wc_summary_avg": [ 82.75, 28.19020219863632 ], "wc_strengths_avg": [ 80.0, 34.35840508521896 ], "wc_weaknesses_avg": [ 154.5, 48.194916744403656 ], "wc_questions_avg": [ 58.75, 49.21572411333597 ], "wc_review_avg": [ 376.0, 47.23875527572673 ], "wc_reply_reviewers_avg": [ 37.0, 64.08587988004847 ], "wc_reply_authors_avg": [ 733.75, 315.29381138867916 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 2.0, 0.7071067811865476 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.3333333333333333, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:YQTShisoLqUJ:scholar.google.com/&scioq=RINGER:+Conformer+Ensemble+Generation+of+Macrocyclic+Peptides+with+Sequence-Conditioned+Internal+Coordinate+Diffusion&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;0;0;0;0;0", "aff_unique_norm": "Genentech", "aff_unique_dep": "", "aff_unique_url": "https://www.genentech.com", "aff_unique_abbr": "Genentech", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "9GviaQcGnx", "title": "Constrained Parameter Regularization", "track": "main", "status": "Reject", "tldr": "", "abstract": "In this work, we present constrained parameter regularization (CPR), an alternative to traditional weight decay. Instead of applying a constant penalty uniformly to all parameters, we enforce an upper bound on a statistical measure (e.g., the L2-norm) of parameter groups. Consequently, learning becomes a constraint optimization problem, which we address by an adaptation of the augmented Lagrangian method. This formulation permits varying regularization strengths for each parameter group, eliminating the need for explicit penalty coefficients for regularization terms. CPR only requires two hyperparameters and incurs no measurable runtime overhead. Additionally, we propose a simple but efficient mechanism to adapt the upper bounds during the optimization. We provide empirical evidence of CPR's efficacy in experiments on the ``grokking'' phenomenon, computer vision, and language modeling tasks. Our results demonstrate that CPR counteracts the effects of grokking and consistently matches or outperforms traditional weight decay.", "keywords": "Weight Decay;Parameter Regularization;Augmented Lagrangian;Deep Learning", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/a0588e30e64db00c13de4705f0b6e52201bfa9f1.zip", "author": "J\u00f6rg K.H. 
Franke;Michael Hefenbrock;Gregor Koehler;Frank Hutter", "authorids": "~J\u00f6rg_K.H._Franke1;~Michael_Hefenbrock1;~Gregor_Koehler1;~Frank_Hutter1", "gender": ";;M;M", "homepage": ";;;http://ml.informatik.uni-freiburg.de/~hutter/", "dblp": ";;251/8923;89/5383", "google_scholar": ";;b8U4UTAAAAAJ;https://scholar.google.de/citations?user=YUrxwrkAAAAJ", "orcid": ";;;0000-0002-2037-3694", "linkedin": ";;;frank-hutter-9190b24b/", "or_profile": "~J\u00f6rg_K.H._Franke1;~Michael_Hefenbrock1;~Gregor_Koehler1;~Frank_Hutter1", "aff": ";;German Cancer Research Center (DKFZ);Albert-Ludwigs-Universit\u00e4t Freiburg", "aff_domain": ";;dkfz.de;uni-freiburg.de", "position": ";;PhD student;Full Professor", "bibtex": "@misc{\nfranke2024constrained,\ntitle={Constrained Parameter Regularization},\nauthor={J{\\\"o}rg K.H. Franke and Michael Hefenbrock and Gregor Koehler and Frank Hutter},\nyear={2024},\nurl={https://openreview.net/forum?id=9GviaQcGnx}\n}", "github": "", "project": "", "reviewers": "HpN9;EQkA;VW8f", "site": "https://openreview.net/forum?id=9GviaQcGnx", "pdf_size": 1016545, "rating": "3;5;8", "confidence": "5;2;3", "soundness": "2;3;4", "contribution": "1;2;4", "presentation": "2;2;4", "wc_summary": "66;62;32", "wc_strengths": "39;82;48", "wc_weaknesses": "96;326;47", "wc_questions": "1;2;97", "wc_review": "202;472;224", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "647;1074;401", "reply_reviewers": "0;0;0", "reply_authors": "3;4;1", "rating_avg": [ 5.333333333333333, 2.0548046676563256 ], "confidence_avg": [ 3.3333333333333335, 1.247219128924647 ], "soundness_avg": [ 3.0, 0.816496580927726 ], "contribution_avg": [ 2.3333333333333335, 1.247219128924647 ], "presentation_avg": [ 2.6666666666666665, 0.9428090415820634 ], "wc_summary_avg": [ 53.333333333333336, 15.173075568988056 ], "wc_strengths_avg": [ 56.333333333333336, 18.517259216441534 ], "wc_weaknesses_avg": [ 156.33333333333334, 121.62876121853562 ], "wc_questions_avg": [ 33.333333333333336, 45.02098276236192 ], "wc_review_avg": [ 299.3333333333333, 122.42367236590951 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 707.3333333333334, 278.0435617348876 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 2.6666666666666665, 1.247219128924647 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.5636214801906779, "gs_citation": 5, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=3553407105975230256&as_sdt=80005&sciodt=0,11&hl=en", "gs_version_total": 2, "aff_unique_index": "0;1", "aff_unique_norm": "German Cancer Research Center;Albert-Ludwigs-Universit\u00e4t Freiburg", "aff_unique_dep": ";", "aff_unique_url": "https://www.dkfz.de;https://www.uni-freiburg.de", "aff_unique_abbr": "DKFZ;Albert-Ludwigs-Universit\u00e4t", "aff_campus_unique_index": "1", "aff_campus_unique": ";Freiburg", "aff_country_unique_index": "0;0", "aff_country_unique": "Germany" }, { "id": "9Gvs64deOj", "title": "Rendering Wireless Environments Useful for Gradient Estimators: A Zero-Order Stochastic Federated Learning Method", "track": "main", "status": "Reject", "tldr": "", "abstract": "Federated learning (FL) is a novel approach to machine learning that allows multiple edge devices to collaboratively train a model without disclosing their raw data. However, several challenges hinder the practical implementation of this approach, especially when devices and the server communicate over wireless channels, as it suffers from communication and computation bottlenecks in this case. 
By utilizing a communication-efficient framework, we propose a novel zero-order (ZO) method with two types of gradient estimators, one-point and two-point, that harnesses the nature of the wireless communication channel without requiring the knowledge of the channel state coefficient. It is the first method that includes the wireless channel in the learning algorithm itself instead of wasting resources to analyze it and remove its impact. The two main difficulties of this work are that in FL, the objective function is usually not convex, which makes the extension of FL to ZO methods challenging, and that including the impact of wireless channels requires extra attention. However, we overcome these difficulties and comprehensively analyze the proposed zero-order federated learning (ZOFL) framework. We establish its convergence theoretically, and we prove a convergence rate of $O(\\frac{1}{\\sqrt[3]{K}})$ with the one-point estimate and $O(\\frac{1}{\\sqrt{K}})$ with the two-point one in the nonconvex setting. We further demonstrate the potential of our algorithms with experimental results, taking into account independent and identically distributed (IID) and non-IID device data distributions.", "keywords": "Federated learning;zero-order optimization over wireless channels;gradient estimates;convergence analysis", "primary_area": "optimization", "supplementary_material": "", "author": "Elissa Mhanna;Mohamad Assaad", "authorids": "~Elissa_Mhanna1;~Mohamad_Assaad1", "gender": "F;M", "homepage": "https://l2s.centralesupelec.fr/u/mhanna-elissa/;https://l2s.centralesupelec.fr/u/assaad-mohamad/", "dblp": ";", "google_scholar": ";", "orcid": ";", "linkedin": "elissa-mhanna;", "or_profile": "~Elissa_Mhanna1;~Mohamad_Assaad1", "aff": "CentraleSupelec;CentraleSupelec", "aff_domain": "centralesupelec.fr;centralesupelec.fr", "position": "PhD student;Full Professor", "bibtex": "@misc{\nmhanna2024rendering,\ntitle={Rendering Wireless Environments Useful for Gradient Estimators: A Zero-Order Stochastic Federated Learning Method},\nauthor={Elissa Mhanna and Mohamad Assaad},\nyear={2024},\nurl={https://openreview.net/forum?id=9Gvs64deOj}\n}", "github": "", "project": "", "reviewers": "b8PD;ufXa;3zxv;hpcJ;DD4A;eq2v", "site": "https://openreview.net/forum?id=9Gvs64deOj", "pdf_size": 761244, "rating": "3;3;3;3;5;5", "confidence": "4;4;4;3;4;3", "soundness": "3;2;2;2;2;3", "contribution": "2;2;2;2;3;3", "presentation": "2;2;2;2;3;2", "wc_summary": "40;41;84;57;59;72", "wc_strengths": "20;12;51;66;74;54", "wc_weaknesses": "325;339;281;295;43;218", "wc_questions": "4;10;267;15;212;160", "wc_review": "389;402;683;433;388;504", "wc_reply_reviewers": "0;0;0;0;0;0", "wc_reply_authors": "1711;966;656;620;453;848", "reply_reviewers": "0;0;0;0;0;0", "reply_authors": "3;2;1;1;1;2", "rating_avg": [ 3.6666666666666665, 0.9428090415820634 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.1666666666666665, 0.3726779962499649 ], "wc_summary_avg": [ 58.833333333333336, 15.720651668709186 ], "wc_strengths_avg": [ 46.166666666666664, 22.74801578648613 ], "wc_weaknesses_avg": [ 250.16666666666666, 100.3367939602528 ], "wc_questions_avg": [ 111.33333333333333, 106.30407120875266 ], "wc_review_avg": [ 466.5, 104.66573778781033 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 875.6666666666666, 408.0386691914818 ], "reply_reviewers_avg": [ 0, 0 ], 
"reply_authors_avg": [ 1.6666666666666667, 0.74535599249993 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.25, "gs_citation": 6, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12485515710879715834&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "aff_unique_index": "0;0", "aff_unique_norm": "CentraleSup\u00e9lec", "aff_unique_dep": "", "aff_unique_url": "https://www.centralesupelec.fr", "aff_unique_abbr": "CS", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "France" }, { "id": "9IUZya8bCN", "title": "PoisoningGuard: Provable Defense against Data Poisoning Attacks to Multi-label Classification", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Different from multi-class classification where each testing input only has a single ground truth label, multi-label classification aims to make predictions for testing inputs with multiple ground-truth labels. Multi-label classification has many real-world applications such as disease detection, object recognition, document classification, just to name a few. Recent studies, however, showed that a multi-label classifier is vulnerable to data-poisoning attacks, where an attacker can poison the training dataset of the multi-label classifier such that the classifier makes predictions as the attacker desires. Existing provable defenses are all designed for multi-class classification and they achieve sub-optimal results when applying their robustness guarantees to multi-label classification (as we will demonstrate in this paper). In this work, we propose PoisoningGuard, the first provable defense against data-poisoning attacks to multi-label classification. In particular, we generalize two state-of-the-art multi-class certification methods, namely bagging and Deep Partition Aggregation (DPA), to multi-label classification. Our major technical contribution is to jointly consider multiple labels when deriving the provable robustness guarantees. We perform comprehensive evaluations on three datasets. Our experimental results show that our generalized methods significantly outperform bagging and DPA when applying them to multi-label classification. 
The code will be released.", "keywords": "Certified defense;multi-label classification;data poisoning attacks", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/e6b53ad94cd405516d1a52bda6de2faf72333f70.pdf", "author": "yanting wang;Guohao Lan;Jinyuan Jia", "authorids": "~yanting_wang1;~Guohao_Lan1;~Jinyuan_Jia2", "gender": "M;M;", "homepage": "https://wang-yanting.github.io/;https://guohao.netlify.app/;https://jinyuan-jia.github.io/", "dblp": ";178/9755.html;24/5124-1.html", "google_scholar": "ClAr4UYAAAAJ;1ebZN5gAAAAJ;iyg4ytkAAAAJ", "orcid": "0009-0004-1653-1444;;0000-0002-9785-7769", "linkedin": ";;", "or_profile": "~yanting_wang1;~Guohao_Lan1;~Jinyuan_Jia2", "aff": "Pennsylvania State University;Delft University of Technology;Pennsylvania State University", "aff_domain": "ist.psu.edu;tudelft.nl;psu.edu", "position": "PhD student;Assistant Professor;Assistant Professor", "bibtex": "@misc{\nwang2024poisoningguard,\ntitle={PoisoningGuard: Provable Defense against Data Poisoning Attacks to Multi-label Classification},\nauthor={yanting wang and Guohao Lan and Jinyuan Jia},\nyear={2024},\nurl={https://openreview.net/forum?id=9IUZya8bCN}\n}", "github": "", "project": "", "reviewers": "usg5;PaSr;hayp;oRDf", "site": "https://openreview.net/forum?id=9IUZya8bCN", "pdf_size": 631448, "rating": "3;5;5;5", "confidence": "4;3;5;3", "soundness": "2;2;2;2", "contribution": "2;2;2;3", "presentation": "2;3;3;2", "wc_summary": "62;42;64;75", "wc_strengths": "21;54;52;78", "wc_weaknesses": "373;79;312;254", "wc_questions": "10;37;124;223", "wc_review": "466;212;552;630", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.5, 0.8660254037844386 ], "confidence_avg": [ 3.75, 0.82915619758885 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 60.75, 11.903255857117413 ], "wc_strengths_avg": [ 51.25, 20.24073862288627 ], "wc_weaknesses_avg": [ 254.5, 109.7144019716646 ], "wc_questions_avg": [ 98.5, 83.3141644619929 ], "wc_review_avg": [ 465.0, 157.16551784663199 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.17407765595569782, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:p7R9VwucWyMJ:scholar.google.com/&scioq=PoisoningGuard:+Provable+Defense+against+Data+Poisoning+Attacks+to+Multi-label+Classification&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;1;0", "aff_unique_norm": "Pennsylvania State University;Delft University of Technology", "aff_unique_dep": ";", "aff_unique_url": "https://www.psu.edu;https://www.tudelft.nl", "aff_unique_abbr": "PSU;TU Delft", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;0", "aff_country_unique": "United States;Netherlands" }, { "title": "A Real-World WebAgent with Planning, Long Context Understanding, and Program Synthesis", "status": "Oral", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19300", "id": "9JQtrumvg8", "author_site": "Izzeddin Gur, Hiroki Furuta, Austin Huang, Mustafa Safdari, Yutaka Matsuo, Douglas Eck, Aleksandra Faust", "tldr": "", "abstract": "Pre-trained large language models (LLMs) have recently achieved better generalization and sample 
efficiency in autonomous web automation.\nHowever, the performance on real-world websites has still suffered from (1) open domainness, (2) limited context length, and (3) lack of inductive bias on HTML.\nWe introduce WebAgent, an LLM-driven agent that learns from self-experience to complete tasks on real websites following natural language instructions.\nWebAgent plans ahead by decomposing instructions into canonical sub-instructions, summarizes long HTML documents into task-relevant snippets, and acts on websites via Python programs generated from those.\nWe design WebAgent with Flan-U-PaLM, for grounded code generation, and HTML-T5, new pre-trained LLMs for long HTML documents using local and global attention mechanisms and a mixture of long-span denoising objectives, for planning and summarization.\nWe empirically demonstrate that our modular recipe improves the success on real websites by over 50%, and that HTML-T5 is the best model to solve various HTML understanding tasks; achieving 18.7% higher success rate than the prior method on MiniWoB web automation benchmark, and SoTA performance on Mind2Web, an offline task planning evaluation.", "keywords": "Web Navigation;Web Automation;Large Language Models;Language Model Agents;Tool Use;Program Synthesis", "primary_area": "applications to robotics, autonomy, planning", "supplementary_material": "", "author": "Izzeddin Gur;Hiroki Furuta;Austin V Huang;Mustafa Safdari;Yutaka Matsuo;Douglas Eck;Aleksandra Faust", "authorids": "~Izzeddin_Gur1;~Hiroki_Furuta1;~Austin_V_Huang1;~Mustafa_Safdari1;~Yutaka_Matsuo1;~Douglas_Eck1;~Aleksandra_Faust1", "gender": ";M;;M;M;M;F", "homepage": ";https://github.com/frt03;https://github.com/austinvhuang;;http://ymatsuo.com;;http://www.afaust.info", "dblp": "188/9027;267/2065;;05/7184;m/YMatsuo.html;79/4646;135/8420", "google_scholar": "qS_ugJAAAAAJ;M0OhM1UAAAAJ;;;Dy8iau4AAAAJ;;RK72t68AAAAJ", "orcid": ";;;0009-0002-1604-8685;;;0000-0002-3268-8685", "linkedin": ";;austin-huang-74a75422/;mustafasafdari/;;;aleksandrafaust", "or_profile": "~Izzeddin_Gur1;~Hiroki_Furuta1;~Austin_V_Huang1;~Mustafa_Safdari1;~Yutaka_Matsuo1;~Douglas_Eck1;~Aleksandra_Faust1", "aff": "Google;Google DeepMind;;Research, Google;The University of Tokyo;Google;Google Brain", "aff_domain": "google.com;google.com;;research.google.com;u-tokyo.ac.jp;google.com;google.com", "position": "Research Scientist;Intern;;Researcher;Associate Professor;Research Scientist;Principal Researcher", "bibtex": "@inproceedings{\ngur2024a,\ntitle={A Real-World WebAgent with Planning, Long Context Understanding, and Program Synthesis},\nauthor={Izzeddin Gur and Hiroki Furuta and Austin V Huang and Mustafa Safdari and Yutaka Matsuo and Douglas Eck and Aleksandra Faust},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=9JQtrumvg8}\n}", "github": "", "project": "", "reviewers": "Jsxu;eCh6;ASiH;Gbpj", "pdf_size": 1816977, "rating": "5;8;8;8", "confidence": "4;3;3;5", "soundness": "4;3;4;3", "contribution": "3;4;4;4", "presentation": "2;2;3;3", "wc_summary": "65;183;61;188", "wc_strengths": "74;144;30;140", "wc_weaknesses": "15;383;59;91", "wc_questions": "218;81;75;52", "wc_review": "372;791;225;471", "wc_reply_reviewers": "0;20;23;0", "wc_reply_authors": "922;678;494;431", "reply_reviewers": "0;1;1;0", "reply_authors": "3;1;1;2", "rating_avg": [ 7.25, 1.299038105676658 ], "confidence_avg": [ 3.75, 0.82915619758885 ], "soundness_avg": [ 3.5, 0.5 ], "contribution_avg": [ 3.75, 
0.4330127018922193 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 124.25, 61.29182245618089 ], "wc_strengths_avg": [ 97.0, 47.634021455258214 ], "wc_weaknesses_avg": [ 137.0, 144.5683229480096 ], "wc_questions_avg": [ 106.5, 65.27825058930425 ], "wc_review_avg": [ 464.75, 207.70216055688974 ], "wc_reply_reviewers_avg": [ 10.75, 10.80219885023415 ], "wc_reply_authors_avg": [ 631.25, 190.82632811014312 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.75, 0.82915619758885 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.17407765595569782, "gs_citation": 233, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11247435352141794384&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=9JQtrumvg8", "pdf": "https://openreview.net/pdf?id=9JQtrumvg8", "email": "google.com;google.com;;research.google.com;u-tokyo.ac.jp;google.com;google.com", "author_num": 7, "aff_unique_index": "0;0;0;1;0;0", "aff_unique_norm": "Google;University of Tokyo", "aff_unique_dep": "Google;", "aff_unique_url": "https://www.google.com;https://www.u-tokyo.ac.jp", "aff_unique_abbr": "Google;UTokyo", "aff_campus_unique_index": "0;0;0;0", "aff_campus_unique": "Mountain View;", "aff_country_unique_index": "0;1;0;2;0;0", "aff_country_unique": "United States;United Kingdom;Japan" }, { "id": "9JRsAj3ymy", "title": "Time-Sensitive Replay for Continual Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "Continual learning closely emulates the process of human learning, which allows a model to learn for a large number of tasks sequentially without forgetting knowledge obtained from the preceding tasks. Replay-based continual learning methods reintroduce examples from previous tasks to mitigate catastrophic forgetting. However, current replay-based methods often unnecessarily reintroduce training examples, leading to inefficiency, and require task information prior to training, which requires preceding knowledge of the training data stream. We propose a novel replay method, Time-Sensitive Replay (TSR), that reduces the number of replayed examples while maintaining accuracy. TSR detects drift in the model's prediction when learning a task and preemptively prevents forgetting events by reintroducing previously encountered examples to the training set. We extend this method to a task-free setting with Task-Free TSR (TF-TSR). 
In our experiments on benchmark datasets, our approach trains 23\\% to 25\\% faster than current task-based continual learning methods and 48\\% to 58\\% faster than task-free methods while maintaining accuracy.", "keywords": "Continual Learning;Replay Learning;Task-Free Learning", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "", "author": "Jack Colin Julian;Yun Sing Koh;Albert Bifet", "authorids": "~Jack_Colin_Julian1;~Yun_Sing_Koh2;~Albert_Bifet1", "gender": "M;;M", "homepage": ";https://profiles.auckland.ac.nz/y-koh;https://albertbifet.com/", "dblp": ";23/1879.html;48/1070", "google_scholar": ";0L38IrAAAAAJ;https://scholar.google.com/citations?hl=en", "orcid": ";0000-0001-7256-4049;0000-0002-8339-7773", "linkedin": "jack-julian-b88878223;yun-sing-koh-a7ba358/;abifet/", "or_profile": "~Jack_Colin_Julian1;~Yun_Sing_Koh2;~Albert_Bifet1", "aff": "University of Auckland;University of Auckland;T\u00e9l\u00e9com Paris", "aff_domain": "auckland.ac.nz;auckland.ac.nz;telecom-paris.fr", "position": "PhD student;Full Professor;Full Professor", "bibtex": "@misc{\njulian2024timesensitive,\ntitle={Time-Sensitive Replay for Continual Learning},\nauthor={Jack Colin Julian and Yun Sing Koh and Albert Bifet},\nyear={2024},\nurl={https://openreview.net/forum?id=9JRsAj3ymy}\n}", "github": "", "project": "", "reviewers": "AYp8;D8wn;Xzud;qppC", "site": "https://openreview.net/forum?id=9JRsAj3ymy", "pdf_size": 877719, "rating": "3;3;3;5", "confidence": "4;3;4;4", "soundness": "2;3;2;3", "contribution": "2;2;2;2", "presentation": "1;2;2;3", "wc_summary": "38;101;55;94", "wc_strengths": "37;53;20;15", "wc_weaknesses": "140;376;154;50", "wc_questions": "188;37;37;100", "wc_review": "403;567;266;259", "wc_reply_reviewers": "21;0;14;0", "wc_reply_authors": "402;729;508;294", "reply_reviewers": "1;0;1;0", "reply_authors": "1;1;1;1", "rating_avg": [ 3.5, 0.8660254037844386 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.0, 0.7071067811865476 ], "wc_summary_avg": [ 72.0, 26.315394733881533 ], "wc_strengths_avg": [ 31.25, 14.972892172189045 ], "wc_weaknesses_avg": [ 180.0, 119.99166637729472 ], "wc_questions_avg": [ 90.5, 61.88901356460612 ], "wc_review_avg": [ 373.75, 125.47783668839689 ], "wc_reply_reviewers_avg": [ 8.75, 9.093266739736606 ], "wc_reply_authors_avg": [ 483.25, 160.79703821899207 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.3333333333333333, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:lheoGJz0Go8J:scholar.google.com/&scioq=Time-Sensitive+Replay+for+Continual+Learning&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;0;1", "aff_unique_norm": "University of Auckland;T\u00e9l\u00e9com Paris", "aff_unique_dep": ";", "aff_unique_url": "https://www.auckland.ac.nz;https://www.telecom-paris.fr", "aff_unique_abbr": "UoA;T\u00e9l\u00e9com Paris", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;1", "aff_country_unique": "New Zealand;France" }, { "id": "9JxQyat11M", "title": "Zero-Shot Visual Classification with Guided Cropping", "track": "main", "status": "Reject", "tldr": "", "abstract": "Pretrained vision-language models, e.g., CLIP, show promising zero-shot transfer capability across various unseen classification datasets. 
However, there is an inherent limitation: CLIP image encoders are typically designed to extract generic image-level features that summarize superfluous or confounding information for the target tasks. This results in degradation of classification performance, especially when objects of interest cover small areas of input images. In this work, we propose CLIP with Guided Cropping (GC-CLIP), where we use an off-the-shelf zero-shot object detection model in a preprocessing step to increase the focus of zero-shot classifiers on the object of interest and minimize the influence of extraneous image regions. We empirically show that our approach improves zero-shot performance across architectures and datasets, most favorably for small objects.", "keywords": "zero-shot;open-vocabulary;CLIP;image classification", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "/attachment/ad135640af6f7ecce8bedd5a8005608a5ffcd566.pdf", "author": "Piyapat Saranrittichai;Mauricio Munoz;Volker Fischer;Chaithanya Kumar Mummadi", "authorids": "~Piyapat_Saranrittichai1;~Mauricio_Munoz1;~Volker_Fischer1;~Chaithanya_Kumar_Mummadi1", "gender": "M;;M;M", "homepage": ";;;", "dblp": "299/7804;245/9820;84/4102-3;208/6386", "google_scholar": "https://scholar.google.de/citations?user=ncbD7EQAAAAJ;;https://scholar.google.de/citations?hl=de;XJLtaG4AAAAJ", "orcid": "0000-0003-0620-7945;;0000-0001-5437-4030;0000-0002-1173-2720", "linkedin": "https://www.linkedin.com/pub/piyapat-saranrittichai/38/684/b41;ammd010289/;;", "or_profile": "~Piyapat_Saranrittichai1;~Mauricio_Munoz1;~Volker_Fischer1;~Chaithanya_Kumar_Mummadi1", "aff": "Albert-Ludwigs-Universit\u00e4t Freiburg;Robert Bosch GmbH, Bosch;Bosch Center for Artificial Intelligence;Bosch Center for Artificial Intelligence", "aff_domain": "uni-freiburg.de;de.bosch.com;bosch.com;bosch.com", "position": "PhD student;Researcher;Postdoc;Researcher", "bibtex": "@misc{\nsaranrittichai2024zeroshot,\ntitle={Zero-Shot Visual Classification with Guided Cropping},\nauthor={Piyapat Saranrittichai and Mauricio Munoz and Volker Fischer and Chaithanya Kumar Mummadi},\nyear={2024},\nurl={https://openreview.net/forum?id=9JxQyat11M}\n}", "github": "", "project": "", "reviewers": "EzG9;tiUR;LrWg;KVmG", "site": "https://openreview.net/forum?id=9JxQyat11M", "pdf_size": 5447527, "rating": "3;5;5;6", "confidence": "5;3;4;4", "soundness": "2;3;3;2", "contribution": "1;2;2;2", "presentation": "2;3;4;3", "wc_summary": "69;95;70;72", "wc_strengths": "8;48;50;26", "wc_weaknesses": "200;162;219;157", "wc_questions": "1;3;52;96", "wc_review": "278;308;391;351", "wc_reply_reviewers": "0;0;0;353", "wc_reply_authors": "603;491;610;1016", "reply_reviewers": "0;0;0;2", "reply_authors": "1;1;1;3", "rating_avg": [ 4.75, 1.0897247358851685 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 76.5, 10.735455276791944 ], "wc_strengths_avg": [ 33.0, 17.233687939614086 ], "wc_weaknesses_avg": [ 184.5, 25.947061490658243 ], "wc_questions_avg": [ 38.0, 39.223717314910374 ], "wc_review_avg": [ 332.0, 42.81938813201328 ], "wc_reply_reviewers_avg": [ 88.25, 152.85348376795343 ], "wc_reply_authors_avg": [ 680.0, 199.65344975732324 ], "reply_reviewers_avg": [ 0.5, 0.8660254037844386 ], "reply_authors_avg": [ 1.5, 0.8660254037844386 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.6488856845230502, 
"gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:ipEt37xNIrcJ:scholar.google.com/&scioq=Zero-Shot+Visual+Classification+with+Guided+Cropping&hl=en&as_sdt=0,33", "gs_version_total": 3, "aff_unique_index": "0;1;2;2", "aff_unique_norm": "Albert-Ludwigs-Universit\u00e4t Freiburg;Robert Bosch GmbH;Bosch Center for Artificial Intelligence", "aff_unique_dep": ";;Center for Artificial Intelligence", "aff_unique_url": "https://www.uni-freiburg.de;https://www.bosch.com;https://www.bosch-ai.com", "aff_unique_abbr": "Albert-Ludwigs-Universit\u00e4t;Bosch;BCAI", "aff_campus_unique_index": "0", "aff_campus_unique": "Freiburg;", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "Germany" }, { "id": "9KVT1e1qf7", "title": "LoRAPrune: Pruning Meets Low-Rank Parameter-Efficient Fine-Tuning", "track": "main", "status": "Reject", "tldr": "", "abstract": "Large pre-trained models (LPMs), such as LLaMA and GLM, have shown exceptional performance across various tasks through fine-tuning. Although low-rank adaption (LoRA) has emerged to cheaply fine-tune these LPMs on downstream tasks, their deployment is still hindered by the vast model scale and computational costs. Neural network pruning offers a way to compress LPMs. However, the current pruning methods designed for LPMs are not compatible with LoRA. This is due to their utilization of unstructured pruning on LPMs, impeding the merging of LoRA weights, or their dependence on the gradients of pre-trained weights to guide pruning, which can impose significant memory overhead.\nTo this end, we propose LoRAPrune, a new framework that delivers an accurate, compact model for efficient inference in a highly memory-effective manner. Specifically, we first design a LoRA-guided pruning criterion, which uses the weights and gradients of LoRA, rather than the gradients of pre-trained weights for importance estimation. We then propose a structured iterative pruning procedure, to remove redundant channels and heads. 
\nExtensive experimental results demonstrate the superior performance of our LoRAPrune over existing approaches on the LLaMA series models.\nFor instance, at a 50\\% compression rate, LoRAPrune outperforms LLM-Pruner by a perplexity reduction of 8.0 on WikiText2 and 16.05 on PTB datasets, while concurrently reducing memory usage by 52.6\\%.", "keywords": "Neural Network Pruning;Parameter Efficient Tuning", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/874a30065f9392ccee03ceaeff0c4a4c359b960d.zip", "author": "Mingyang Zhang;Hao Chen;Chunhua Shen;Zhen Yang;Linlin Ou;Xinyi Yu;Bohan Zhuang", "authorids": "~Mingyang_Zhang3;~Hao_Chen17;~Chunhua_Shen2;~Zhen_Yang15;~Linlin_Ou1;~Xinyi_Yu1;~Bohan_Zhuang1", "gender": "M;;;M;F;M;M", "homepage": "https://www.researchgate.net/profile/Mingyang_Zhang25;;;https://zhenyangcs.github.io/;https://www.researchgate.net/profile/Linlin_Ou;https://www.researchgate.net/profile/Yu_Xinyi;https://bohanzhuang.github.io/", "dblp": "76/4874-7.html;;;;17/7817.html;;145/1096", "google_scholar": ";;;Vm1moSIAAAAJ;;;https://scholar.google.com.au/citations?user=DFuDBBwAAAAJ", "orcid": ";;;;;0000-0001-8716-7687;", "linkedin": ";;;;;;bohan-zhuang/", "or_profile": "~Mingyang_Zhang3;~Hao_Chen17;~Chunhua_Shen2;~Zhen_Yang15;~Linlin_Ou1;~Xinyi_Yu1;~Bohan_Zhuang1", "aff": "Zhejiang University;;;Hong Kong University of Science and Technology;Zhejiang University of Technology;Zhejiang University of Technology;Monash University", "aff_domain": "zju.edu.cn;;;connect.hkust-gz.edu.cn;zjut.edu.cn;zjut.edu.cn;monash.edu", "position": "Postdoc;;;PhD student;Full Professor;Associate Professor;Assistant Professor", "bibtex": "@misc{\nzhang2024loraprune,\ntitle={Lo{RAP}rune: Pruning Meets Low-Rank Parameter-Efficient Fine-Tuning},\nauthor={Mingyang Zhang and Hao Chen and Chunhua Shen and Zhen Yang and Linlin Ou and Xinyi Yu and Bohan Zhuang},\nyear={2024},\nurl={https://openreview.net/forum?id=9KVT1e1qf7}\n}", "github": "", "project": "", "reviewers": "C5GK;nG8N;nuRr;pQXa;RcVc", "site": "https://openreview.net/forum?id=9KVT1e1qf7", "pdf_size": 691160, "rating": "5;5;5;5;6", "confidence": "5;4;4;4;2", "soundness": "2;2;2;2;3", "contribution": "3;2;2;2;3", "presentation": "2;3;2;3;2", "wc_summary": "50;100;104;78;80", "wc_strengths": "67;68;60;64;36", "wc_weaknesses": "67;269;145;189;236", "wc_questions": "18;55;5;6;7", "wc_review": "202;492;314;337;359", "wc_reply_reviewers": "0;554;195;0;43", "wc_reply_authors": "275;1315;781;356;453", "reply_reviewers": "0;2;1;0;1", "reply_authors": "2;4;3;2;2", "rating_avg": [ 5.2, 0.39999999999999997 ], "confidence_avg": [ 3.8, 0.9797958971132712 ], "soundness_avg": [ 2.2, 0.39999999999999997 ], "contribution_avg": [ 2.4, 0.4898979485566356 ], "presentation_avg": [ 2.4, 0.4898979485566356 ], "wc_summary_avg": [ 82.4, 19.24162155328911 ], "wc_strengths_avg": [ 59.0, 11.832159566199232 ], "wc_weaknesses_avg": [ 181.2, 70.88695225498131 ], "wc_questions_avg": [ 18.2, 18.988417522268673 ], "wc_review_avg": [ 340.8, 92.94170215785807 ], "wc_reply_reviewers_avg": [ 158.4, 210.39828896642672 ], "wc_reply_authors_avg": [ 636.0, 380.59847608733276 ], "reply_reviewers_avg": [ 0.8, 0.7483314773547883 ], "reply_authors_avg": [ 2.6, 0.8 ], "replies_avg": [ 30, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.9185586535436918, "gs_citation": 61, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=13109504067265056757&as_sdt=5,33&sciodt=0,33&hl=en", 
"gs_version_total": 5, "aff_unique_index": "0;1;2;2;3", "aff_unique_norm": "Zhejiang University;Hong Kong University of Science and Technology;Zhejiang University of Technology;Monash University", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.zju.edu.cn;https://www.ust.hk;https://www.zjut.edu.cn;https://www.monash.edu", "aff_unique_abbr": "ZJU;HKUST;ZJUT;Monash", "aff_campus_unique_index": "1", "aff_campus_unique": ";Hong Kong SAR", "aff_country_unique_index": "0;0;0;0;1", "aff_country_unique": "China;Australia" }, { "id": "9Kgnvknvwd", "title": "A First-Order Multi-Gradient Algorithm for Multi-Objective Bi-Level Optimization", "track": "main", "status": "Reject", "tldr": "", "abstract": "In this paper, we study the Multi-Objective Bi-Level Optimization (MOBLO) problem, where the upper-level subproblem is a multi-objective optimization problem and the lower-level subproblem is for scalar optimization. Existing gradient-based MOBLO algorithms need to compute the Hessian matrix, causing the computational inefficient problem. To address this, we propose an efficient first-order multi-gradient method for MOBLO, called FORUM. Specifically, we reformulate MOBLO problems as a constrained multi-objective optimization (MOO) problem via the value-function approach. Then we propose a novel multi-gradient aggregation method to solve the challenging constrained MOO problem. Theoretically, we provide the complexity analysis to show the efficiency of the proposed method and a non-asymptotic convergence result. Empirically, extensive experiments demonstrate the effectiveness and efficiency of the proposed FORUM method in different learning problems. In particular, it achieves state-of-the-art performance on three multi-task learning benchmark datasets.", "keywords": "Multi-Objective Bi-Level Optimization;Multi-Task Learning", "primary_area": "optimization", "supplementary_material": "", "author": "Feiyang Ye;Baijiong Lin;Xiaofeng Cao;Yu Zhang;Ivor Tsang", "authorids": "~Feiyang_Ye4;~Baijiong_Lin1;~Xiaofeng_Cao2;~Yu_Zhang3;~Ivor_Tsang1", "gender": "M;M;M;M;M", "homepage": "https://feiyang-ye.github.io/;https://baijiong-lin.github.io/;http://cse.sustech.edu.cn/faculty/~zhangy/;https://www.a-star.edu.sg/cfar/about-cfar/management/prof-ivor-tsang;https://xiaofengcaoml.github.io/", "dblp": "285/4704;279/2950;50/671-6;35/5873;117/3982-2.html", "google_scholar": "3EX25cAAAAAJ;KVdbYTYAAAAJ;https://scholar.google.com.hk/citations?user=jaRS5w4AAAAJ;rJMOlVsAAAAJ;", "orcid": ";0000-0002-4257-0226;;;", "linkedin": ";;;;", "or_profile": "~Feiyang_Ye4;~Baijiong_Lin1;~Yu_Zhang3;~Ivor_W_Tsang1;~Xiaofeng_Cao1", "aff": "University of Technology Sydney;The Hong Kong University of Science and Technology (Guangzhou);Southern University of Science and Technology;A*STAR;Jilin University", "aff_domain": "uts.edu.au;connect.hkust-gz.edu.cn;sustc.edu.cn;cfar.a-star.edu.sg;jlu.edu.cn", "position": "PhD student;PhD student;Associate Professor;Principal Researcher;Associate Professor", "bibtex": "@misc{\nye2024a,\ntitle={A First-Order Multi-Gradient Algorithm for Multi-Objective Bi-Level Optimization},\nauthor={Feiyang Ye and Baijiong Lin and Xiaofeng Cao and Yu Zhang and Ivor Tsang},\nyear={2024},\nurl={https://openreview.net/forum?id=9Kgnvknvwd}\n}", "github": "", "project": "", "reviewers": "xYWk;6mPv;nzzn;MMwK", "site": "https://openreview.net/forum?id=9Kgnvknvwd", "pdf_size": 506917, "rating": "3;5;6;6", "confidence": "3;4;3;3", "soundness": "2;2;3;3", "contribution": "2;2;3;3", "presentation": "2;3;3;3", "wc_summary": 
"79;67;46;62", "wc_strengths": "50;35;37;126", "wc_weaknesses": "390;202;78;132", "wc_questions": "40;8;3;76", "wc_review": "559;312;164;396", "wc_reply_reviewers": "0;4;17;7", "wc_reply_authors": "1381;653;356;726", "reply_reviewers": "0;1;1;1", "reply_authors": "3;1;2;3", "rating_avg": [ 5.0, 1.224744871391589 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 63.5, 11.84271928232701 ], "wc_strengths_avg": [ 62.0, 37.39652390263031 ], "wc_weaknesses_avg": [ 200.5, 117.909923246519 ], "wc_questions_avg": [ 31.75, 29.22648627529488 ], "wc_review_avg": [ 357.75, 142.82572422361457 ], "wc_reply_reviewers_avg": [ 7.0, 6.284902544988268 ], "wc_reply_authors_avg": [ 779.0, 374.17175200701615 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 2.25, 0.82915619758885 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 6, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12337236500024581689&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 6, "aff_unique_index": "0;1;2;3;4", "aff_unique_norm": "University of Technology Sydney;Hong Kong University of Science and Technology;Southern University of Science and Technology;Agency for Science, Technology and Research;Jilin University", "aff_unique_dep": ";;;;", "aff_unique_url": "https://www.uts.edu.au;https://www.ust.hk;https://www.sustech.edu.cn;https://www.a-star.edu.sg;http://www.jlu.edu.cn", "aff_unique_abbr": "UTS;HKUST;SUSTech;A*STAR;JLU", "aff_campus_unique_index": "1", "aff_campus_unique": ";Guangzhou", "aff_country_unique_index": "0;1;1;2;1", "aff_country_unique": "Australia;China;Singapore" }, { "id": "9Klj7QG0NO", "title": "ONE-PEACE: Exploring One General Representation Model Toward Unlimited Modalities", "track": "main", "status": "Reject", "tldr": "", "abstract": "In this work, we propose ONE-PEACE, a highly extensible model with 4B parameters that seamlessly aligns and integrates representations across vision, audio, and language modalities. The ONE-PEACE architecture consists of shared self-attention layers, modality adapters and FFNs. This design allows for multi-modal fusion through self-attention layers, while also providing the flexibility to easily incorporate new modalities. Two modality-agnostic pretraining tasks, cross-modal aligning contrast and intra-modal denoising contrast, are developed to align the semantic space of different modalities and capture fine-grained details within each modality simultaneously. With the scaling-friendly architecture and tasks, ONE-PEACE has the potential to expand to unlimited modalities. Without utilizing any vision or language pretrained model for initialization, ONE-PEACE achieves new SOTAs across a wide range of uni-modal and cross-modal tasks. 
Furthermore, we show that ONE-PEACE possesses a strong emergent retrieval capability, enabling it to align modalities that are not paired in the training data.", "keywords": "We propose a scalable way for building a general representation model toward unlimited modalities.", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/e7177c8d49e3d4fb104722f7ff0ea6e28a202e0e.zip", "author": "Peng Wang;Shijie Wang;Junyang Lin;Shuai Bai;Xiaohuan Zhou;Jingren Zhou;Xinggang Wang;Chang Zhou", "authorids": "~Peng_Wang20;~Shijie_Wang1;~Junyang_Lin1;~Shuai_Bai1;~Xiaohuan_Zhou1;~Jingren_Zhou1;~Xinggang_Wang1;~Chang_Zhou2", "gender": "M;M;M;M;F;M;M;M", "homepage": ";https://github.com/simonJJJ;;;;;https://xwcv.github.io/index.htm;", "dblp": "95/4442-28;;215/3823;208/8033;217/2489;84/2644;95/3056;", "google_scholar": "7fjqA0YAAAAJ;DuAqyTwAAAAJ;qp6IwtgAAAAJ;ylhI1JsAAAAJ;;;qNCTLV0AAAAJ;QeSoG3sAAAAJ", "orcid": ";;;;;;0000-0001-6732-7823;", "linkedin": ";;;;;;;", "or_profile": "~Peng_Wang20;~Shijie_Wang1;~Junyang_Lin1;~Shuai_Bai1;~Xiaohuan_Zhou1;~Jingren_Zhou1;~Xinggang_Wang1;~Chang_Zhou2", "aff": "Alibaba Group;;Alibaba Group;Alibaba Group;Alibaba Group;Alibaba Group;Huazhong University of Science and Technology;Alibaba Group", "aff_domain": "alibaba-inc.com;;alibaba-inc.com;alibaba-inc.com;alibaba-inc.com;alibaba-inc.com;hust.edu.cn;alibaba-inc.com", "position": "Researcher;;Principal Researcher;Senior Engineer;Researcher;Researcher;Full Professor;Researcher", "bibtex": "@misc{\nwang2024onepeace,\ntitle={{ONE}-{PEACE}: Exploring One General Representation Model Toward Unlimited Modalities},\nauthor={Peng Wang and Shijie Wang and Junyang Lin and Shuai Bai and Xiaohuan Zhou and Jingren Zhou and Xinggang Wang and Chang Zhou},\nyear={2024},\nurl={https://openreview.net/forum?id=9Klj7QG0NO}\n}", "github": "", "project": "", "reviewers": "zvUR;DHvY;9Evr", "site": "https://openreview.net/forum?id=9Klj7QG0NO", "pdf_size": 0, "rating": "5;6;8", "confidence": "4;4;2", "soundness": "2;4;3", "contribution": "2;2;3", "presentation": "2;3;3", "wc_summary": "39;69;46", "wc_strengths": "29;78;50", "wc_weaknesses": "129;197;84", "wc_questions": "3;38;55", "wc_review": "200;382;235", "wc_reply_reviewers": "11;11;0", "wc_reply_authors": "459;978;898", "reply_reviewers": "1;1;0", "reply_authors": "3;2;2", "rating_avg": [ 6.333333333333333, 1.247219128924647 ], "confidence_avg": [ 3.3333333333333335, 0.9428090415820634 ], "soundness_avg": [ 3.0, 0.816496580927726 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 51.333333333333336, 12.81492185782739 ], "wc_strengths_avg": [ 52.333333333333336, 20.07209228976613 ], "wc_weaknesses_avg": [ 136.66666666666666, 46.449494674921446 ], "wc_questions_avg": [ 32.0, 21.64871050817269 ], "wc_review_avg": [ 272.3333333333333, 78.8514778273404 ], "wc_reply_reviewers_avg": [ 7.333333333333333, 5.185449728701348 ], "wc_reply_authors_avg": [ 778.3333333333334, 228.15248312379936 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 2.3333333333333335, 0.4714045207910317 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": -0.944911182523068, "gs_citation": 143, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=15486176021242692169&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "aff_unique_index": "0;0;0;0;0;1;0", 
"aff_unique_norm": "Alibaba Group;Huazhong University of Science and Technology", "aff_unique_dep": ";", "aff_unique_url": "https://www.alibaba.com;http://www.hust.edu.cn", "aff_unique_abbr": "Alibaba;HUST", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0;0", "aff_country_unique": "China" }, { "id": "9L9j5bQPIY", "title": "Metanetwork: A novel approach to interpreting ANNs", "track": "main", "status": "Reject", "tldr": "", "abstract": "Recent work on mechanistic interpretability, which attempts to demystify the black box of artificial neural network (ANN) models through analytical approaches, has made it possible to give a qualitative interpretation of how each component of the model works, even without using the dataset the model was trained on. However, it is also desirable from the viewpoint of interpretability to understand the ability of the entire model; and considering the previous studies on task embedding, the ability of the entire model should also be represented by a vector. In this study we propose a novel approach to quantitatively interpreting an unseen ANN's ability based on relationships with other ANNs through obtaining a low-dimensional representation of ANNs by training a \"metanetwork\" that autoencodes ANNs. As a first-ever attempt of such an approach, we train a \"metanetwork\" to autoencode ANNs consisting of one fully-connected layer. We demonstrate the validity of our proposed approach by showing that a simple k-Nearest Neighbor classifier can successfully predict properties of the training datasets of unseen models from their embedded representations.", "keywords": "AI interpretability;Model representation;Model capability;Autoencoder;Meta learning", "primary_area": "visualization or interpretation of learned representations", "supplementary_material": "/attachment/6cece3e9fe0474793ffa192016303a5b791bfaf1.zip", "author": "Ryota Takatsuki;Ippei Fujisawa;Ryota Kanai", "authorids": "~Ryota_Takatsuki1;~Ippei_Fujisawa1;~Ryota_Kanai1", "gender": "M;;M", "homepage": ";;", "dblp": ";;", "google_scholar": "https://scholar.google.co.jp/citations?user=RTxFWIoAAAAJ;VR-c7ckAAAAJ;https://scholar.google.com/citations?hl=en", "orcid": ";;", "linkedin": "ryota-takatsuki-8a4697212/;;ryota-kanai-3585979/", "or_profile": "~Ryota_Takatsuki1;~Ippei_Fujisawa1;~Ryota_Kanai1", "aff": "Araya Inc.;Araya;Araya, Inc.", "aff_domain": "araya.org;research.araya.org;research.araya.org", "position": "Intern;Researcher;Principal Researcher", "bibtex": "@misc{\ntakatsuki2024metanetwork,\ntitle={Metanetwork: A novel approach to interpreting {ANN}s},\nauthor={Ryota Takatsuki and Ippei Fujisawa and Ryota Kanai},\nyear={2024},\nurl={https://openreview.net/forum?id=9L9j5bQPIY}\n}", "github": "", "project": "", "reviewers": "aLkj;3Bf5;rUtA;Bzy7", "site": "https://openreview.net/forum?id=9L9j5bQPIY", "pdf_size": 702501, "rating": "1;3;3;3", "confidence": "4;3;4;4", "soundness": "1;1;2;3", "contribution": "2;1;2;2", "presentation": "1;1;1;3", "wc_summary": "75;42;79;37", "wc_strengths": "5;8;29;59", "wc_weaknesses": "123;70;148;227", "wc_questions": "8;163;31;75", "wc_review": "211;283;287;398", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "127;564;389;647", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 2.5, 0.8660254037844386 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 1.75, 0.82915619758885 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 1.5, 0.8660254037844386 ], 
"wc_summary_avg": [ 58.25, 18.886172190256023 ], "wc_strengths_avg": [ 25.25, 21.568205766822608 ], "wc_weaknesses_avg": [ 142.0, 56.581799193733666 ], "wc_questions_avg": [ 69.25, 59.23839548806163 ], "wc_review_avg": [ 294.75, 66.84450239174498 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 431.75, 199.07457773407432 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.3333333333333333, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:VZmkChpQtSQJ:scholar.google.com/&scioq=Metanetwork:+A+novel+approach+to+interpreting+ANNs&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;1;2", "aff_unique_norm": "Araya Inc.;Araya;Araya, Inc.", "aff_unique_dep": ";;", "aff_unique_url": ";;", "aff_unique_abbr": ";;", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "United States;" }, { "id": "9NKRfhKgzI", "title": "Adversarially Robust and Privacy-Preserving Representation Learning via Information Theory", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Machine learning models are vulnerable to both security (e.g., adversarial examples) attacks and privacy (e.g., private attribute inference) attacks. In this paper, we aim to mitigate both the security and privacy attacks, and maintain utility of the primary task simultaneously.\nParticularly, we propose an information-theoretical framework to achieve the goals through the lens of representation learning, i.e., learning representations that are robust to both adversarial examples and attribute inference adversaries. We also derive novel theoretical results, i.e., the inherent tradeoff between adversarial robustness/utility and attribute privacy, as well as guaranteed attribute privacy leakage against attribute inference adversaries.", "keywords": "Representation learning;adversarially robust;privacy-preserving;information theory", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "Binghui Zhang;Sayedeh Leila Noorbakhsh;Yun Dong;Yuan Hong;Binghui Wang", "authorids": "~Binghui_Zhang1;~Sayedeh_Leila_Noorbakhsh1;~Yun_Dong1;~Yuan_Hong1;~Binghui_Wang2", "gender": "M;F;F;M;M", "homepage": ";;;https://yhongcs.github.io/;https://wangbinghui.net", "dblp": ";;;79/5433-1;123/7149", "google_scholar": ";;;KJuZW2wAAAAJ;SoOztcEAAAAJ", "orcid": ";;;;0000-0001-5616-060X", "linkedin": "binghui-zhang-68b20a108;leilynourbakhsh/;yun-dong/;;", "or_profile": "~Binghui_Zhang1;~Sayedeh_Leila_Noorbakhsh1;~Yun_Dong1;~Yuan_Hong1;~Binghui_Wang2", "aff": "Illinois Institute of Technology;Illinois Institute of Technology;Milwaukee School of Engineering;University of Connecticut;Illinois Institute of Technology", "aff_domain": "iit.edu;iit.edu;msoe.edu;uconn.edu;iit.edu", "position": "PhD student;MS student;Assistant Professor;Associate Professor;Assistant Professor", "bibtex": "@misc{\nzhang2024adversarially,\ntitle={Adversarially Robust and Privacy-Preserving Representation Learning via Information Theory},\nauthor={Binghui Zhang and Sayedeh Leila Noorbakhsh and Yun Dong and Yuan Hong and Binghui Wang},\nyear={2024},\nurl={https://openreview.net/forum?id=9NKRfhKgzI}\n}", "github": "", "project": "", "reviewers": "qq4Y;jNV8;qrh8", "site": "https://openreview.net/forum?id=9NKRfhKgzI", "pdf_size": 1104626, "rating": "3;3;5", "confidence": "4;3;3", "soundness": "2;2;3", 
"contribution": "1;2;2", "presentation": "2;2;2", "wc_summary": "44;123;73", "wc_strengths": "47;29;55", "wc_weaknesses": "350;161;345", "wc_questions": "5;442;108", "wc_review": "446;755;581", "wc_reply_reviewers": "721;330;0", "wc_reply_authors": "502;689;0", "reply_reviewers": "1;1;0", "reply_authors": "1;1;0", "rating_avg": [ 3.6666666666666665, 0.9428090415820634 ], "confidence_avg": [ 3.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 1.6666666666666667, 0.4714045207910317 ], "presentation_avg": [ 2.0, 0.0 ], "wc_summary_avg": [ 80.0, 32.629230249374054 ], "wc_strengths_avg": [ 43.666666666666664, 10.873004286866726 ], "wc_weaknesses_avg": [ 285.3333333333333, 87.94063654281538 ], "wc_questions_avg": [ 185.0, 186.5279246297097 ], "wc_review_avg": [ 594.0, 126.48320046551636 ], "wc_reply_reviewers_avg": [ 350.3333333333333, 294.69796213901594 ], "wc_reply_authors_avg": [ 397.0, 290.9169411819578 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 0.6666666666666666, 0.4714045207910317 ], "replies_avg": [ 7, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.5, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:owgVDhfyracJ:scholar.google.com/&scioq=Adversarially+Robust+and+Privacy-Preserving+Representation+Learning+via+Information+Theory&hl=en&as_sdt=0,48", "gs_version_total": 0, "aff_unique_index": "0;0;1;2;0", "aff_unique_norm": "Illinois Institute of Technology;Milwaukee School of Engineering;University of Connecticut", "aff_unique_dep": ";;", "aff_unique_url": "https://www.iit.edu;https://www.msoe.edu;https://www.uconn.edu", "aff_unique_abbr": "IIT;MSOE;UConn", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "9NiprOP4OL", "title": "Zero-shot Inversion Process for Image Attribute Editing with Diffusion Models", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Denoising diffusion models have shown outstanding performance in image editing. Existing works tend to use either image-guided methods, which provide a visual reference but lack control over semantic coherence, or text-guided methods, which ensure faithfulness to text guidance but lack visual quality. To address the problem, we propose the Zero-shot Inversion Process (ZIP), a framework that injects a fusion of generated visual reference and text guidance into the semantic latent space of a frozen pre-trained diffusion model. Only using a tiny neural network, the proposed ZIP produces diverse content and attributes under the intuitive control of the text prompt. Moreover, ZIP shows remarkable robustness for both in-domain and out-of-domain attribute manipulation on real images. We perform detailed experiments on various benchmark datasets. 
Compared to state-of-the-art methods, ZIP produces images of equivalent quality while providing a realistic editing effect.", "keywords": "Diffusion Models; Attribute Editing; Zero Shot", "primary_area": "generative models", "supplementary_material": "/attachment/88ef13782f9e35b9d1490bae22b8f160767a5336.zip", "author": "Zhanbo Feng;Zenan Ling;Feng Zhou;Ci Gong;Jie LI;Robert C Qiu", "authorids": "~Zhanbo_Feng1;~Zenan_Ling1;~Feng_Zhou9;~Ci_Gong1;~Jie_LI12;~Robert_C_Qiu1", "gender": "M;M;;M;M;", "homepage": "http://SadAngel.cn/;https://scholar.google.com/citations?user=BabePTkAAAAJ&hl=zh-CN;;https://github.com/HomuraToHikari;https://www.cs.sjtu.edu.cn/~lijie;", "dblp": "234/7758;183/7798;;;17/2703-2.html;", "google_scholar": ";BabePTkAAAAJ;;;Krl5HRcAAAAJ;", "orcid": ";;;;0000-0002-4974-6116;", "linkedin": ";;;;;", "or_profile": "~Zhanbo_Feng1;~Zenan_Ling1;~Feng_Zhou9;~Ci_Gong1;~Jie_LI12;~Robert_C_Qiu1", "aff": "Shanghai Jiaotong University;Huazhong University of Science and Technology;;Huazhong University of Science and Technology;Shanghai Jiaotong University;", "aff_domain": "sjtu.edu.cn;hust.edu.cn;;hust.edu.cn;cs.sjtu.edu.cn;", "position": "PhD student;Researcher;;MS student;Full Professor;", "bibtex": "@misc{\nfeng2024zeroshot,\ntitle={Zero-shot Inversion Process for Image Attribute Editing with Diffusion Models},\nauthor={Zhanbo Feng and Zenan Ling and Feng Zhou and Ci Gong and Jie LI and Robert C Qiu},\nyear={2024},\nurl={https://openreview.net/forum?id=9NiprOP4OL}\n}", "github": "", "project": "", "reviewers": "VELF;nLmB;pQWL;L9gz", "site": "https://openreview.net/forum?id=9NiprOP4OL", "pdf_size": 7482303, "rating": "3;3;3;3", "confidence": "4;5;5;4", "soundness": "3;3;1;2", "contribution": "2;2;1;1", "presentation": "2;2;3;2", "wc_summary": "112;115;79;48", "wc_strengths": "79;32;45;16", "wc_weaknesses": "131;83;165;136", "wc_questions": "3;75;29;6", "wc_review": "325;305;318;206", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 3.0, 0.0 ], "confidence_avg": [ 4.5, 0.5 ], "soundness_avg": [ 2.25, 0.82915619758885 ], "contribution_avg": [ 1.5, 0.5 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 88.5, 27.31757675929547 ], "wc_strengths_avg": [ 43.0, 23.18404623873926 ], "wc_weaknesses_avg": [ 128.75, 29.431063521388417 ], "wc_questions_avg": [ 28.25, 28.80429655450728 ], "wc_review_avg": [ 288.5, 48.16897341650536 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:ZroxgevmYEgJ:scholar.google.com/&scioq=Zero-shot+Inversion+Process+for+Image+Attribute+Editing+with+Diffusion+Models&hl=en&as_sdt=0,33", "gs_version_total": 4, "aff_unique_index": "0;1;1;0", "aff_unique_norm": "Shanghai Jiao Tong University;Huazhong University of Science and Technology", "aff_unique_dep": ";", "aff_unique_url": "https://www.sjtu.edu.cn;http://www.hust.edu.cn", "aff_unique_abbr": "SJTU;HUST", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "China" }, { "title": "Neural Field Classifiers via Target Encoding and Classification Loss", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19299", "id": "9NqC72m31m", "author_site": "Xindi Yang, Zeke Xie, Xiong 
Zhou, Boyu Liu, Buhua Liu, Yi Liu, Haoran Wang, YUNFENG CAI, Mingming Sun", "tldr": "", "abstract": "Neural field methods have seen great progress in various long-standing tasks in computer vision and computer graphics, including novel view synthesis and geometry reconstruction. As existing neural field methods try to predict some coordinate-based continuous target values, such as RGB for Neural Radiance Field (NeRF), all of these methods are regression models and are optimized by some regression loss. However, are regression models really better than classification models for neural field methods? In this work, we try to visit this very fundamental but overlooked question for neural fields from a machine learning perspective. We successfully propose a novel Neural Field Classifier (NFC) framework which formulates existing neural field methods as classification tasks rather than regression tasks. The proposed NFC can easily transform arbitrary Neural Field Regressor (NFR) into its classification variant via employing a novel Target Encoding module and optimizing a classification loss. By encoding a continuous regression target into a high-dimensional discrete encoding, we naturally formulate a multi-label classification task. Extensive experiments demonstrate the impressive effectiveness of NFC at the nearly free extra computational costs. Moreover, NFC also shows robustness to sparse inputs, corrupted images, and dynamic scenes.", "keywords": "Neural Fields;NeRF;3D Vision;Scene Reconstruction", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Xindi Yang;Zeke Xie;Xiong Zhou;Boyu Liu;Buhua Liu;Yi Liu;Haoran Wang;YUNFENG CAI;Mingming Sun", "authorids": "~Xindi_Yang1;~Zeke_Xie1;~Xiong_Zhou3;~Boyu_Liu3;~Buhua_Liu1;~Yi_Liu40;~Haoran_Wang2;~YUNFENG_CAI1;~Mingming_Sun1", "gender": ";M;M;M;;;M;M;M", "homepage": ";https://sites.google.com/view/zeke-xie;https://hitcszx.github.io/;https://github.com/pascalliu;;http://faculty.bjtu.edu.cn/8546/;;https://www.bimsa.cn/detail/yfcai.html;", "dblp": ";210/1039;;143/0142;;;382/4779.html;133/8201;87/8665-1.html", "google_scholar": ";https://scholar.google.co.jp/citations?user=ysXmZCMAAAAJ;BMGootgAAAAJ;;;;xfnL2IEAAAAJ;https://scholar.google.com/citations?hl=en;", "orcid": ";;0000-0002-0856-6696;;;;0000-0002-6098-4772;;", "linkedin": ";;;;;;;;", "or_profile": "~Xindi_Yang1;~Zeke_Xie1;~Xiong_Zhou3;~Boyu_Liu3;~Buhua_Liu1;~Yi_Liu40;~Haoran_Wang2;~YUNFENG_CAI1;~Mingming_Sun1", "aff": ";Baidu;Harbin Institute of Technology;Beihang University;;Beijing Jiaotong University;Baidu;Baidu Research;Baidu", "aff_domain": ";baidu.com;hit.edu.cn;buaa.edu.cn;;bjtu.edu.cn;baidu.com;baidu.com;baidu.com", "position": ";Researcher;PhD student;PhD student;;Associate Professor;Researcher;Resseacher;Principal Researcher", "bibtex": "@inproceedings{\nyang2024neural,\ntitle={Neural Field Classifiers via Target Encoding and Classification Loss},\nauthor={Xindi Yang and Zeke Xie and Xiong Zhou and Boyu Liu and Buhua Liu and Yi Liu and Haoran Wang and YUNFENG CAI and Mingming Sun},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=9NqC72m31m}\n}", "github": "", "project": "", "reviewers": "fXmy;WcH4;zn3A;dKd6", "pdf_size": 8584881, "rating": "6;6;6;8", "confidence": "3;4;4;3", "soundness": "3;3;3;3", "contribution": "3;3;3;3", "presentation": "3;3;4;3", "wc_summary": "43;93;66;64", "wc_strengths": "54;101;21;39", 
"wc_weaknesses": "54;59;116;157", "wc_questions": "24;90;2;24", "wc_review": "175;343;205;284", "wc_reply_reviewers": "17;50;152;77", "wc_reply_authors": "267;550;888;858", "reply_reviewers": "1;1;2;3", "reply_authors": "1;1;3;3", "rating_avg": [ 6.5, 0.8660254037844386 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 66.5, 17.755280904564703 ], "wc_strengths_avg": [ 53.75, 29.67637949615822 ], "wc_weaknesses_avg": [ 96.5, 42.58227330709341 ], "wc_questions_avg": [ 35.0, 33.0 ], "wc_review_avg": [ 251.75, 66.03550181531143 ], "wc_reply_reviewers_avg": [ 74.0, 49.794578018093496 ], "wc_reply_authors_avg": [ 640.75, 253.10805498837843 ], "reply_reviewers_avg": [ 1.75, 0.82915619758885 ], "reply_authors_avg": [ 2.0, 1.0 ], "replies_avg": [ 22, 0 ], "authors#_avg": [ 9, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:01FbbTUi7vUJ:scholar.google.com/&scioq=Neural+Field+Classifiers+via+Target+Encoding+and+Classification+Loss&hl=en&as_sdt=0,33", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=9NqC72m31m", "pdf": "https://openreview.net/pdf?id=9NqC72m31m", "email": ";baidu.com;hit.edu.cn;buaa.edu.cn;;bjtu.edu.cn;baidu.com;baidu.com;baidu.com", "author_num": 9, "aff_unique_index": "0;1;2;3;0;0;0", "aff_unique_norm": "Baidu;Harbin Institute of Technology;Beihang University;Beijing Jiao Tong University", "aff_unique_dep": "Baidu, Inc.;;;", "aff_unique_url": "https://www.baidu.com;http://www.hit.edu.cn/;http://www.buaa.edu.cn/;http://www.njtu.edu.cn/en", "aff_unique_abbr": "Baidu;HIT;BUAA;BJTU", "aff_campus_unique_index": "1", "aff_campus_unique": ";Harbin", "aff_country_unique_index": "0;0;0;0;0;0;0", "aff_country_unique": "China" }, { "title": "Towards Understanding Factual Knowledge of Large Language Models", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19298", "id": "9OevMUdods", "author_site": "Xuming Hu, Junzhe Chen, Xiaochuan Li, Yufei Guo, Lijie Wen, Philip Yu, Zhijiang Guo", "tldr": "", "abstract": "Large language models (LLMs) have recently driven striking performance improvements across a range of natural language processing tasks. The factual knowledge acquired during pretraining and instruction tuning can be useful in various downstream tasks, such as question answering, and language generation. Unlike conventional Knowledge Bases (KBs) that explicitly store factual knowledge, LLMs implicitly store facts in their parameters. Content generated by the LLMs can often exhibit inaccuracies or deviations from the truth, due to facts that can be incorrectly induced or become obsolete over time. To this end, we aim to explore the extent and scope of factual knowledge within LLMs by designing the benchmark Pinocchio. Pinocchio contains 20K diverse factual questions that span different sources, timelines, domains, regions, and languages. Furthermore, we investigate whether LLMs can compose multiple facts, update factual knowledge temporally, reason over multiple pieces of facts, identify subtle factual differences, and resist adversarial examples. Extensive experiments on different sizes and types of LLMs show that existing LLMs still lack factual knowledge and suffer from various spurious correlations. We believe this is a critical bottleneck for realizing trustworthy artificial intelligence. 
The dataset Pinocchio and our codes are publicly available at: https://github.com/THU-BPM/Pinocchio.", "keywords": "Large Language Models;Resource and Evaluation;Interpretability;NLP Application", "primary_area": "datasets and benchmarks", "supplementary_material": "/attachment/51a07766af2dbf3f53f933abc73c84392c2f0628.zip", "author": "Xuming Hu;Junzhe Chen;Xiaochuan Li;Yufei Guo;Lijie Wen;Philip S. Yu;Zhijiang Guo", "authorids": "~Xuming_Hu1;~Junzhe_Chen1;~Xiaochuan_Li3;~Yufei_Guo3;~Lijie_Wen1;~Philip_S._Yu1;~Zhijiang_Guo2", "gender": "M;M;M;M;M;M;M", "homepage": "https://xuminghu.github.io/;;https://xiaochuanli.com;https://none.com;https://www.thss.tsinghua.edu.cn/en/faculty/lijiewen.htm;https://cs.uic.edu/profiles/philip-yu/;https://cartus.github.io/", "dblp": "262/3664;351/9670;;;36/172-1;y/PhilipSYu;43/6147", "google_scholar": "dbBKbXoAAAAJ;KUXvSuIAAAAJ;97QHT-0AAAAJ;;https://scholar.google.com.tw/citations?user=f3C0jUIAAAAJ;D0lL1r0AAAAJ;8b-u3icAAAAJ", "orcid": "0000-0001-6075-4224;0009-0005-7573-0707;;;0000-0003-0358-3160;0000-0002-3491-5968;", "linkedin": ";;;;;;", "or_profile": "~Xuming_Hu1;~Junzhe_Chen1;~Xiaochuan_Li3;~Yufei_Guo3;~Lijie_Wen1;~Philip_S._Yu1;~Zhijiang_Guo2", "aff": "Tsinghua University;Tsinghua University;Tsinghua University;Tsinghua University;Tsinghua University;University of Illinois Chicago;University of Cambridge", "aff_domain": "tsinghua.edu.cn;tsinghua.edu.cn;mail.tsinghua.edu.cn;mail.tsinghua.edu.cn;tsinghua.edu.cn;uic.edu;cam.ac.uk", "position": "PhD student;Undergrad student;Undergrad student;Undergrad student;Associate Professor;Full Professor;Postdoc", "bibtex": "@inproceedings{\nhu2024towards,\ntitle={Towards Understanding Factual Knowledge of Large Language Models},\nauthor={Xuming Hu and Junzhe Chen and Xiaochuan Li and Yufei Guo and Lijie Wen and Philip S. 
Yu and Zhijiang Guo},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=9OevMUdods}\n}", "github": "", "project": "", "reviewers": "1LZe;9WHz;SmAT;XTL4", "pdf_size": 2082950, "rating": "5;6;8;8", "confidence": "4;3;4;4", "soundness": "3;3;3;3", "contribution": "3;3;3;3", "presentation": "3;3;3;3", "wc_summary": "371;51;37;187", "wc_strengths": "23;39;38;29", "wc_weaknesses": "41;130;306;203", "wc_questions": "4;55;2;40", "wc_review": "439;275;383;459", "wc_reply_reviewers": "0;0;0;47", "wc_reply_authors": "1756;959;1428;1359", "reply_reviewers": "0;0;0;1", "reply_authors": "4;3;4;3", "rating_avg": [ 6.75, 1.299038105676658 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 161.5, 134.3977306356026 ], "wc_strengths_avg": [ 32.25, 6.609652033201143 ], "wc_weaknesses_avg": [ 170.0, 97.24453712162962 ], "wc_questions_avg": [ 25.25, 22.884219453588535 ], "wc_review_avg": [ 389.0, 71.47027354082255 ], "wc_reply_reviewers_avg": [ 11.75, 20.351596988934308 ], "wc_reply_authors_avg": [ 1375.5, 283.408274402848 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 3.5, 0.5 ], "replies_avg": [ 22, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": 0.3333333333333333, "gs_citation": 11, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=827760621825055587&as_sdt=400005&sciodt=0,14&hl=en", "gs_version_total": 2, "openreview": "https://openreview.net/forum?id=9OevMUdods", "pdf": "https://openreview.net/pdf?id=9OevMUdods", "email": "tsinghua.edu.cn;tsinghua.edu.cn;mail.tsinghua.edu.cn;mail.tsinghua.edu.cn;tsinghua.edu.cn;uic.edu;cam.ac.uk", "author_num": 7, "aff_unique_index": "0;0;0;0;0;1;2", "aff_unique_norm": "Tsinghua University;University of Illinois at Chicago;University of Cambridge", "aff_unique_dep": ";;", "aff_unique_url": "https://www.tsinghua.edu.cn;https://www.uic.edu;https://www.cam.ac.uk", "aff_unique_abbr": "THU;UIC;Cambridge", "aff_campus_unique_index": "1;2", "aff_campus_unique": ";Chicago;Cambridge", "aff_country_unique_index": "0;0;0;0;0;1;2", "aff_country_unique": "China;United States;United Kingdom" }, { "id": "9QV7Q9gKl9", "title": "DIFUSCO-LNS: Diffusion-Guided Large Neighbourhood Search for Integer Linear Programming", "track": "main", "status": "Reject", "tldr": "", "abstract": "Integer Linear Programming (ILP) is a powerful and flexible framework for modeling and solving a variety of combinatorial optimization problems. This paper introduces a novel ILP solver, namely DIFUSCO-LNS, which combines the strengths of carefully engineered traditional solvers in symbolic reasoning and the generative power of a neural diffusion model in graph-based learning for the Large Neighborhood Search (LNS) approach. Our diffusion model treats the destroy policy in LNS as a generative problem in the discrete $\\{0, 1\\}$-vector space and is trained to imitate the high-quality Local Branching (LB) destroy heuristic through iterative denoising. Specifically, this addresses the unimodal limitation of other neural LNS solvers with its capability to capture the multimodal nature of optimal policies during variable selection. Our evaluations span four representative MIP problems: MIS, CA, SC, and MVC. 
Experimental results reveal that DIFUSCO-LNS substantially surpasses prior neural LNS solvers.", "keywords": "Large Neighborhood Search;Diffusion Models;Combinatorial Optimization Solvers", "primary_area": "neurosymbolic & hybrid AI systems (physics-informed, logic & formal reasoning, etc.)", "supplementary_material": "/attachment/ba5aca64f8e2a198eb0a3806f8de36908c03c8e6.pdf", "author": "Shengyu Feng;Zhiqing Sun;Yiming Yang", "authorids": "~Shengyu_Feng1;~Zhiqing_Sun1;~Yiming_Yang1", "gender": "M;M;F", "homepage": "https://shengyu-feng.github.io/;https://www.cs.cmu.edu/~zhiqings/;http://www.cs.cmu.edu/~yiming/", "dblp": "47/2121;211/7692;25/1666", "google_scholar": "ApUH8ZcAAAAJ;https://scholar.google.com/citations?hl=en;MlZq4XwAAAAJ", "orcid": ";;0000-0001-8322-607X", "linkedin": "shengyu-feng-331a6214b/;zhiqing-sun-5781b3100/;yiming-yang-24100924/", "or_profile": "~Shengyu_Feng1;~Zhiqing_Sun1;~Yiming_Yang1", "aff": "Apple;Carnegie Mellon University;School of Computer Science, Carnegie Mellon University", "aff_domain": "apple.com;cs.cmu.edu;cs.cmu.edu", "position": "Intern;PhD student;Full Professor", "bibtex": "@misc{\nfeng2024difuscolns,\ntitle={{DIFUSCO}-{LNS}: Diffusion-Guided Large Neighbourhood Search for Integer Linear Programming},\nauthor={Shengyu Feng and Zhiqing Sun and Yiming Yang},\nyear={2024},\nurl={https://openreview.net/forum?id=9QV7Q9gKl9}\n}", "github": "", "project": "", "reviewers": "Xy75;Gizx;3tnY", "site": "https://openreview.net/forum?id=9QV7Q9gKl9", "pdf_size": 1713594, "rating": "3;5;5", "confidence": "4;3;4", "soundness": "2;3;3", "contribution": "2;3;2", "presentation": "3;2;3", "wc_summary": "67;113;79", "wc_strengths": "42;39;23", "wc_weaknesses": "205;298;114", "wc_questions": "265;20;168", "wc_review": "579;470;384", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "367;246;536", "reply_reviewers": "0;0;0", "reply_authors": "1;1;1", "rating_avg": [ 4.333333333333333, 0.9428090415820634 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 86.33333333333333, 19.48218559493661 ], "wc_strengths_avg": [ 34.666666666666664, 8.339997335464536 ], "wc_weaknesses_avg": [ 205.66666666666666, 75.11916459126053 ], "wc_questions_avg": [ 151.0, 100.74059095849431 ], "wc_review_avg": [ 477.6666666666667, 79.79278719839837 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 383.0, 118.93135274883014 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 9, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.49999999999999983, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6209733794584114338&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 0, "aff_unique_index": "0;1;1", "aff_unique_norm": "Apple;Carnegie Mellon University", "aff_unique_dep": "Apple Inc.;", "aff_unique_url": "https://www.apple.com;https://www.cmu.edu", "aff_unique_abbr": "Apple;CMU", "aff_campus_unique_index": "1", "aff_campus_unique": ";Pittsburgh", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "9QVqYBvCD8", "title": "Asking Before Acting: Gather Information in Embodied Decision-Making with Language Models", "track": "main", "status": "Reject", "tldr": "", "abstract": "With strong capabilities of reasoning and a broad understanding of the world, Large Language 
Models (LLMs) have demonstrated immense potential in building versatile embodied decision-making agents capable of executing a wide array of tasks.\nNevertheless, when deployed in unfamiliar environments, we show that LLM agents encounter challenges in efficiently gathering essential information, leading to suboptimal performance.\nConversely, human individuals often seek additional information from their peers prior to taking action, harnessing external knowledge to avoid unnecessary trial and error. Drawing inspiration from this behavior, we propose \\textit{Asking Before Acting} (ABA), a method that empowers the agent to proactively inquire with external sources for pertinent information using natural language during their interactions within the environment. \nIn this way, the agent is able to enhance its efficiency and performance by circumventing potentially laborious steps and combating the difficulties associated with exploration in unfamiliar environments and vagueness of the instructions.\nWe conduct extensive experiments involving a spectrum of environments including text-based household everyday tasks, robot arm manipulation tasks, and real world open domain image based embodied tasks. The experiments involve various models from Vicuna to GPT-4. The results demonstrate that, even with modest prompts modifications, ABA exhibits substantial advantages on both performance and efficiency over baseline LLM agents.\nFurther finetuning ABA with reformulated metadata (ABA-FT) faciliates learning the rationale for asking and allows for additional enhancements especially in tasks that baselines struggle to solve.", "keywords": "human in the loop;embodied decision making;language model", "primary_area": "applications to robotics, autonomy, planning", "supplementary_material": "/attachment/18d3d13ea2cab853919b64523eacb46fcc13d876.zip", "author": "Xiaoyu Chen;Shenao Zhang;Pushi Zhang;Li Zhao;Jianyu Chen", "authorids": "~Xiaoyu_Chen4;~Shenao_Zhang1;~Pushi_Zhang1;~Li_Zhao1;~Jianyu_Chen1", "gender": ";M;;F;M", "homepage": "https://github.com/Cospui;https://shenao-zhang.github.io/;https://zpschang.github.io/;https://www.microsoft.com/en-us/research/people/lizo/;http://people.iiis.tsinghua.edu.cn/~jychen/", "dblp": ";253/4543.html;288/4226;97/4708-7;", "google_scholar": ";8NamuusAAAAJ;_DLMSkIAAAAJ;b-LJkLQAAAAJ;", "orcid": ";;;;", "linkedin": ";shenao-zhang-055a53178/;;;", "or_profile": "~Xiaoyu_Chen4;~Shenao_Zhang1;~Pushi_Zhang1;~Li_Zhao1;~Jianyu_Chen1", "aff": "Tsinghua University;Georgia Institute of Technology;Microsoft;Microsoft;Tsinghua University", "aff_domain": "tsinghua.edu.cn;gatech.edu;microsoft.com;microsoft.com;tsinghua.edu.cn", "position": "Graduate student;MS student;Researcher;Researcher;Assistant Professor", "bibtex": "@misc{\nchen2024asking,\ntitle={Asking Before Acting: Gather Information in Embodied Decision-Making with Language Models},\nauthor={Xiaoyu Chen and Shenao Zhang and Pushi Zhang and Li Zhao and Jianyu Chen},\nyear={2024},\nurl={https://openreview.net/forum?id=9QVqYBvCD8}\n}", "github": "", "project": "", "reviewers": "mCAD;P7Hr;umUa;23Y9", "site": "https://openreview.net/forum?id=9QVqYBvCD8", "pdf_size": 3480122, "rating": "3;3;6;6", "confidence": "4;3;3;5", "soundness": "2;3;3;4", "contribution": "2;1;2;3", "presentation": "2;3;2;4", "wc_summary": "51;166;112;60", "wc_strengths": "55;100;36;90", "wc_weaknesses": "231;239;201;194", "wc_questions": "22;3;9;2", "wc_review": "359;508;358;346", "wc_reply_reviewers": "305;143;21;0", "wc_reply_authors": 
"1784;1483;385;396", "reply_reviewers": "2;1;1;0", "reply_authors": "4;4;2;2", "rating_avg": [ 4.5, 1.5 ], "confidence_avg": [ 3.75, 0.82915619758885 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 2.75, 0.82915619758885 ], "wc_summary_avg": [ 97.25, 46.01833873576924 ], "wc_strengths_avg": [ 70.25, 25.8879798362097 ], "wc_weaknesses_avg": [ 216.25, 19.122957407263137 ], "wc_questions_avg": [ 9.0, 7.968688725254614 ], "wc_review_avg": [ 392.75, 66.73595357826244 ], "wc_reply_reviewers_avg": [ 117.25, 121.37210346698289 ], "wc_reply_authors_avg": [ 1012.0, 630.5572931938857 ], "reply_reviewers_avg": [ 1.0, 0.7071067811865476 ], "reply_authors_avg": [ 3.0, 1.0 ], "replies_avg": [ 23, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.3015113445777637, "gs_citation": 7, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=13115928641223429866&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 5, "aff_unique_index": "0;1;2;2;0", "aff_unique_norm": "Tsinghua University;Georgia Institute of Technology;Microsoft", "aff_unique_dep": ";;Microsoft Corporation", "aff_unique_url": "https://www.tsinghua.edu.cn;https://www.gatech.edu;https://www.microsoft.com", "aff_unique_abbr": "THU;Georgia Tech;Microsoft", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;1;1;0", "aff_country_unique": "China;United States" }, { "title": "On Double Descent in Reinforcement Learning with LSTD and Random Features", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19297", "id": "9RIbNmx984", "author_site": "David Brellmann, Elo\u00efse Berthier, David Filliat, Goran Frehse", "tldr": "", "abstract": "Temporal Difference (TD) algorithms are widely used in Deep Reinforcement Learning (RL). Their performance is heavily influenced by the size of the neural network. While in supervised learning, the regime of over-parameterization and its benefits are well understood, the situation in RL is much less clear. In this paper, we present a theoretical analysis of the influence of network size and $l_2$-regularization on performance. We identify the ratio between the number of parameters and the number of visited states as a crucial factor and define over-parameterization as the regime when it is larger than one. Furthermore, we observe a double descent phenomenon, i.e., a sudden drop in performance around the parameter/state ratio of one. Leveraging random features and the lazy training regime, we study the regularized Least-Square Temporal Difference (LSTD) algorithm in an asymptotic regime, as both the number of parameters and states go to infinity, maintaining a constant ratio. We derive deterministic limits of both the empirical and the true Mean-Squared Bellman Error (MSBE) that feature correction terms responsible for the double descent. Correction terms vanish when the $l_2$-regularization is increased or the number of unvisited states goes to zero. 
Numerical experiments with synthetic and small real-world environments closely match the theoretical predictions.", "keywords": "Regularized Least-Square Temporal Difference;double descent;over-parameterization;random features", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/91988691567d4725cfa0a2f23110312354b228ee.zip", "author": "David Brellmann;Elo\u00efse Berthier;David Filliat;Goran Frehse", "authorids": "~David_Brellmann1;~Elo\u00efse_Berthier1;~David_Filliat1;~Goran_Frehse1", "gender": "M;F;M;M", "homepage": ";https://eloiseberthier.github.io/;https://perso.ensta-paris.fr/~filliat/en/;https://sites.google.com/site/frehseg/", "dblp": ";267/0937;13/5289;95/3625", "google_scholar": "https://scholar.google.com/citations?hl=fr;-PQBEZMAAAAJ;https://scholar.google.fr/citations?user=Wzq_c20AAAAJ;IgZwd6MAAAAJ", "orcid": ";;0000-0002-5739-1618;0000-0002-5441-0481", "linkedin": "david-brellmann;;;goran-frehse-84b8311/", "or_profile": "~David_Brellmann1;~Elo\u00efse_Berthier1;~David_Filliat1;~Goran_Frehse1", "aff": "ENSTA Paris;ENSTA;ENSTA Paris;ENSTA Paris", "aff_domain": "ensta-paris.fr;ensta-paris.fr;ensta-paris.fr;ensta-paris.fr", "position": "PhD student;Researcher;Full Professor;Full Professor", "bibtex": "@inproceedings{\nbrellmann2024on,\ntitle={On Double Descent in Reinforcement Learning with {LSTD} and Random Features},\nauthor={David Brellmann and Elo{\\\"\\i}se Berthier and David Filliat and Goran Frehse},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=9RIbNmx984}\n}", "github": "", "project": "", "reviewers": "jHhA;xcHJ;a6mC;7TMf", "pdf_size": 1395169, "rating": "6;6;8;10", "confidence": "3;3;3;4", "soundness": "3;3;3;4", "contribution": "3;3;3;4", "presentation": "3;3;3;4", "wc_summary": "198;259;111;169", "wc_strengths": "76;63;90;175", "wc_weaknesses": "200;119;537;356", "wc_questions": "94;2;80;83", "wc_review": "568;443;818;783", "wc_reply_reviewers": "26;0;20;76", "wc_reply_authors": "286;361;728;374", "reply_reviewers": "1;0;1;1", "reply_authors": "1;3;2;2", "rating_avg": [ 7.5, 1.6583123951777 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 3.25, 0.4330127018922193 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 184.25, 53.326236506995315 ], "wc_strengths_avg": [ 101.0, 43.777848279695064 ], "wc_weaknesses_avg": [ 303.0, 159.7106759111613 ], "wc_questions_avg": [ 64.75, 36.601741761834234 ], "wc_review_avg": [ 653.0, 154.47491705775408 ], "wc_reply_reviewers_avg": [ 30.5, 27.977669667075563 ], "wc_reply_authors_avg": [ 437.25, 171.1919609677978 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 2.0, 0.7071067811865476 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.8703882797784891, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6954276998867653729&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=9RIbNmx984", "pdf": "https://openreview.net/pdf?id=9RIbNmx984", "email": "ensta-paris.fr;ensta-paris.fr;ensta-paris.fr;ensta-paris.fr", "author_num": 4, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "\u00c9cole Nationale Sup\u00e9rieure de Techniques Avanc\u00e9es", "aff_unique_dep": "", "aff_unique_url": "https://www.ensta.fr", "aff_unique_abbr": "ENSTA", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": 
"Paris;", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "France" }, { "id": "9RLC0J2N9n", "title": "SynBench: Evaluating Pretrained Representations for Image Classification using Synthetic Data", "track": "main", "status": "Reject", "tldr": "", "abstract": "Fine-tuning large models pretrained at scale on broad data for solving downstream tasks has made considerable success in recent years. There seems to be indeed an ongoing paradigm shift in deep learning from task-centric model design to task-agnostic representation learning and task-specific fine-tuning. Specifically, the representations of pretrained models are used as a foundation for different downstream tasks. This paper proposes a new task-agnostic framework, \\textit{SynBench}, to measure the quality of pretrained representations for image classification using synthetic data. To address the challenge of task-agnostic data-free evaluation, we design synthetic binary classification proxy tasks with class-conditional Gaussian mixtures. This way we probe and compare the robustness-accuracy performance on pretrained representations and input synthetic data. SynBench offers a holistic quantitative evaluation, informs the model designers of the intrinsic performance, and spares efforts on task-specific finetuning with real-life data. Evaluated with various pretrained vision models for different downstream image classification tasks, the experimental results show that our SynBench score matches well the actual linear probing performance of the pretrained model when fine-tuned on downstream tasks using real-life data. Finally, SynBench can also be used in robust linear probing to mitigate the robustness-accuracy tradeoff in downstream tasks.", "keywords": "Vision pretrained model; synthetic data; evaluation", "primary_area": "visualization or interpretation of learned representations", "supplementary_material": "", "author": "Ching-Yun Ko;Pin-Yu Chen;Payel Das;Jeet Mohapatra;Luca Daniel", "authorids": "~Ching-Yun_Ko1;~Pin-Yu_Chen1;~Payel_Das1;~Jeet_Mohapatra1;~Luca_Daniel1", "gender": "F;M;F;M;", "homepage": ";http://www.pinyuchen.com;;;https://www.mit.edu/~dluca/", "dblp": "206/6472;39/8969;56/7926;210/2304;35/5202", "google_scholar": ";jxwlCUUAAAAJ;;;", "orcid": ";0000-0003-1039-8369;;;0000-0002-5880-3151", "linkedin": ";pin-yu-chen-940062a2;;;", "or_profile": "~Ching-Yun_Ko1;~Pin-Yu_Chen1;~Payel_Das1;~Jeet_Mohapatra1;~Luca_Daniel1", "aff": "Massachusetts Institute of Technology;International Business Machines;IBM, International Business Machines;;", "aff_domain": "mit.edu;ibm.com;us.ibm.com;;", "position": "PhD student;Principal Researcher;Principal Researcher;;", "bibtex": "@misc{\nko2024synbench,\ntitle={SynBench: Evaluating Pretrained Representations for Image Classification using Synthetic Data},\nauthor={Ching-Yun Ko and Pin-Yu Chen and Payel Das and Jeet Mohapatra and Luca Daniel},\nyear={2024},\nurl={https://openreview.net/forum?id=9RLC0J2N9n}\n}", "github": "", "project": "", "reviewers": "af4U;4o5T;97TE;S4rE", "site": "https://openreview.net/forum?id=9RLC0J2N9n", "pdf_size": 2774636, "rating": "3;3;6;6", "confidence": "4;3;2;3", "soundness": "1;2;4;3", "contribution": "2;2;4;3", "presentation": "3;3;3;3", "wc_summary": "126;100;103;74", "wc_strengths": "66;58;91;60", "wc_weaknesses": "392;173;39;129", "wc_questions": "190;50;77;2", "wc_review": "774;381;310;265", "wc_reply_reviewers": "519;242;35;25", "wc_reply_authors": "2547;2062;644;723", "reply_reviewers": "1;1;1;1", "reply_authors": "6;5;2;2", "rating_avg": 
[ 4.5, 1.5 ], "confidence_avg": [ 3.0, 0.7071067811865476 ], "soundness_avg": [ 2.5, 1.118033988749895 ], "contribution_avg": [ 2.75, 0.82915619758885 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 100.75, 18.430613120566555 ], "wc_strengths_avg": [ 68.75, 13.179055353097201 ], "wc_weaknesses_avg": [ 183.25, 129.83908309904226 ], "wc_questions_avg": [ 79.75, 69.08825877093734 ], "wc_review_avg": [ 432.5, 201.45533003621424 ], "wc_reply_reviewers_avg": [ 205.25, 200.78891279151844 ], "wc_reply_authors_avg": [ 1494.0, 828.9110326205099 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 3.75, 1.7853571071357126 ], "replies_avg": [ 25, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.7071067811865476, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:xTaPW4fqbKkJ:scholar.google.com/&scioq=SynBench:+Evaluating+Pretrained+Representations+for+Image+Classification+using+Synthetic+Data&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1;2", "aff_unique_norm": "Massachusetts Institute of Technology;International Business Machines Corporation;International Business Machines", "aff_unique_dep": ";;", "aff_unique_url": "https://web.mit.edu;https://www.ibm.com;https://www.ibm.com", "aff_unique_abbr": "MIT;IBM;IBM", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "title": "Leave-one-out Distinguishability in Machine Learning", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19296", "id": "9RNfX0ah0K", "author_site": "Jiayuan Ye, Anastasia Borovykh, Soufiane Hayou, Reza Shokri", "tldr": "", "abstract": "We introduce an analytical framework to quantify the changes in a machine learning algorithm's output distribution following the inclusion of a few data points in its training set, a notion we define as leave-one-out distinguishability (LOOD). This is key to measuring data **memorization** and information **leakage** as well as the **influence** of training data points in machine learning. We illustrate how our method broadens and refines existing empirical measures of memorization and privacy risks associated with training data. We use Gaussian processes to model the randomness of machine learning algorithms, and validate LOOD with extensive empirical analysis of leakage using membership inference attacks. Our analytical framework enables us to investigate the causes of leakage and where the leakage is high. For example, we analyze the influence of activation functions, on data memorization. Additionally, our method allows us to identify queries that disclose the most information about the training data in the leave-one-out setting. 
We illustrate how optimal queries can be used for accurate **reconstruction** of training data.", "keywords": "memorization;influence estimation;information leakage;neural network Gaussian process", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "Jiayuan Ye;Anastasia Borovykh;Soufiane Hayou;Reza Shokri", "authorids": "~Jiayuan_Ye1;~Anastasia_Borovykh1;~Soufiane_Hayou1;~Reza_Shokri1", "gender": ";;M;", "homepage": ";;https://www.soufianehayou.com/;", "dblp": ";;220/5617;", "google_scholar": ";;https://scholar.google.com/citations?hl=en;", "orcid": ";;;", "linkedin": ";;;", "or_profile": "~Jiayuan_Ye1;~Anastasia_Borovykh1;~Soufiane_Hayou1;~Reza_Shokri1", "aff": ";;National University of Singapore;", "aff_domain": ";;nus.edu.sg;", "position": ";;Assistant Professor;", "bibtex": "@inproceedings{\nye2024leaveoneout,\ntitle={Leave-one-out Distinguishability in Machine Learning},\nauthor={Jiayuan Ye and Anastasia Borovykh and Soufiane Hayou and Reza Shokri},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=9RNfX0ah0K}\n}", "github": "", "project": "", "reviewers": "s1Kq;Azxn;mmKM;rJTi", "pdf_size": 5745906, "rating": "5;6;6;8", "confidence": "4;3;3;2", "soundness": "3;3;3;3", "contribution": "3;3;3;3", "presentation": "3;3;2;3", "wc_summary": "82;294;107;158", "wc_strengths": "80;88;25;59", "wc_weaknesses": "242;128;122;16", "wc_questions": "52;30;24;43", "wc_review": "456;540;278;276", "wc_reply_reviewers": "0;0;0;4", "wc_reply_authors": "1113;947;0;368", "reply_reviewers": "0;0;0;1", "reply_authors": "2;2;0;1", "rating_avg": [ 6.25, 1.0897247358851685 ], "confidence_avg": [ 3.0, 0.7071067811865476 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 160.25, 81.93404359605353 ], "wc_strengths_avg": [ 63.0, 24.361855430159665 ], "wc_weaknesses_avg": [ 127.0, 79.95623803056269 ], "wc_questions_avg": [ 37.25, 10.940178243520533 ], "wc_review_avg": [ 387.5, 114.42355526726129 ], "wc_reply_reviewers_avg": [ 1.0, 1.7320508075688772 ], "wc_reply_authors_avg": [ 607.0, 446.43196570138207 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.25, 0.82915619758885 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.9733285267845754, "gs_citation": 12, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11532538955694417653&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=9RNfX0ah0K", "pdf": "https://openreview.net/pdf?id=9RNfX0ah0K", "email": ";;nus.edu.sg;", "author_num": 4, "aff_unique_index": "0", "aff_unique_norm": "National University of Singapore", "aff_unique_dep": "", "aff_unique_url": "https://www.nus.edu.sg", "aff_unique_abbr": "NUS", "aff_country_unique_index": "0", "aff_country_unique": "Singapore" }, { "title": "NECO: NEural Collapse Based Out-of-distribution detection", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19295", "id": "9ROuKblmi7", "author_site": "Mou\u00efn Ben Ammar, Nacim Belkhir, Sebastian Popescu, Antoine Manzanera, Gianni Franchi", "tldr": "", "abstract": "Detecting out-of-distribution (OOD) data is a critical challenge in machine learning due to model overconfidence, often without awareness of their epistemological limits. 
We hypothesize that \"neural collapse\", a phenomenon affecting in-distribution data for models trained beyond loss convergence, also influences OOD data. To benefit from this interplay, we introduce NECO, a novel post-hoc method for OOD detection, which leverages the geometric properties of \u201cneural collapse\u201d and of principal component spaces to identify OOD data. Our extensive experiments demonstrate that NECO achieves state-of-the-art results on both small and large-scale OOD detection tasks while exhibiting strong generalization capabilities across different network architectures. Furthermore, we provide a theoretical explanation for the effectiveness of our method in OOD detection. We plan to release the code after the anonymity period.", "keywords": "anomaly detection;OOD", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/6ac26ebf27b2712ee42924778a40e47549861536.zip", "author": "Mou\u00efn Ben Ammar;Nacim Belkhir;Sebastian Popescu;Antoine Manzanera;Gianni Franchi", "authorids": "~Mou\u00efn_Ben_Ammar1;~Nacim_Belkhir1;~Sebastian_Popescu1;~Antoine_Manzanera1;~Gianni_Franchi1", "gender": "M;M;M;M;M", "homepage": ";https://www.linkedin.com/in/belkhirnacim;;https://perso.ensta-paris.fr/~manzaner/;https://giannifranchi.github.io/", "dblp": "359/1584;;;73/2951;155/3061", "google_scholar": "https://scholar.google.com/citations?hl=en;As-piMYAAAAJ;FKDRATgAAAAJ;YBJbAhoAAAAJ;ZCW6-psAAAAJ", "orcid": ";;;0000-0001-5718-411X;0000-0002-2184-1381", "linkedin": "mouinbenammar/;;;;gianni-franchi-94435754/", "or_profile": "~Mou\u00efn_Ben_Ammar1;~Nacim_Belkhir1;~Sebastian_Popescu1;~Antoine_Manzanera1;~Gianni_Franchi1", "aff": "ENSTA Paris;Safran;Find&Order;Ecole Nationale Sup\u00e9rieure de Techniques Avanc\u00e9es;ENSTA Paris", "aff_domain": "ensta-paristech.fr;safrangroup.com;findnorder.com;ensta-paris.fr;ensta-paristech.fr", "position": "PhD student;Researcher;Researcher;Full Professor;Assistant Professor", "bibtex": "@inproceedings{\nammar2024neco,\ntitle={{NECO}: {NE}ural Collapse Based Out-of-distribution detection},\nauthor={Mou{\\\"\\i}n Ben Ammar and Nacim Belkhir and Sebastian Popescu and Antoine Manzanera and Gianni Franchi},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=9ROuKblmi7}\n}", "github": "", "project": "", "reviewers": "1ZaR;Qb8y;Ek3F;r6r7", "pdf_size": 6740316, "rating": "5;6;6;6", "confidence": "3;3;4;4", "soundness": "2;2;3;2", "contribution": "2;2;3;3", "presentation": "2;2;3;3", "wc_summary": "73;75;49;57", "wc_strengths": "72;54;49;38", "wc_weaknesses": "63;121;84;257", "wc_questions": "237;124;11;11", "wc_review": "445;374;193;363", "wc_reply_reviewers": "0;127;0;0", "wc_reply_authors": "540;1372;366;526", "reply_reviewers": "0;2;0;0", "reply_authors": "2;4;2;2", "rating_avg": [ 5.75, 0.4330127018922193 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 63.5, 10.897247358851684 ], "wc_strengths_avg": [ 53.25, 12.275483697190918 ], "wc_weaknesses_avg": [ 131.25, 75.51283003569658 ], "wc_questions_avg": [ 95.75, 93.69465032754005 ], "wc_review_avg": [ 343.75, 92.5509994543549 ], "wc_reply_reviewers_avg": [ 31.75, 54.99261314031185 ], "wc_reply_authors_avg": [ 701.0, 393.38657831705444 ], "reply_reviewers_avg": [ 0.5, 0.8660254037844386 ], "reply_authors_avg": [ 2.5, 
0.8660254037844386 ], "replies_avg": [ 21, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.5773502691896257, "gs_citation": 20, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=4653753281710190123&as_sdt=40005&sciodt=0,10&hl=en", "gs_version_total": 10, "openreview": "https://openreview.net/forum?id=9ROuKblmi7", "pdf": "https://openreview.net/pdf?id=9ROuKblmi7", "email": "ensta-paristech.fr;safrangroup.com;findnorder.com;ensta-paris.fr;ensta-paristech.fr", "author_num": 5, "aff_unique_index": "0;1;2;3;0", "aff_unique_norm": "\u00c9cole Nationale Sup\u00e9rieure de Techniques Avanc\u00e9es;Safran;Find&Order;Ecole Nationale Sup\u00e9rieure de Techniques Avanc\u00e9es", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.ensta.fr;https://www.safran-group.com;;https://www.ensae.fr", "aff_unique_abbr": "ENSTA;;;ENSTA", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Paris;", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "France;" }, { "id": "9St5HsXMOr", "title": "Long-range Meta-path Search through Progressive Sampling on Large-scale Heterogeneous Information Networks", "track": "main", "status": "Reject", "tldr": "", "abstract": "Utilizing long-range dependency, though extensively studied in homogeneous graphs, is rarely studied in large-scale heterogeneous information networks (HINs), whose main challenge is the high costs and the difficulty in utilizing effective information. To this end, we investigate the importance of different meta-paths and propose an automatic framework for utilizing long-range dependency in HINs, called Long-range Meta-path Search through Progressive Sampling (LMSPS). Specifically, to discover meta-paths for various datasets or tasks without prior, we develop a search space with all target-node-related meta-paths. With a progressive sampling algorithm, we dynamically shrink the search space with hop-independent time complexity, leading to a compact search space driven by the current HIN and task. Utilizing a sampling evaluation strategy as the guidance, we conduct a specialized and expressive meta-path selection. Extensive experiments on eight heterogeneous datasets demonstrate that LMSPS discovers effective long-range meta-paths and outperforms state-of-the-art models. 
Besides, it ranks top-1 on the leaderboards of ogbn-mag in Open Graph Benchmark.", "keywords": "Neural architecture search;heterogeneous graph neural networks;long-range dependency;meta-path search", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/3b1003a69e73a2a2719eaab2b87fa49fc9612f95.zip", "author": "Chao Li;Zijie Guo;Qiuting He;Hao Xu;Kun He", "authorids": "~Chao_Li14;~Zijie_Guo1;~Qiuting_He1;~Hao_Xu11;~Kun_He1", "gender": "M;;M;M;F", "homepage": "https://github.com/lichaoaaron;;;http://www.masterx.top/;http://faculty.hust.edu.cn/hekun/zh_CN/more/1411001/jsjjgd/index.htm", "dblp": ";;https://dblp.uni-trier.de/pid/322/9335.html;43/6008;59/1028-1", "google_scholar": "Wik8bkIAAAAJ;;;8zcB6s4AAAAJ;YTQnGJsAAAAJ", "orcid": "0000-0001-9066-1440;;;0000-0003-4207-6161;0000-0001-7627-4604", "linkedin": ";;;;", "or_profile": "~Chao_Li14;~Zijie_Guo1;~Qiuting_He1;~Hao_Xu11;~Kun_He1", "aff": "Huazhong University of Science and Technology;;;Huazhong University of Science and Technology;Huazhong University of Sceince and Technology", "aff_domain": "hust.edu.cn;;;hust.edu.cn;hust.edu.cn", "position": "PhD student;;;MS student;Full Professor", "bibtex": "@misc{\nli2024longrange,\ntitle={Long-range Meta-path Search through Progressive Sampling on Large-scale Heterogeneous Information Networks},\nauthor={Chao Li and Zijie Guo and Qiuting He and Hao Xu and Kun He},\nyear={2024},\nurl={https://openreview.net/forum?id=9St5HsXMOr}\n}", "github": "", "project": "", "reviewers": "f416;vDix;dvsv;kpcU;zWVu", "site": "https://openreview.net/forum?id=9St5HsXMOr", "pdf_size": 624254, "rating": "5;5;5;5;8", "confidence": "4;4;3;4;3", "soundness": "3;2;3;3;4", "contribution": "2;2;2;3;3", "presentation": "3;3;2;2;3", "wc_summary": "93;73;119;124;84", "wc_strengths": "33;48;38;59;33", "wc_weaknesses": "138;555;150;175;49", "wc_questions": "21;2;51;3;51", "wc_review": "285;678;358;361;217", "wc_reply_reviewers": "12;0;0;28;0", "wc_reply_authors": "955;1606;918;749;590", "reply_reviewers": "1;0;0;1;0", "reply_authors": "2;3;2;1;1", "rating_avg": [ 5.6, 1.2 ], "confidence_avg": [ 3.6, 0.4898979485566356 ], "soundness_avg": [ 3.0, 0.6324555320336759 ], "contribution_avg": [ 2.4, 0.4898979485566356 ], "presentation_avg": [ 2.6, 0.4898979485566356 ], "wc_summary_avg": [ 98.6, 19.80504986108341 ], "wc_strengths_avg": [ 42.2, 10.02796090937734 ], "wc_weaknesses_avg": [ 213.4, 176.00977245596337 ], "wc_questions_avg": [ 25.6, 21.813757127097567 ], "wc_review_avg": [ 379.8, 158.26736871509556 ], "wc_reply_reviewers_avg": [ 8.0, 11.027239001672177 ], "wc_reply_authors_avg": [ 963.6, 346.5432729111907 ], "reply_reviewers_avg": [ 0.4, 0.48989794855663565 ], "reply_authors_avg": [ 1.8, 0.7483314773547883 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.6123724356957945, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:4lJBZmkZIaYJ:scholar.google.com/&scioq=Long-range+Meta-path+Search+through+Progressive+Sampling+on+Large-scale+Heterogeneous+Information+Networks&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;0", "aff_unique_norm": "Huazhong University of Science and Technology", "aff_unique_dep": "", "aff_unique_url": "http://www.hust.edu.cn", "aff_unique_abbr": "HUST", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "China" }, { "id": "9SwObx9Jdn", "title": "Generation of Geodesics 
with Actor-Critic Reinforcement Learning to Predict Midpoints", "track": "main", "status": "Reject", "tldr": "", "abstract": "Various tasks in the real world, such as path planning, can be reduced to the generation of geodesics on manifolds. For reinforcement learning to generate geodesics sequentially, we need to define rewards appropriately. To generate geodesics without any adjustment of rewards, we propose to use a modified version of sub-goal trees, called midpoint trees. While sub-goal trees consist of arbitrary intermediate points, midpoint trees consist of midpoints. In addition, we propose an actor-critic method to learn to predict midpoints and theoretically prove that, under mild assumptions, when the learning converges at the limit of infinite tree depth, the resulting policy generates exact midpoints.\nWe show experimentally that our proposed method outperforms existing methods in a certain path planning task.", "keywords": "reinforcement learning;actor-critic method;path planning;path optimization;subgoal;midpoint;geodesic;Finsler geometry", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/88737306bff9b1bedc84e99ad1af389499b699d6.zip", "author": "Kazumi Kasaura", "authorids": "~Kazumi_Kasaura1", "gender": "", "homepage": "", "dblp": "334/3342.html", "google_scholar": "rONY2jEAAAAJ", "orcid": "0000-0002-3219-9961", "linkedin": "", "or_profile": "~Kazumi_Kasaura1", "aff": "OMRON SINIC X Corporation", "aff_domain": "sinicx.com", "position": "Researcher", "bibtex": "@misc{\nkasaura2024generation,\ntitle={Generation of Geodesics with Actor-Critic Reinforcement Learning to Predict Midpoints},\nauthor={Kazumi Kasaura},\nyear={2024},\nurl={https://openreview.net/forum?id=9SwObx9Jdn}\n}", "github": "", "project": "", "reviewers": "8vLp;4ppY;etxs;ZvgN", "site": "https://openreview.net/forum?id=9SwObx9Jdn", "pdf_size": 757217, "rating": "3;5;5;6", "confidence": "3;1;2;3", "soundness": "3;3;3;3", "contribution": "2;2;2;3", "presentation": "2;3;3;3", "wc_summary": "55;93;82;80", "wc_strengths": "49;18;60;37", "wc_weaknesses": "125;137;351;63", "wc_questions": "106;45;70;66", "wc_review": "335;293;563;246", "wc_reply_reviewers": "55;0;0;0", "wc_reply_authors": "597;257;472;216", "reply_reviewers": "1;0;0;0", "reply_authors": "3;1;2;1", "rating_avg": [ 4.75, 1.0897247358851685 ], "confidence_avg": [ 2.25, 0.82915619758885 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 77.5, 13.901438774457844 ], "wc_strengths_avg": [ 41.0, 15.572411502397436 ], "wc_weaknesses_avg": [ 169.0, 108.76580344942982 ], "wc_questions_avg": [ 71.75, 21.935986415021322 ], "wc_review_avg": [ 359.25, 121.77515140618796 ], "wc_reply_reviewers_avg": [ 13.75, 23.81569860407206 ], "wc_reply_authors_avg": [ 385.5, 156.09051861019617 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.75, 0.82915619758885 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 1, 0 ], "corr_rating_confidence": -0.20751433915982243, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:-hXDlkd16w4J:scholar.google.com/&scioq=Generation+of+Geodesics+with+Actor-Critic+Reinforcement+Learning+to+Predict+Midpoints&hl=en&as_sdt=0,5", "gs_version_total": 3, "aff_unique_index": "0", "aff_unique_norm": "OMRON Corporation", "aff_unique_dep": "", "aff_unique_url": "https://www.omron.com", "aff_unique_abbr": "OMRON", "aff_country_unique_index": "0", 
"aff_country_unique": "Japan" }, { "id": "9TG42oozQP", "title": "Causal Effect Estimation with Mixed Latent Confounders and Post-treatment Variables", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "In recent years, causal inference from observational data has attracted considerable attention among researchers. One main obstacle for inferring causal effects from observational data is the handling of confounders. As direct measurement of confounders may not always be feasible, recent methods seek to adjust the confounding effects based on proxy variables, which are high-dimensional features researchers postulated to be determined by the latent confounders. However, observed features may scramble both latent confounders and post-treatment variables simultaneously in observational study, where existing methods risk distorting the estimation by unintentionally controlling variables affected by the treatment. In this paper, we systematically investigate the latent post-treatment bias in causal inference. We first derive the bias of existing methods when the selected proxies scramble both latent confounders and post-treatment variables, which we demonstrate can be arbitrarily bad. We then propose a novel Confounder-identifiable VAE (CiVAE) to address the bias, built upon the assumption that the prior of latent variables belongs to the general exponential family with at least one invertible sufficient statistic in the factorized part. Based on this, we show that latent confounders and latent post-treatment variables can be properly distinguished. Furthermore, we show that latent confounders can be identified up to simple bijective transformations. Finally, we prove that the true causal effects can be unbiasedly estimated with transformed confounder proxies. 
Experiments on both simulated and real-world datasets demonstrate that CiVAE is significantly more robust than existing methods.", "keywords": "Causal Inference;Latent Post-treatment Bias;Proxy of Confounders;Identifiable VAE", "primary_area": "causal reasoning", "supplementary_material": "", "author": "Yaochen Zhu;Jing Ma;Liang Wu;Qi Guo;Liangjie Hong;Jundong Li", "authorids": "~Yaochen_Zhu1;~Jing_Ma2;~Liang_Wu3;~Qi_Guo9;~Liangjie_Hong1;~Jundong_Li2", "gender": "M;F;M;M;M;M", "homepage": "http://www.ychzhu.com/;https://jma712.github.io/;http://liangwu.me/;https://qiguo.xyz/;https://www.hongliangjie.com/;https://jundongli.github.io/", "dblp": "251/3533;96/6129-2;https://dblp.org/pers/hd/w/Wu_0006:Liang;67/398-3;00/7186;144/7997.html", "google_scholar": "mNKYtHEAAAAJ;VLElvX8AAAAJ;r2BP6FsAAAAJ;IatRsPEAAAAJ;4uaSNpYAAAAJ;uY6ek7sAAAAJ", "orcid": ";;;0009-0009-0078-1533;;", "linkedin": ";;wuliang1/;qi-guo/;liangjiehong/;", "or_profile": "~Yaochen_Zhu1;~Jing_Ma2;~Liang_Wu3;~Qi_Guo9;~Liangjie_Hong1;~Jundong_Li2", "aff": "LinkedIn;Case Western Reserve University;LinkedIn;LinkedIn;LinkedIn;University of Virginia", "aff_domain": "linkedin.com;case.edu;linkedin.com;linkedin.com;linkedin.com;virginia.edu", "position": "Intern;Assistant Professor;Applied Scientist;Researcher;Researcher;Assistant Professor", "bibtex": "@misc{\nzhu2024causal,\ntitle={Causal Effect Estimation with Mixed Latent Confounders and Post-treatment Variables},\nauthor={Yaochen Zhu and Jing Ma and Liang Wu and Qi Guo and Liangjie Hong and Jundong Li},\nyear={2024},\nurl={https://openreview.net/forum?id=9TG42oozQP}\n}", "github": "", "project": "", "reviewers": "cihL;Eaxa;gqDy;wUiz", "site": "https://openreview.net/forum?id=9TG42oozQP", "pdf_size": 458832, "rating": "3;3;5;5", "confidence": "3;4;3;3", "soundness": "2;3;3;3", "contribution": "2;2;2;2", "presentation": "2;2;3;2", "wc_summary": "46;27;100;38", "wc_strengths": "29;25;25;29", "wc_weaknesses": "697;211;188;229", "wc_questions": "2;2;22;2", "wc_review": "774;265;335;298", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 52.75, 28.101378969723175 ], "wc_strengths_avg": [ 27.0, 2.0 ], "wc_weaknesses_avg": [ 331.25, 211.66527230511858 ], "wc_questions_avg": [ 7.0, 8.660254037844387 ], "wc_review_avg": [ 418.0, 207.02294558816422 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:-W6LS7n_ENoJ:scholar.google.com/&scioq=Causal+Effect+Estimation+with+Mixed+Latent+Confounders+and+Post-treatment+Variables&hl=en&as_sdt=0,33", "gs_version_total": 2, "aff_unique_index": "0;1;0;0;0;2", "aff_unique_norm": "LinkedIn Corporation;Case Western Reserve University;University of Virginia", "aff_unique_dep": ";;", "aff_unique_url": "https://www.linkedin.com;https://www.case.edu;https://www.virginia.edu", "aff_unique_abbr": "LinkedIn;CWRU;UVA", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "9TJDsOEaBC", "title": "Bayesian Vector
Optimization with Gaussian Processes", "track": "main", "status": "Reject", "tldr": "", "abstract": "Learning problems in which multiple conflicting objectives must be considered simultaneously often arise in various fields, including engineering, drug design, and environmental management. Traditional methods of multi-objective optimization, such as scalarization and identification of the Pareto set under componentwise order, have limitations in incorporating objective preferences and exploring the solution space accordingly. While vector optimization offers improved flexibility and adaptability via specifying partial orders based on ordering cones, current techniques designed for sequential experiments suffer from high sample complexity, which makes them unfit for large-scale learning problems. To address this issue, we propose VOGP, an ($\\epsilon,\\delta$)-PAC adaptive elimination algorithm that performs vector optimization using Gaussian processes. VOGP allows users to convey objective preferences through ordering cones while performing efficient sampling by exploiting the smoothness of the objective function, resulting in a more effective optimization process that requires fewer evaluations. We first establish provable theoretical guarantees for VOGP, and then derive information gain based and kernel specific sample complexity bounds. VOGP demonstrates strong empirical results on both real-world and synthetic datasets, outperforming previous work in sequential vector optimization and its special case multi-objective optimization. This work highlights the potential of VOGP as a powerful preference-driven method for addressing complex sequential vector optimization problems.", "keywords": "Vector Optimization;Bayesian Optimization;Gaussian Processes;Ordering Cones", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/9ea67f537d09082f69a1d889d546c9ec75f82025.zip", "author": "\u0130lter Onat Korkmaz;Cagin Ararat;Cem Tekin", "authorids": "~\u0130lter_Onat_Korkmaz1;~Cagin_Ararat1;~Cem_Tekin2", "gender": "M;M;M", "homepage": ";https://sites.google.com/view/cararat;http://kilyos.ee.bilkent.edu.tr/~cemtekin/", "dblp": ";268/5341;98/7659.html", "google_scholar": "qlway8sAAAAJ;;https://scholar.google.com/citations?hl=tr", "orcid": ";0000-0002-6985-7665;", "linkedin": "ilter-onat-korkmaz-352998180/;;", "or_profile": "~\u0130lter_Onat_Korkmaz1;~Cagin_Ararat1;~Cem_Tekin2", "aff": "Bilkent University;Bilkent University;Bilkent University", "aff_domain": "bilkent.edu.tr;bilkent.edu.tr;bilkent.edu.tr", "position": "MS student;Assistant Professor;Associate Professor", "bibtex": "@misc{\nkorkmaz2024bayesian,\ntitle={Bayesian Vector Optimization with Gaussian Processes},\nauthor={{\\.I}lter Onat Korkmaz and Cagin Ararat and Cem Tekin},\nyear={2024},\nurl={https://openreview.net/forum?id=9TJDsOEaBC}\n}", "github": "", "project": "", "reviewers": "bF5L;ahkf;XrYo;vz76", "site": "https://openreview.net/forum?id=9TJDsOEaBC", "pdf_size": 699313, "rating": "5;5;5;6", "confidence": "5;2;3;2", "soundness": "2;2;2;3", "contribution": "2;3;2;3", "presentation": "2;2;3;3", "wc_summary": "75;116;115;64", "wc_strengths": "24;99;59;8", "wc_weaknesses": "59;157;308;6", "wc_questions": "570;135;152;1", "wc_review": "728;507;634;79", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "789;647;635;96", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 5.25, 0.4330127018922193 ], "confidence_avg": [ 3.0, 1.224744871391589 ], "soundness_avg": [ 2.25, 0.4330127018922193 
], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 92.5, 23.32916629457641 ], "wc_strengths_avg": [ 47.5, 34.98928407384181 ], "wc_weaknesses_avg": [ 132.5, 114.89669272872914 ], "wc_questions_avg": [ 214.5, 213.41801704635904 ], "wc_review_avg": [ 487.0, 248.2710212650683 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 541.75, 264.38549033560827 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.4714045207910316, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=17018310508350217774&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 0, "aff_unique_index": "0;0;0", "aff_unique_norm": "Bilkent University", "aff_unique_dep": "", "aff_unique_url": "https://www.bilkent.edu.tr", "aff_unique_abbr": "Bilkent", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "T\u00fcrkiye" }, { "id": "9TSv6ZVhvN", "title": "Improving Accelerated Federated Learning with Compression and Importance Sampling", "track": "main", "status": "Reject", "tldr": "", "abstract": "Federated Learning is a collaborative training framework that leverages heterogeneous data distributed across a vast number of clients. Since it is practically infeasible to request and process all clients during the aggregation step, partial participation must be supported. In this setting, the communication between the server and clients poses a major bottleneck. To reduce communication loads, there are two main approaches: compression and local steps. Recent work by Mishchenko et al. [2022] introduced the new ProxSkip method, which achieves an accelerated rate using the local steps technique. Follow-up works successfully combined local steps acceleration with partial participation [Grudzie\u0144 et al., 2023, Condat et al. 2023] and gradient compression [Condat et al. [2022]. In this paper, we finally present a complete method for Federated Learning that incorporates all necessary ingredients: Local Training, Compression, and Partial Participation. We obtain state-of-the-art convergence guarantees in the considered setting. Moreover, we analyze the general sampling framework for partial participation and derive an importance sampling scheme, which leads to even better performance. 
We experimentally demonstrate the advantages of the proposed method in practice.", "keywords": "Machine Learning;Optimization;Federated Learning", "primary_area": "optimization", "supplementary_material": "", "author": "Micha\u0142 Grudzie\u0144;Grigory Malinovsky;Peter Richt\u00e1rik", "authorids": "~Micha\u0142_Grudzie\u01441;~Grigory_Malinovsky1;~Peter_Richt\u00e1rik1", "gender": "M;M;M", "homepage": ";https://grigory-malinovsky.github.io;https://richtarik.org", "dblp": ";262/3277.html;62/8001", "google_scholar": "vN2ALVYAAAAJ;4w2W9KQAAAAJ;https://scholar.google.com/citations?hl=en", "orcid": ";;0000-0003-4380-5848", "linkedin": "micha%C5%82-grudzie%C5%84-2141a2198/;;richtarik/", "or_profile": "~Micha\u0142_Grudzie\u01441;~Grigory_Malinovsky1;~Peter_Richtarik1", "aff": "University of Oxford;Samsung;King Abdullah University of Science and Technology (KAUST)", "aff_domain": "ox.ac.uk;samsung.com;kaust.edu.sa", "position": "Undergrad student;Intern;Full Professor", "bibtex": "@misc{\ngrudzie{\\'n}2024improving,\ntitle={Improving Accelerated Federated Learning with Compression and Importance Sampling},\nauthor={Micha{\\l} Grudzie{\\'n} and Grigory Malinovsky and Peter Richt{\\'a}rik},\nyear={2024},\nurl={https://openreview.net/forum?id=9TSv6ZVhvN}\n}", "github": "", "project": "", "reviewers": "AQbc;ii5V;SCZT", "site": "https://openreview.net/forum?id=9TSv6ZVhvN", "pdf_size": 590601, "rating": "3;3;8", "confidence": "3;4;2", "soundness": "2;2;4", "contribution": "2;2;2", "presentation": "2;3;4", "wc_summary": "36;32;26", "wc_strengths": "26;43;30", "wc_weaknesses": "62;284;53", "wc_questions": "116;2;2", "wc_review": "240;361;111", "wc_reply_reviewers": "381;0;0", "wc_reply_authors": "3240;1105;537", "reply_reviewers": "2;0;0", "reply_authors": "6;2;1", "rating_avg": [ 4.666666666666667, 2.357022603955158 ], "confidence_avg": [ 3.0, 0.816496580927726 ], "soundness_avg": [ 2.6666666666666665, 0.9428090415820634 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 3.0, 0.816496580927726 ], "wc_summary_avg": [ 31.333333333333332, 4.109609335312651 ], "wc_strengths_avg": [ 33.0, 7.2571803523590805 ], "wc_weaknesses_avg": [ 133.0, 106.8363234110946 ], "wc_questions_avg": [ 40.0, 53.74011537017761 ], "wc_review_avg": [ 237.33333333333334, 102.07948972355916 ], "wc_reply_reviewers_avg": [ 127.0, 179.60512242138307 ], "wc_reply_authors_avg": [ 1627.3333333333333, 1163.6655686044662 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.9428090415820634 ], "reply_authors_avg": [ 3.0, 2.160246899469287 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.8660254037844387, "gs_citation": 15, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12607570230306687324&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 6, "aff_unique_index": "0;1;2", "aff_unique_norm": "University of Oxford;Samsung;King Abdullah University of Science and Technology", "aff_unique_dep": ";Samsung;", "aff_unique_url": "https://www.ox.ac.uk;https://www.samsung.com;https://www.kaust.edu.sa", "aff_unique_abbr": "Oxford;Samsung;KAUST", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;2", "aff_country_unique": "United Kingdom;South Korea;Saudi Arabia" }, { "id": "9UGAUQjibp", "title": "Quantized Local Independence Discovery for Fine-Grained Causal Dynamics Learning in Reinforcement Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "Incorporating causal relationships between the variables into dynamics learning has emerged as a 
promising approach to enhance robustness and generalization in reinforcement learning (RL). Recent studies have focused on examining conditional independences and leveraging only relevant state and action variables for prediction. However, such approaches tend to overlook local independence relationships that hold under certain circumstances referred as event. In this work, we present a theoretically-grounded and practical approach to dynamics learning which discovers such meaningful events and infers fine-grained causal relationships. The key idea is to learn a discrete latent variable that represents the pair of event and causal relationships specific to the event via vector quantization. As a result, our method provides a fine-grained understanding of the dynamics by capturing event-specific causal relationships, leading to improved robustness and generalization in RL. Experimental results demonstrate that our method is more robust to unseen states and generalizes well to downstream tasks compared to prior approaches. In addition, we find that our method successfully identifies meaningful events and recovers event-specific causal relationships.", "keywords": "Reinforcement learning;Causal reasoning;Local independence", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Inwoo Hwang;Yunhyeok Kwak;Suhyung Choi;Byoung-Tak Zhang;Sanghack Lee", "authorids": "~Inwoo_Hwang1;~Yunhyeok_Kwak1;~Suhyung_Choi2;~Byoung-Tak_Zhang1;~Sanghack_Lee1", "gender": ";M;M;M;M", "homepage": "https://iwhwang.github.io;https://yun-kwak.github.io;https://www.github.com/conscious-choi;https://bi.snu.ac.kr/~btzhang/;http://www.sanghacklee.me", "dblp": "317/0732;332/4729;376/2355;09/5682;20/1133", "google_scholar": "MuG6Le8AAAAJ;rhyhnRYAAAAJ;jPcpT2MAAAAJ;sYTUOu8AAAAJ;https://scholar.google.com/citations?hl=en", "orcid": ";0009-0001-5491-3492;;;0000-0001-7137-6126", "linkedin": ";;;;sanghack-lee-65b52a28/", "or_profile": "~Inwoo_Hwang1;~Yunhyeok_Kwak1;~Suhyung_Choi2;~Byoung-Tak_Zhang1;~Sanghack_Lee1", "aff": "Seoul National University;Seoul National University;Seoul National University;Seoul National University;Seoul National University", "aff_domain": "snu.ac.kr;snu.ac.kr;snu.ac.kr;snu.ac.kr;snu.ac.kr", "position": "PhD student;MS student;PhD student;Full Professor;Assistant Professor", "bibtex": "@misc{\nhwang2024quantized,\ntitle={Quantized Local Independence Discovery for Fine-Grained Causal Dynamics Learning in Reinforcement Learning},\nauthor={Inwoo Hwang and Yunhyeok Kwak and Suhyung Choi and Byoung-Tak Zhang and Sanghack Lee},\nyear={2024},\nurl={https://openreview.net/forum?id=9UGAUQjibp}\n}", "github": "", "project": "", "reviewers": "RHPG;Ufsn;eMfR;JfxM;s5uf", "site": "https://openreview.net/forum?id=9UGAUQjibp", "pdf_size": 12317800, "rating": "5;6;6;6;6", "confidence": "3;3;1;3;3", "soundness": "1;3;2;2;3", "contribution": "2;3;3;3;3", "presentation": "1;3;3;3;3", "wc_summary": "144;44;46;52;55", "wc_strengths": "120;71;48;26;53", "wc_weaknesses": "516;21;18;39;180", "wc_questions": "643;56;265;40;210", "wc_review": "1423;192;377;157;498", "wc_reply_reviewers": "550;0;0;18;16", "wc_reply_authors": "1655;302;938;313;742", "reply_reviewers": "3;0;0;1;1", "reply_authors": "4;1;3;1;1", "rating_avg": [ 5.8, 0.39999999999999997 ], "confidence_avg": [ 2.6, 0.8 ], "soundness_avg": [ 2.2, 0.7483314773547882 ], "contribution_avg": [ 2.8, 0.39999999999999997 ], "presentation_avg": [ 2.6, 0.8000000000000002 ], "wc_summary_avg": [ 68.2, 38.107217164206574 ], "wc_strengths_avg": [ 63.6, 
31.639216172339037 ], "wc_weaknesses_avg": [ 154.8, 190.32960883688065 ], "wc_questions_avg": [ 242.8, 218.059991745391 ], "wc_review_avg": [ 529.4, 463.73552807607916 ], "wc_reply_reviewers_avg": [ 116.8, 216.7343073904083 ], "wc_reply_authors_avg": [ 790.0, 497.61551422760124 ], "reply_reviewers_avg": [ 1.0, 1.0954451150103321 ], "reply_authors_avg": [ 2.0, 1.2649110640673518 ], "replies_avg": [ 24, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.25, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=1663183835689284920&as_sdt=40005&sciodt=0,10&hl=en", "gs_version_total": 2, "aff_unique_index": "0;0;0;0;0", "aff_unique_norm": "Seoul National University", "aff_unique_dep": "", "aff_unique_url": "https://www.snu.ac.kr", "aff_unique_abbr": "SNU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "South Korea" }, { "title": "De novo Protein Design Using Geometric Vector Field Networks", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19294", "id": "9UIGyJJpay", "author_site": "weian mao, Muzhi Zhu, Zheng Sun, Shuaike Shen, Lin Yuanbo Wu, Hao Chen, Chunhua Shen", "tldr": "", "abstract": "Advances like protein diffusion have marked revolutionary progress in $\\textit{de novo}$ protein design, a central topic in life science. These methods typically depend on protein structure encoders to model residue backbone frames, where atoms do not exist. Most prior encoders rely on atom-wise features, such as angles and distances between atoms, which are not available in this context. Only a few basic encoders, like IPA, have been proposed for this scenario, exposing frame modeling as a bottleneck. In this work, we introduce the Vector Field Network (VFN), which enables network layers to perform learnable vector computations between coordinates of frame-anchored virtual atoms, thus achieving a higher capability for modeling frames. The vector computation operates in a manner similar to a linear layer, with each input channel receiving 3D virtual atom coordinates instead of scalar values. The multiple feature vectors output by the vector computation are then used to update the residue representations and virtual atom coordinates via attention aggregation. Remarkably, VFN also excels in modeling both frames and atoms, as the real atoms can be treated as the virtual atoms for modeling, positioning VFN as a potential $\\textit{universal encoder}$. In protein diffusion (frame modeling), VFN exhibits an impressive performance advantage over IPA, excelling in terms of both designability ($\\textbf{67.04}$\\% vs. 53.58\\%) and diversity ($\\textbf{66.54}$\\% vs. 51.98\\%). In inverse folding (frame and atom modeling), VFN outperforms the previous SoTA model, PiFold ($\\textbf{54.7}$\\% vs. 51.66\\%), on sequence recovery rate; we also propose a method of equipping VFN with the ESM model, which significantly surpasses the previous ESM-based SoTA ($\\textbf{62.67}$\\% vs. 55.65\\%), LM-Design, by a substantial margin.
Code is available at https://github.com/aim-uofa/VFN", "keywords": "Protein design;Protein structure encoder;Inverse folding;Protein diffusion", "primary_area": "applications to physical sciences (physics, chemistry, biology, etc.)", "supplementary_material": "", "author": "Weian Mao;Muzhi Zhu;Zheng Sun;Shuaike Shen;Lin Yuanbo Wu;Hao Chen;Chunhua Shen", "authorids": "~Weian_Mao2;~Muzhi_Zhu1;~Zheng_Sun7;~Shuaike_Shen1;~Lin_Yuanbo_Wu1;~Hao_Chen17;~Chunhua_Shen2", "gender": "M;M;M;;F;;", "homepage": ";https://z-mu-z.github.io/;https://ringhalsun.github.io/;;https://sites.google.com/site/linwuuq/home;;", "dblp": "289/1631;157/1679;;;65/6292-1;;", "google_scholar": "Qu-QXTsAAAAJ;https://scholar.google.com.hk/citations?user=064gBH4AAAAJ;https://scholar.google.com/citations?hl=en;;https://scholar.google.com.au/citations?user=mMiJUegAAAAJ;;", "orcid": ";;;;0000-0001-6119-058X;;", "linkedin": ";;;;;;", "or_profile": "~Weian_Mao2;~Muzhi_Zhu1;~Zheng_Sun7;~Shuaike_Shen1;~Lin_Yuanbo_Wu1;~Hao_Chen17;~Chunhua_Shen2", "aff": "University of Adelaide;Zhejiang University;Swansea University;;Swansea University;;", "aff_domain": "adelaide.edu.au;zju.edu.cn;swansea.ac.uk;;swansea.ac.uk;;", "position": "PhD student;PhD student;MS student;;Associate Professor;;", "bibtex": "@inproceedings{\nmao2024de,\ntitle={De novo Protein Design Using Geometric Vector Field Networks},\nauthor={Weian Mao and Muzhi Zhu and Zheng Sun and Shuaike Shen and Lin Yuanbo Wu and Hao Chen and Chunhua Shen},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=9UIGyJJpay}\n}", "github": "", "project": "", "reviewers": "MXeu;AKqf;unsL", "pdf_size": 6252283, "rating": "6;8;8", "confidence": "5;4;4", "soundness": "3;3;3", "contribution": "3;3;2", "presentation": "2;2;3", "wc_summary": "62;89;51", "wc_strengths": "13;65;76", "wc_weaknesses": "352;158;407", "wc_questions": "111;135;86", "wc_review": "538;447;620", "wc_reply_reviewers": "231;231;0", "wc_reply_authors": "2982;2357;1440", "reply_reviewers": "2;1;0", "reply_authors": "6;4;4", "rating_avg": [ 7.333333333333333, 0.9428090415820634 ], "confidence_avg": [ 4.333333333333333, 0.4714045207910317 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 67.33333333333333, 15.965240019770729 ], "wc_strengths_avg": [ 51.333333333333336, 27.475241379993168 ], "wc_weaknesses_avg": [ 305.6666666666667, 106.80303782612594 ], "wc_questions_avg": [ 110.66666666666667, 20.005554784164875 ], "wc_review_avg": [ 535.0, 70.65880459409618 ], "wc_reply_reviewers_avg": [ 154.0, 108.89444430272832 ], "wc_reply_authors_avg": [ 2259.6666666666665, 633.2699968330165 ], "reply_reviewers_avg": [ 1.0, 0.816496580927726 ], "reply_authors_avg": [ 4.666666666666667, 0.9428090415820634 ], "replies_avg": [ 25, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.9999999999999997, "gs_citation": 13, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5870346272431391349&as_sdt=5,38&sciodt=0,38&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=9UIGyJJpay", "pdf": "https://openreview.net/pdf?id=9UIGyJJpay", "email": "adelaide.edu.au;zju.edu.cn;swansea.ac.uk;;swansea.ac.uk;;", "author_num": 7, "aff_unique_index": "0;1;2;2", "aff_unique_norm": "University of Adelaide;Zhejiang University;Swansea University", "aff_unique_dep": ";;", "aff_unique_url": 
"https://www.adelaide.edu.au;https://www.zju.edu.cn;https://www.swansea.ac.uk", "aff_unique_abbr": "Adelaide;ZJU;Swansea", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;2;2", "aff_country_unique": "Australia;China;United Kingdom" }, { "title": "Most discriminative stimuli for functional cell type clustering", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19293", "id": "9W6KaAcYlr", "author_site": "Max F. Burg, Thomas Zenkel, Michaela Vystr\u010dilov\u00e1, Jonathan Oesterle, Larissa H\u00f6fling, Konstantin F. Willeke, Jan Lause, Sarah M\u00fcller, Paul Fahey, Zhiwei Ding, Kelli Restivo, Shashwat Sridhar, Tim Gollisch, Philipp Berens, Andreas Tolias, Thomas Euler, Matthias Bethge, Alexander S Ecker", "tldr": "", "abstract": "Identifying cell types and understanding their functional properties is crucial for unraveling the mechanisms underlying perception and cognition. In the retina, functional types can be identified by carefully selected stimuli, but this requires expert domain knowledge and biases the procedure towards previously known cell types. In the visual cortex, it is still unknown what functional types exist and how to identify them. Thus, for unbiased identification of the functional cell types in retina and visual cortex, new approaches are needed. Here we propose an optimization-based clustering approach using deep predictive models to obtain functional clusters of neurons using Most Discriminative Stimuli (MDS). Our approach alternates between stimulus optimization with cluster reassignment akin to an expectation-maximization algorithm. The algorithm recovers functional clusters in mouse retina, marmoset retina and macaque visual area V4. This demonstrates that our approach can successfully find discriminative stimuli across species, stages of the visual system and recording techniques. The resulting most discriminative stimuli can be used to assign functional cell types fast and on the fly, without the need to train complex predictive models or show a large natural scene dataset, paving the way for experiments that were previously limited by experimental time. Crucially, MDS are interpretable: they visualize the distinctive stimulus patterns that most unambiguously identify a specific type of neuron.", "keywords": "clustering;discriminative stimuli;interpretable;optimization;expectation-maximization;functional cell types;digital twins;feature visualization;pre-image search;maximally exciting image", "primary_area": "applications to neuroscience & cognitive science", "supplementary_material": "", "author": "Max F Burg;Thomas Zenkel;Michaela Vystr\u010dilov\u00e1;Jonathan Oesterle;Larissa H\u00f6fling;Konstantin Friedrich Willeke;Jan Lause;Sarah M\u00fcller;Paul G. Fahey;Zhiwei Ding;Kelli Restivo;Shashwat Sridhar;Tim Gollisch;Philipp Berens;Andreas S. 
Tolias;Thomas Euler;Matthias Bethge;Alexander S Ecker", "authorids": "~Max_F_Burg1;~Thomas_Zenkel1;~Michaela_Vystr\u010dilov\u00e11;~Jonathan_Oesterle1;~Larissa_H\u00f6fling1;~Konstantin_Friedrich_Willeke1;~Jan_Lause1;~Sarah_M\u00fcller1;~Paul_G._Fahey1;~Zhiwei_Ding1;~Kelli_Restivo1;~Shashwat_Sridhar1;~Tim_Gollisch1;~Philipp_Berens1;~Andreas_S._Tolias1;~Thomas_Euler1;~Matthias_Bethge1;~Alexander_S_Ecker1", "gender": ";M;;M;;M;;F;;;F;M;M;M;;;M;M", "homepage": ";;;;;https://sinzlab.org/team.html;;https://hertie.ai/data-science/team/members/sarah-mueller;;;;;https://www.retina.uni-goettingen.de/;http://www.berenslab.org;;https://eulerlab.de/;https://bethgelab.org;http://eckerlab.org", "dblp": ";;;;;;;;;;;;;78/3560;32/3057;196/3259;77/3005;26/7228", "google_scholar": ";https://scholar.google.de/citations?user=jn2QYvoAAAAJ;;https://scholar.google.de/citations?user=jGoWHKoAAAAJ;s4lDqV0AAAAJ;sc3jZTsAAAAJ;;https://scholar.google.de/citations?user=UGqIaQcAAAAJ;;;;e9m2XqgAAAAJ;https://scholar.google.de/citations?user=yrtgRRkAAAAJ;https://scholar.google.de/citations?user=lPQLk3QAAAAJ;;https://scholar.google.de/citations?user=XeqGapgAAAAJ;https://scholar.google.com/citations?hl=en;VgYU_m8AAAAJ", "orcid": ";;;0000-0001-8919-1445;;0000-0003-4445-6408;;0000-0003-1500-8673;;;;0000-0002-8837-8555;0000-0003-3998-533X;;;0000-0002-4567-6966;;0000-0003-2392-5105", "linkedin": ";;michaela-vystr\u010dilov\u00e1-4b7a601ba/;;;;;;;;kellirestivo/;;;;;thomas-euler-9b67102b2/;;alexecker/", "or_profile": "~Max_F_Burg1;~Thomas_Zenkel1;~Michaela_Vystr\u010dilov\u00e11;~Jonathan_Oesterle1;~Larissa_H\u00f6fling1;~Konstantin_Friedrich_Willeke1;~Jan_Lause1;~Sarah_M\u00fcller1;~Paul_G._Fahey1;~Zhiwei_Ding1;~Kelli_Restivo1;~Shashwat_Sridhar1;~Tim_Gollisch1;~Philipp_Berens1;~Andreas_S._Tolias1;~Thomas_Euler1;~Matthias_Bethge1;~Alexander_S_Ecker1", "aff": ";;Georg-August Universit\u00e4t G\u00f6ttingen;Eberhard-Karls-Universit\u00e4t T\u00fcbingen;;University of Tuebingen;;University of Tuebingen;;;Baylor College of Medicine;Georg-August Universit\u00e4t G\u00f6ttingen;Georg-August Universit\u00e4t G\u00f6ttingen;University of Tuebingen;Baylor College of Medicine;University of Tuebingen;University of Tuebingen;Max Planck Institute for Dynamics and Self-Organization", "aff_domain": ";;uni-goettingen.de;uni-tuebingen.de;;uni-tuebingen.de;;uni-tuebingen.de;;;bcm.edu;uni-goettingen.de;uni-goettingen.de;uni-tuebingen.de;bcm.edu;uni-tuebingen.de;uni-tuebingen.de;ds.mpg.de", "position": ";;PhD student;Postdoc;;PhD student;;PhD student;;;PhD student;PhD student;Full Professor;Full Professor;Professor;Full Professor;Full Professor;Principal Researcher", "bibtex": "@inproceedings{\nburg2024most,\ntitle={Most discriminative stimuli for functional cell type clustering},\nauthor={Max F Burg and Thomas Zenkel and Michaela Vystr{\\v{c}}ilov{\\'a} and Jonathan Oesterle and Larissa H{\\\"o}fling and Konstantin Friedrich Willeke and Jan Lause and Sarah M{\\\"u}ller and Paul G. Fahey and Zhiwei Ding and Kelli Restivo and Shashwat Sridhar and Tim Gollisch and Philipp Berens and Andreas S. 
Tolias and Thomas Euler and Matthias Bethge and Alexander S Ecker},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=9W6KaAcYlr}\n}", "github": "", "project": "", "reviewers": "NLuU;FrCb;KEew;69wH", "pdf_size": 1730049, "rating": "5;5;6;6", "confidence": "2;2;4;2", "soundness": "2;2;3;3", "contribution": "3;2;3;2", "presentation": "2;2;3;3", "wc_summary": "53;81;114;69", "wc_strengths": "25;35;77;30", "wc_weaknesses": "130;92;125;63", "wc_questions": "29;150;30;193", "wc_review": "237;358;346;355", "wc_reply_reviewers": "146;353;267;0", "wc_reply_authors": "1292;825;1450;825", "reply_reviewers": "1;1;1;0", "reply_authors": "3;2;3;2", "rating_avg": [ 5.5, 0.5 ], "confidence_avg": [ 2.5, 0.8660254037844386 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 79.25, 22.38721733489895 ], "wc_strengths_avg": [ 41.75, 20.656415468323637 ], "wc_weaknesses_avg": [ 102.5, 27.07858932810201 ], "wc_questions_avg": [ 100.5, 72.6102609828666 ], "wc_review_avg": [ 324.0, 50.42320894191484 ], "wc_reply_reviewers_avg": [ 191.5, 132.782717248895 ], "wc_reply_authors_avg": [ 1098.0, 278.6565987016995 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 2.5, 0.5 ], "replies_avg": [ 21, 0 ], "authors#_avg": [ 18, 0 ], "corr_rating_confidence": 0.5773502691896257, "gs_citation": 4, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=15776683461126722528&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 9, "openreview": "https://openreview.net/forum?id=9W6KaAcYlr", "pdf": "https://openreview.net/pdf?id=9W6KaAcYlr", "email": ";;uni-goettingen.de;uni-tuebingen.de;;uni-tuebingen.de;;uni-tuebingen.de;;;bcm.edu;uni-goettingen.de;uni-goettingen.de;uni-tuebingen.de;bcm.edu;uni-tuebingen.de;uni-tuebingen.de;ds.mpg.de", "author_num": 18, "aff_unique_index": "0;1;2;2;3;0;0;2;3;2;2;4", "aff_unique_norm": "Georg-August Universit\u00e4t G\u00f6ttingen;Eberhard Karls University of T\u00fcbingen;University of Tuebingen;Baylor College of Medicine;Max Planck Institute for Dynamics and Self-Organization", "aff_unique_dep": ";;;;", "aff_unique_url": "https://www.uni-goettingen.de;https://www.uni-tuebingen.de/;https://www.uni-tuebingen.de/;https://www.bcm.edu;https://www.mpids.org", "aff_unique_abbr": "GAU;Uni T\u00fcbingen;Uni T\u00fcbingen;BCM;MPIDS", "aff_campus_unique_index": "1", "aff_campus_unique": ";T\u00fcbingen", "aff_country_unique_index": "0;0;0;0;1;0;0;0;1;0;0;0", "aff_country_unique": "Germany;United States" }, { "title": "Zipformer: A faster and better encoder for automatic speech recognition", "status": "Oral", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19292", "id": "9WD9KwssyT", "author_site": "Zengwei Yao, Liyong Guo, Xiaoyu Yang, Wei Kang, Fangjun Kuang, Yifan Yang, Zengrui Jin, Long Lin, Daniel Povey", "tldr": "", "abstract": "The Conformer has become the most popular encoder model for automatic speech recognition (ASR). It adds convolution modules to a transformer to learn both local and global dependencies. In this work we describe a faster, more memory-efficient, and better-performing transformer, called Zipformer. 
Modeling changes include: 1) a U-Net-like encoder structure where middle stacks operate at lower frame rates; 2) reorganized block structure with more modules, within which we re-use attention weights for efficiency; 3) a modified form of LayerNorm called BiasNorm allows us to retain some length information; 4) new activation functions SwooshR and SwooshL work better than Swish. We also propose a new optimizer, called ScaledAdam, which scales the update by each tensor's current scale to keep the relative change about the same, and also explicitly learns the parameter scale. It achieves faster convergence and better performance than Adam. Extensive experiments on LibriSpeech, Aishell-1, and WenetSpeech datasets demonstrate the effectiveness of our proposed Zipformer over other state-of-the-art ASR models. Our code is publicly available at https://github.com/k2-fsa/icefall.", "keywords": "Zipformer;ScaledAdam;automatic speech recognition", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Zengwei Yao;Liyong Guo;Xiaoyu Yang;Wei Kang;Fangjun Kuang;Yifan Yang;Zengrui Jin;Long Lin;Daniel Povey", "authorids": "~Zengwei_Yao1;~Liyong_Guo1;~Xiaoyu_Yang7;~Wei_Kang3;~Fangjun_Kuang1;~Yifan_Yang11;~Zengrui_Jin1;~Long_Lin1;~Daniel_Povey2", "gender": "M;;M;M;M;M;;F;", "homepage": ";;;https://pkufool.github.io/;http://github.com/csukuangfj;https://yfyeung.github.io/;;https://github.com/liliana404;", "dblp": ";;;;;83/89-5;;;", "google_scholar": "f3Eo9S0AAAAJ;2nME_lQAAAAJ;dQQ5_4wAAAAJ;dyIpw7kAAAAJ;3JCBRi8AAAAJ;https://scholar.google.com/citations?hl=zh-CN;;;", "orcid": ";;;;;0009-0003-0588-1812;;;", "linkedin": ";;xiaoyu-yang-602271193/;;;yifan-yang-290ba624b;;;", "or_profile": "~Zengwei_Yao1;~Liyong_Guo1;~Xiaoyu_Yang7;~Wei_Kang3;~Fangjun_Kuang1;~Yifan_Yang11;~Zengrui_Jin1;~Long_Lin1;~Daniel_Povey2", "aff": ";;Xiaomi Corp.;Xiaomi Corp.;;Shanghai Jiaotong University;;;", "aff_domain": ";;xiaomi.com;xiaomi.com;;sjtu.edu.cn;;;", "position": ";;Researcher;Researcher;;PhD student;;;", "bibtex": "@inproceedings{\nyao2024zipformer,\ntitle={Zipformer: A faster and better encoder for automatic speech recognition},\nauthor={Zengwei Yao and Liyong Guo and Xiaoyu Yang and Wei Kang and Fangjun Kuang and Yifan Yang and Zengrui Jin and Long Lin and Daniel Povey},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=9WD9KwssyT}\n}", "github": "", "project": "", "reviewers": "2d3G;hvPD;6jVU;UyUP", "pdf_size": 511626, "rating": "6;8;8;8", "confidence": "5;4;5;4", "soundness": "3;3;3;3", "contribution": "3;4;3;3", "presentation": "3;3;2;3", "wc_summary": "69;27;143;74", "wc_strengths": "36;56;56;43", "wc_weaknesses": "669;87;280;56", "wc_questions": "44;99;374;33", "wc_review": "818;269;853;206", "wc_reply_reviewers": "0;42;0;0", "wc_reply_authors": "763;437;791;404", "reply_reviewers": "0;2;0;0", "reply_authors": "1;2;1;1", "rating_avg": [ 7.5, 0.8660254037844386 ], "confidence_avg": [ 4.5, 0.5 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 3.25, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 78.25, 41.601532423698046 ], "wc_strengths_avg": [ 47.75, 8.613216588476108 ], "wc_weaknesses_avg": [ 273.0, 244.20790323001424 ], "wc_questions_avg": [ 137.5, 138.81372410536358 ], "wc_review_avg": [ 536.5, 300.08373831315816 ], "wc_reply_reviewers_avg": [ 10.5, 18.186533479473212 ], "wc_reply_authors_avg": [ 598.75,
178.90552674526296 ], "reply_reviewers_avg": [ 0.5, 0.8660254037844386 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 9, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 97, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=4991886084904422681&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 9, "openreview": "https://openreview.net/forum?id=9WD9KwssyT", "pdf": "https://openreview.net/pdf?id=9WD9KwssyT", "email": ";;xiaomi.com;xiaomi.com;;sjtu.edu.cn;;;", "author_num": 9, "aff_unique_index": "0;0;1", "aff_unique_norm": "Xiaomi Corporation;Shanghai Jiao Tong University", "aff_unique_dep": ";", "aff_unique_url": "https://www.xiaomi.com;https://www.sjtu.edu.cn", "aff_unique_abbr": "Xiaomi;SJTU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "China" }, { "id": "9Wy6pLNQcG", "title": "RegionSpot: Unleashing the Power of Frozen Foundation Models for Open-World Region Understanding", "track": "main", "status": "Reject", "tldr": "", "abstract": "Understanding the semantics of individual regions or patches within unconstrained images, such as in open-world object detection, represents a critical yet challenging task in computer vision. Building on the success of powerful image-level vision-language (ViL) foundation models like CLIP, recent efforts have sought to harness their capabilities by either training a contrastive model from scratch with an extensive collection of region-label pairs or aligning the outputs of a detection model with image-level representations of region proposals. Despite notable progress, these approaches are plagued by computationally intensive training requirements, susceptibility to data noise, and a deficiency in contextual information.\n\nTo address these limitations, we explore the synergistic potential of off-the-shelf foundation models, leveraging their strengths in localization and semantics. We introduce a novel, generic, and efficient region recognition architecture, named \\textit{RegionSpot}, designed to integrate position-aware localization knowledge from a localization foundation model (e.g., SAM) with multimodal information extracted from a ViL model (e.g., CLIP). To fully exploit pretrained knowledge while minimizing training overhead, we keep both foundation models frozen, focusing optimization efforts solely on a lightweight attention-based knowledge integration module.\n\nThrough extensive experiments in the context of open-world object recognition, our \\textit{RegionSpot} demonstrates significant performance improvements over prior alternatives, while also providing substantial computational savings. For instance, our model can be trained with 3 million data samples in 1 day using 8 V100 GPUs. Our model outperforms GLIP by 6.5\\% in mean average precision (mAP), with an even larger margin of 14.8\\% for more challenging and rare categories.
Our source code will be made publicly available.", "keywords": "Open world Region Understanding", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Haosen Yang;Chuofan Ma;Bin Wen;Yi Jiang;Zehuan Yuan;Xiatian Zhu", "authorids": "~Haosen_Yang1;~Chuofan_Ma1;~Bin_Wen1;~Yi_Jiang2;~Zehuan_Yuan1;~Xiatian_Zhu3", "gender": "M;;M;M;M;", "homepage": ";https://machuofan.github.io/;;https://enjoyyi.github.io/;https://shallowyuan.github.io/;https://x-up-lab.github.io", "dblp": "245/9949-3;330/3312;;;227/3298;128/7935", "google_scholar": "https://scholar.google.com/citations?hl=en;hgKtgWAAAAAJ;https://scholar.google.com/citations?view_op=list_works;https://scholar.google.com.hk/citations?user=6dikuoYAAAAJ;;ZbA-z1cAAAAJ", "orcid": ";;;0000-0002-2133-8719;;0000-0002-9284-2955", "linkedin": ";;;;;", "or_profile": "~Haosen_Yang1;~Chuofan_Ma1;~Bin_Wen1;~Yi_Jiang2;~Zehuan_Yuan1;~Xiatian_Zhu3", "aff": "University of Surrey;University of Hong Kong;;Bytedance;ByteDance Inc.;University of Surrey", "aff_domain": "surrey.ac.uk;hku.hk;;bytedance.com;bytedance.com;surrey.ac.uk", "position": "PhD student;PhD student;;Researcher;Researcher;Associate Professor", "bibtex": "@misc{\nyang2024regionspot,\ntitle={RegionSpot: Unleashing the Power of Frozen Foundation Models for Open-World Region Understanding},\nauthor={Haosen Yang and Chuofan Ma and Bin Wen and Yi Jiang and Zehuan Yuan and Xiatian Zhu},\nyear={2024},\nurl={https://openreview.net/forum?id=9Wy6pLNQcG}\n}", "github": "", "project": "", "reviewers": "3vj6;Tjjg;PEMU;UsjU", "site": "https://openreview.net/forum?id=9Wy6pLNQcG", "pdf_size": 2420418, "rating": "3;5;5;6", "confidence": "4;4;3;4", "soundness": "3;3;2;3", "contribution": "2;2;2;3", "presentation": "3;2;2;4", "wc_summary": "71;20;65;77", "wc_strengths": "39;61;105;71", "wc_weaknesses": "157;215;216;155", "wc_questions": "33;21;37;46", "wc_review": "300;317;423;349", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "882;768;705;498", "reply_reviewers": "0;0;0;0", "reply_authors": "2;2;2;1", "rating_avg": [ 4.75, 1.0897247358851685 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.82915619758885 ], "wc_summary_avg": [ 58.25, 22.487496525847426 ], "wc_strengths_avg": [ 69.0, 23.790754506740637 ], "wc_weaknesses_avg": [ 185.75, 29.76050234791073 ], "wc_questions_avg": [ 34.25, 8.98262211161084 ], "wc_review_avg": [ 347.25, 47.14008379288268 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 713.25, 139.53023865814893 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.75, 0.4330127018922193 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.13245323570650439, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:0fp0BEd_PgMJ:scholar.google.com/&scioq=RegionSpot:+Unleashing+the+Power+of+Frozen+Foundation+Models+for+Open-World+Region+Understanding&hl=en&as_sdt=0,44", "gs_version_total": 0, "aff_unique_index": "0;1;2;2;0", "aff_unique_norm": "University of Surrey;University of Hong Kong;ByteDance", "aff_unique_dep": ";;", "aff_unique_url": "https://www.surrey.ac.uk;https://www.hku.hk;https://www.bytedance.com", "aff_unique_abbr": "Surrey;HKU;Bytedance", "aff_campus_unique_index": "1", "aff_campus_unique": ";Hong Kong SAR", "aff_country_unique_index": "0;1;1;1;0", "aff_country_unique": "United 
Kingdom;China" }, { "id": "9XdLlbxZCC", "title": "MC-JEPA: A Joint-Embedding Predictive Architecture for Self-Supervised Learning of Motion and Content Features", "track": "main", "status": "Reject", "tldr": "", "abstract": "Self-supervised learning of visual representations has been focusing on learning content features, which do not capture object motion or location, and focus on identifying and differentiating objects in images and videos. On the other hand, optical flow estimation is a task that does not involve understanding the content of the images on which it is estimated. We unify the two approaches and introduce MC-JEPA, a joint-embedding predictive architecture and self-supervised learning approach to jointly learn optical flow and content features within a shared encoder, demonstrating that the two associated objectives; the optical flow estimation objective and the self-supervised learning objective; benefit from each other and thus learn content features that incorporate motion information. The proposed approach achieves performance on-par with existing unsupervised optical flow benchmarks, as well as with common self-supervised learning approaches on downstream tasks such as semantic segmentation of images and videos.", "keywords": "self-supervised learning", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/7567d0bbed2fe4d9de9c36c3826dbfba4ba6f6e2.pdf", "author": "Adrien Bardes;Jean Ponce;Yann LeCun", "authorids": "~Adrien_Bardes1;~Jean_Ponce1;~Yann_LeCun1", "gender": "M;M;M", "homepage": ";http://www.di.ens.fr/~ponce/;http://yann.lecun.com", "dblp": "292/3848.html;p/JeanPonce;l/YannLeCun", "google_scholar": "SvRU8F8AAAAJ;https://scholar.google.com.tw/citations?user=vC2vywcAAAAJ;WLN3QrAAAAAJ", "orcid": ";;", "linkedin": "adrien-bardes-48a080129/;;", "or_profile": "~Adrien_Bardes1;~Jean_Ponce1;~Yann_LeCun1", "aff": "Meta Facebook;Ecole Normale Sup\u00e9rieure de Paris;New York University", "aff_domain": "meta.com;ens.fr;nyu.edu", "position": "Researcher;Full Professor;Full Professor", "bibtex": "@misc{\nbardes2024mcjepa,\ntitle={{MC}-{JEPA}: A Joint-Embedding Predictive Architecture for Self-Supervised Learning of Motion and Content Features},\nauthor={Adrien Bardes and Jean Ponce and Yann LeCun},\nyear={2024},\nurl={https://openreview.net/forum?id=9XdLlbxZCC}\n}", "github": "", "project": "", "reviewers": "arP2;q59r;Jf74;RRax", "site": "https://openreview.net/forum?id=9XdLlbxZCC", "pdf_size": 5198063, "rating": "3;5;6;6", "confidence": "4;4;4;3", "soundness": "3;3;3;3", "contribution": "2;3;2;3", "presentation": "2;3;2;2", "wc_summary": "33;117;63;34", "wc_strengths": "21;225;58;78", "wc_weaknesses": "167;302;228;26", "wc_questions": "2;2;103;129", "wc_review": "223;646;452;267", "wc_reply_reviewers": "0;0;0;42", "wc_reply_authors": "506;667;888;403", "reply_reviewers": "0;0;0;1", "reply_authors": "1;1;2;1", "rating_avg": [ 5.0, 1.224744871391589 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 61.75, 34.098203765007916 ], "wc_strengths_avg": [ 95.5, 77.51290215183535 ], "wc_weaknesses_avg": [ 180.75, 101.32959834125467 ], "wc_questions_avg": [ 59.0, 57.736470276593806 ], "wc_review_avg": [ 397.0, 167.48283494137542 ], "wc_reply_reviewers_avg": [ 10.5, 18.186533479473212 ], "wc_reply_authors_avg": [ 616.0, 183.06692765215678 ], 
"reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.4714045207910316, "gs_citation": 27, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11805965224862551060&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 3, "aff_unique_index": "0;1;2", "aff_unique_norm": "Meta;Ecole Normale Sup\u00e9rieure de Paris;New York University", "aff_unique_dep": "Meta Platforms, Inc.;;", "aff_unique_url": "https://meta.com;https://www.ens.fr;https://www.nyu.edu", "aff_unique_abbr": "Meta;ENS Paris;NYU", "aff_campus_unique_index": "1", "aff_campus_unique": ";Paris", "aff_country_unique_index": "0;1;0", "aff_country_unique": "United States;France" }, { "id": "9Z0yB8rmQ2", "title": "Lyra: Orchestrating Dual Correction in Automated Theorem Proving", "track": "main", "status": "Reject", "tldr": "", "abstract": "Large Language Models (LLMs) present an intriguing avenue for exploration in the field of formal theorem proving. Nevertheless, their full potential, particularly concerning the mitigation of hallucinations and refinement through prover error messages, remains an area that has yet to be thoroughly investigated. To enhance the effectiveness of LLMs in the field, we introduce the Lyra, a new framework that employs two distinct correction mechanisms: Tool Correction (TC) and Conjecture Correction (CC). To implement Tool Correction in the post-processing of formal proofs, we leverage prior knowledge to utilize predefined prover tools (e.g., Sledgehammer) for guiding the replacement of incorrect tools. Tool Correction significantly contributes to mitigating hallucinations, thereby improving the overall accuracy of the proof. In addition, we introduce Conjecture Correction, an error feedback mechanism designed to interact with prover to refine formal proof conjectures with prover error messages. Compared to the previous refinement framework, the proposed Conjecture Correction refines generation with instruction but does not collect paired (generation, error & refinement) prompts. Our method has achieved state-of-the-art (SOTA) performance on both miniF2F validation (48.0% \u2192 55.3%) and test (45.5% \u2192 51.2%). We also present 3 IMO problems solved by Lyra. 
We believe Tool Correction (post-process for hallucination mitigation) and Conjecture Correction (subgoal adjustment from interaction with environment) could provide a promising avenue for future research in this field.", "keywords": "Theorem proving;large language model;neuro-symbolic method;automated theorem provers;miniF2F", "primary_area": "neurosymbolic & hybrid AI systems (physics-informed, logic & formal reasoning, etc.)", "supplementary_material": "/attachment/f09b60fa30c45e1aa100c31928288548d4ecb1a2.zip", "author": "Chuanyang Zheng;Haiming Wang;Enze Xie;Zhengying Liu;Jiankai Sun;Huajian Xin;Jianhao Shen;Zhenguo Li;Yu Li", "authorids": "~Chuanyang_Zheng3;~Haiming_Wang1;~Enze_Xie1;~Zhengying_Liu2;~Jiankai_Sun6;~Huajian_Xin1;~Jianhao_Shen1;~Zhenguo_Li1;~Yu_Li1", "gender": "M;M;M;M;;M;M;M;M", "homepage": "https://chuanyang-zheng.github.io/;;https://xieenze.github.io/;;;https://xinhuajian.wordpress.com/;;http://www.ee.columbia.edu/~zgli/;https://sites.google.com/view/liyu1995", "dblp": ";97/604;218/5441;241/1782;121/4211;356/3551;217/2324;23/6479;", "google_scholar": "LWwh7K4AAAAJ;zDPqP6AAAAAJ;42MVVPgAAAAJ;http:// DFme0joAAAAJ;726MCb8AAAAJ;E5M9x8wAAAAJ;9fppVAUAAAAJ;XboZC1AAAAAJ;8YHZx-AAAAAJ", "orcid": ";;;;;;;;0000-0002-3664-6722", "linkedin": ";;;;;;;;yuli1995/", "or_profile": "~Chuanyang_Zheng3;~Haiming_Wang1;~Enze_Xie1;~Zhengying_Liu2;~Jiankai_Sun6;~Huajian_Xin1;~Jianhao_Shen1;~Zhenguo_Li1;~Yu_Li1", "aff": "The Chinese University of Hong Kong;SUN YAT-SEN UNIVERSITY;Huawei Noah's Ark Lab;Huawei Technologies Ltd.;Stanford University;University of Edinburgh, University of Edinburgh;;Huawei Noah's Ark Lab;Department of Computer Science and Engineering, The Chinese University of Hong Kong", "aff_domain": "cse.cuhk.edu.hk;sysu.edu.cn;huawei.com;huawei.com;stanford.edu;ed.ac.uk;;huawei.com;cse.cuhk.edu.hk", "position": "PhD student;PhD student;Researcher;Researcher;PhD student;PhD student;;Principal Researcher;Assistant Professor", "bibtex": "@misc{\nzheng2024lyra,\ntitle={Lyra: Orchestrating Dual Correction in Automated Theorem Proving},\nauthor={Chuanyang Zheng and Haiming Wang and Enze Xie and Zhengying Liu and Jiankai Sun and Huajian Xin and Jianhao Shen and Zhenguo Li and Yu Li},\nyear={2024},\nurl={https://openreview.net/forum?id=9Z0yB8rmQ2}\n}", "github": "", "project": "", "reviewers": "bwwN;NmsF;1Jjk;Wc5t", "site": "https://openreview.net/forum?id=9Z0yB8rmQ2", "pdf_size": 1024887, "rating": "6;6;6;6", "confidence": "5;3;4;5", "soundness": "3;3;3;4", "contribution": "3;2;3;2", "presentation": "3;3;3;4", "wc_summary": "42;132;59;159", "wc_strengths": "23;111;37;37", "wc_weaknesses": "183;355;47;45", "wc_questions": "1;76;225;106", "wc_review": "249;674;368;347", "wc_reply_reviewers": "31;795;220;0", "wc_reply_authors": "331;5450;1576;2298", "reply_reviewers": "1;5;2;0", "reply_authors": "2;8;5;6", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 4.25, 0.82915619758885 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 98.0, 48.821101994936576 ], "wc_strengths_avg": [ 52.0, 34.539832078341085 ], "wc_weaknesses_avg": [ 157.5, 127.00688957690446 ], "wc_questions_avg": [ 102.0, 80.65667982256646 ], "wc_review_avg": [ 409.5, 159.17678850887776 ], "wc_reply_reviewers_avg": [ 261.5, 319.3184147524223 ], "wc_reply_authors_avg": [ 2413.75, 1888.9074057507426 ], "reply_reviewers_avg": [ 2.0, 1.8708286933869707 ], "reply_authors_avg": [ 5.25, 2.165063509461097 ], "replies_avg": [ 39, 0 ], 
"authors#_avg": [ 9, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 19, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=17828337707468607238&as_sdt=400005&sciodt=0,14&hl=en", "gs_version_total": 4, "aff_unique_index": "0;1;2;2;3;4;2;0", "aff_unique_norm": "Chinese University of Hong Kong;Sun Yat-sen University;Huawei;Stanford University;University of Edinburgh", "aff_unique_dep": ";;Noah's Ark Lab;;", "aff_unique_url": "https://www.cuhk.edu.hk;http://www.sysu.edu.cn;https://www.huawei.com;https://www.stanford.edu;https://www.ed.ac.uk", "aff_unique_abbr": "CUHK;SYSU;Huawei;Stanford;Edinburgh", "aff_campus_unique_index": "0;2;0", "aff_campus_unique": "Hong Kong SAR;;Stanford", "aff_country_unique_index": "0;0;0;0;1;2;0;0", "aff_country_unique": "China;United States;United Kingdom" }, { "title": "TOSS: High-quality Text-guided Novel View Synthesis from a Single Image", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19291", "id": "9ZUYJpvIys", "author_site": "Yukai Shi, Jianan Wang, He CAO, Boshi Tang, Xianbiao Qi, Tianyu Yang, Yukun Huang, Shilong Liu, Lei Zhang, Heung-Yeung Shum", "tldr": "", "abstract": "In this paper, we present TOSS, which introduces text to the task of novel view synthesis (NVS) from just a single RGB image. \nWhile Zero123 has demonstrated impressive zero-shot open-set NVS capabilities, it treats NVS as a pure image-to-image translation problem. This approach suffers from the challengingly under-constrained nature of single-view NVS: the process lacks means of explicit user control and often result in implausible NVS generations.\nTo address this limitation, TOSS uses text as high-level semantic information to constrain the NVS solution space.\nTOSS fine-tunes text-to-image Stable Diffusion pre-trained on large-scale text-image pairs and introduces modules specifically tailored to image and camera pose conditioning, as well as dedicated training for pose correctness and preservation of fine details. \nComprehensive experiments are conducted with results showing that our proposed TOSS outperforms Zero123 with higher-quality NVS results and faster convergence. 
We further support these results with comprehensive ablations that underscore the effectiveness and potential of \nthe introduced semantic guidance and architecture design.", "keywords": "novel view synthesis;3D object synthesis;diffusion model", "primary_area": "generative models", "supplementary_material": "/attachment/01aebc58b4b4450b01b5ff07c9d36c98febffd11.zip", "author": "Yukai Shi;Jianan Wang;He CAO;Boshi Tang;Xianbiao Qi;Tianyu Yang;Yukun Huang;Shilong Liu;Lei Zhang;Heung-Yeung Shum", "authorids": "~Yukai_Shi3;~Jianan_Wang2;~He_CAO1;~Boshi_Tang1;~Xianbiao_Qi2;~Tianyu_Yang2;~Yukun_Huang1;~Shilong_Liu1;~Lei_Zhang23;~Heung-Yeung_Shum1", "gender": ";F;M;M;M;M;M;M;M;M", "homepage": "https://shiyukai26.github.io/info/;https://scholar.google.com/citations?user=mt5mvZ8AAAAJ&hl=en;https://github.com/CiaoHe;https://github.com/TangYucopper;https://www.linkedin.com/in/xianbiao-qi-39617727/;https://tianyu-yang.com/;;https://www.lsl.zone;https://www.microsoft.com/en-us/research/people/hshum/;https://www.leizhang.org/", "dblp": ";49/6053,;;;118/3741;120/8076-3.html;186/1316;;;z/LeiZhang", "google_scholar": "oQXfkSQAAAAJ;mt5mvZ8AAAAJ;tLZ2V2kAAAAJ;;odjSydQAAAAJ;BXsWsf8AAAAJ;lHb5gzoAAAAJ;nkSVY3MAAAAJ;;fIlGZToAAAAJ", "orcid": ";;;;;;0000-0002-5322-2884;;;", "linkedin": ";;he-cao/;;;;;;;", "or_profile": "~Yukai_Shi3;~Jianan_Wang2;~He_CAO1;~Boshi_Tang1;~Xianbiao_Qi2;~Tianyu_Yang2;~Yukun_Huang1;~Shilong_Liu1;~Heung-Yeung_Shum1;~Lei_Zhang1", "aff": "Tsinghua University;International Digital Economy Academy (IDEA);Hong Kong University of Science and Technology;Tsinghua University;International Digital Economy Academy;International Digital Economy Academy;University of Hong Kong;NVIDIA;;International Digital Economy Academy", "aff_domain": "mail.tsinghua.edu.cn;idea.edu.cn;ust.hk;mails.tsinghua.edu.cn;idea.edu.cn;idea.edu.cn;hku.hk;nvidia.com;;idea.edu.cn", "position": "PhD student;Researcher;PhD student;MS student;Researcher;Researcher;Postdoc;Research Intern;;Chief Scientist", "bibtex": "@inproceedings{\nshi2024toss,\ntitle={{TOSS}: High-quality Text-guided Novel View Synthesis from a Single Image},\nauthor={Yukai Shi and Jianan Wang and He CAO and Boshi Tang and Xianbiao Qi and Tianyu Yang and Yukun Huang and Shilong Liu and Lei Zhang and Heung-Yeung Shum},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=9ZUYJpvIys}\n}", "github": "", "project": "", "reviewers": "LBZY;Givb;wyYi;gFkU", "pdf_size": 8550065, "rating": "6;6;6;6", "confidence": "4;2;4;5", "soundness": "3;3;3;3", "contribution": "3;3;2;3", "presentation": "2;3;3;3", "wc_summary": "126;74;84;40", "wc_strengths": "89;106;105;64", "wc_weaknesses": "236;135;127;122", "wc_questions": "38;21;33;3", "wc_review": "489;336;349;229", "wc_reply_reviewers": "33;14;42;46", "wc_reply_authors": "255;261;449;279", "reply_reviewers": "1;1;1;1", "reply_authors": "1;1;1;1", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 3.75, 1.0897247358851685 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 81.0, 30.675723300355934 ], "wc_strengths_avg": [ 91.0, 16.98528775146303 ], "wc_weaknesses_avg": [ 155.0, 46.994680550036726 ], "wc_questions_avg": [ 23.75, 13.47915056670857 ], "wc_review_avg": [ 350.75, 92.4077242442427 ], "wc_reply_reviewers_avg": [ 33.75, 12.336429791475327 ], "wc_reply_authors_avg": [ 311.0, 80.16233529532433 ], "reply_reviewers_avg": [ 1.0, 0.0 ], 
"reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 10, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 18, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=13024502958196107678&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=9ZUYJpvIys", "pdf": "https://openreview.net/pdf?id=9ZUYJpvIys", "email": "mail.tsinghua.edu.cn;idea.edu.cn;ust.hk;mails.tsinghua.edu.cn;idea.edu.cn;idea.edu.cn;hku.hk;nvidia.com;;idea.edu.cn", "author_num": 10, "aff_unique_index": "0;1;2;0;1;1;3;4;1", "aff_unique_norm": "Tsinghua University;International Digital Economy Academy;Hong Kong University of Science and Technology;University of Hong Kong;NVIDIA", "aff_unique_dep": ";;;;NVIDIA Corporation", "aff_unique_url": "https://www.tsinghua.edu.cn;;https://www.ust.hk;https://www.hku.hk;https://www.nvidia.com", "aff_unique_abbr": "THU;IDEA;HKUST;HKU;NVIDIA", "aff_campus_unique_index": "1;1", "aff_campus_unique": ";Hong Kong SAR", "aff_country_unique_index": "0;0;0;0;2", "aff_country_unique": "China;;United States" }, { "id": "9ZUz4M55Up", "title": "Revisiting the Lottery Ticket Hypothesis for Pre-trained Networks", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "The lottery ticket hypothesis (LTH) suggests the possibility of pruning neural networks at initialization. Our study revisits LTH in the context of transfer learning, unveiling novel insights surpassing prior studies limited to LTH's application in pre-trained networks. To begin, our study shows that multiple pruning-at-initialization methods are likely to find worse pruning masks than a simple magnitude-based pruning method for pre-trained networks, owing to an inaccurate approximation of the influence of each weight. Iterative magnitude pruning (IMP) can find trainable subnetworks (winning tickets) even for pre-trained networks, however, IMP is a costly algorithm that requires multiple training cycles. Given that trainable subnetworks can be identified only when the initial network withstands the training's inherent randomness, and considering the superior resilience of pre-trained networks to this randomness compared to randomly initialized networks, we empirically demonstrate the enhanced efficiency of identifying trainable subnetworks within the framework of transfer learning. By challenging conventional wisdom surrounding gradual magnitude pruning (GMP), we reveal its capability to significantly enhance the trade-off between transfer learning performance and sparsity in terms of pruning-at-initialization. Our experiments, which involve various models such as convolutional neural networks and transformers, across both vision and language domains, demonstrate that GMP can identify trainable subnetworks for pre-trained networks at a significantly lower cost than IMP. For example, for ImageNet pre-trained ResNet-50, at a pruning ratio of 99%, GMP achieves comparable or superior results to IMP on the CIFAR, Caltech-101, Oxford-IIIT Pets, and Stanford Cars datasets, with 42 times less computation than IMP. 
Ultimately, we provide empirical evidence that the methodological distinction between the LTH-based and conventional pruning methods can be blurred for pre-trained networks.", "keywords": "lottery ticket hypothesis;transfer learning", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/ec75867c154a5733f28b2b74a342bd509efee0eb.zip", "author": "Saehyung Lee;Se Jung Kwon;Byeongwook Kim;Sungroh Yoon", "authorids": "~Saehyung_Lee1;~Se_Jung_Kwon1;~Byeongwook_Kim1;~Sungroh_Yoon1", "gender": "M;M;;", "homepage": ";;;http://ailab.snu.ac.kr", "dblp": "260/0442;119/5676;220/5405;99/1474", "google_scholar": "nS24h74AAAAJ;https://scholar.google.co.kr/citations?user=8eTxKOkAAAAJ;https://scholar.google.co.kr/citations?user=OjfC7gUAAAAJ;Bphl_fIAAAAJ", "orcid": ";;;0000-0002-2367-197X", "linkedin": ";se-jung-kwon-305503175/;;", "or_profile": "~Saehyung_Lee1;~Se_Jung_Kwon1;~Byeongwook_Kim1;~Sungroh_Yoon1", "aff": "Adobe Systems;NAVER Cloud;NAVER CLOUD;Seoul National University", "aff_domain": "adobe.com;navercorp.com;navercorp.com;snu.ac.kr", "position": "Intern;AI Researcher;Researcher;Full Professor", "bibtex": "@misc{\nlee2024revisiting,\ntitle={Revisiting the Lottery Ticket Hypothesis for Pre-trained Networks},\nauthor={Saehyung Lee and Se Jung Kwon and Byeongwook Kim and Sungroh Yoon},\nyear={2024},\nurl={https://openreview.net/forum?id=9ZUz4M55Up}\n}", "github": "", "project": "", "reviewers": "mi9v;kmMF;V5JA;6QxM", "site": "https://openreview.net/forum?id=9ZUz4M55Up", "pdf_size": 784253, "rating": "3;3;5;5", "confidence": "4;5;3;4", "soundness": "1;2;3;3", "contribution": "1;2;2;3", "presentation": "2;3;3;4", "wc_summary": "75;94;110;109", "wc_strengths": "19;54;121;95", "wc_weaknesses": "175;251;182;313", "wc_questions": "2;17;4;8", "wc_review": "271;416;417;525", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.25, 0.82915619758885 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 97.0, 14.19506956657839 ], "wc_strengths_avg": [ 72.25, 38.931831449342326 ], "wc_weaknesses_avg": [ 230.25, 56.25555528123422 ], "wc_questions_avg": [ 7.75, 5.7608593109014565 ], "wc_review_avg": [ 407.25, 90.27838888682052 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.7071067811865475, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:mXiDScR1eqEJ:scholar.google.com/&scioq=Revisiting+the+Lottery+Ticket+Hypothesis+for+Pre-trained+Networks&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;1;1;2", "aff_unique_norm": "Adobe;NAVER Corporation;Seoul National University", "aff_unique_dep": "Adobe Systems Incorporated;Cloud Division;", "aff_unique_url": "https://www.adobe.com;https://www.naver.com;https://www.snu.ac.kr", "aff_unique_abbr": "Adobe;NAVER;SNU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;1;1", "aff_country_unique": "United States;South Korea" }, { "id": "9bSDTTDUIp", "title": "ERM++: An Improved Baseline for Domain Generalization", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Multi-source Domain Generalization (DG) measures a classifier's 
ability to generalize to new distributions of data it was not trained on, given several training domains. While several multi-source DG methods have been proposed, they incur additional complexity during training by using domain labels. Recent work has shown that a well-tuned Empirical Risk Minimization (ERM) training procedure, that is simply minimizing the empirical risk on the source domains, can outperform most existing DG methods. ERM has achieved such strong results while only tuning hyper-parameters such as learning rate, weight decay, and batch size. This paper aims to understand how we can push ERM as a baseline for DG further, thereby providing a stronger baseline for which to benchmark new methods. We call the resulting improved baseline ERM++, and it consists of better utilization of training data, model parameter selection, and weight-space regularization. ERM++ significantly improves the performance of DG on five multi-source datasets by over 5% compared to standard ERM using ResNet-50, and beats state-of-the-art despite being less computationally expensive. We also demonstrate the efficacy of ERM++ on the WILDS-FMOW dataset, a challenging DG benchmark. Finally, we show that with a CLIP-pretrained ViT-B/16, ERM++ outperforms ERM by over 10%, allowing one to take advantage of the stronger pre-training effectively. We will release code upon acceptance.", "keywords": "Domain Generalization;Multi-Source Domain Generalization.", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "/attachment/75d591d439050ce24e33a5216df536b9ce04f4be.zip", "author": "Piotr Teterwak;Kuniaki Saito;Theodoros Tsiligkaridis;Kate Saenko;Bryan A. Plummer", "authorids": "~Piotr_Teterwak1;~Kuniaki_Saito2;~Theodoros_Tsiligkaridis1;~Kate_Saenko1;~Bryan_A._Plummer1", "gender": "M;M;M;F;M", "homepage": "https://scholar.google.com/citations?user=lUkd1AMAAAAJ&hl=en&oi=ao;;https://sites.google.com/view/theo-t;http://ai.bu.edu;http://bryanplummer.com/", "dblp": "247/6128;182/1957;64/10412;88/2754;163/2330", "google_scholar": "lUkd1AMAAAAJ;https://scholar.google.co.jp/citations?user=2X0cwhkAAAAJ;hVUVOTIAAAAJ;https://scholar.google.com.tw/citations?user=9xDADY4AAAAJ;https://scholar.google.com/citations?hl=en", "orcid": ";;;0000-0002-5704-7614;", "linkedin": ";;;;", "or_profile": "~Piotr_Teterwak1;~Kuniaki_Saito2;~Theodoros_Tsiligkaridis1;~Kate_Saenko1;~Bryan_Allen_Plummer1", "aff": "Boston University;OMRON SINICX;MIT Lincoln Laboratory, Massachusetts Institute of Technology;Boston University, Boston University;Boston University", "aff_domain": "bu.edu;sinicx.com;ll.mit.edu;bu.edu;bu.edu", "position": "PhD student;Researcher;Senior AI Research Scientist;Full Professor;Assistant Professor", "bibtex": "@misc{\nteterwak2024erm,\ntitle={{ERM}++: An Improved Baseline for Domain Generalization},\nauthor={Piotr Teterwak and Kuniaki Saito and Theodoros Tsiligkaridis and Kate Saenko and Bryan A. 
Plummer},\nyear={2024},\nurl={https://openreview.net/forum?id=9bSDTTDUIp}\n}", "github": "", "project": "", "reviewers": "Xq2C;Pkyt;72G7;4v1r", "site": "https://openreview.net/forum?id=9bSDTTDUIp", "pdf_size": 19522919, "rating": "3;3;5;5", "confidence": "4;5;3;3", "soundness": "2;2;2;2", "contribution": "2;2;2;2", "presentation": "3;2;3;2", "wc_summary": "48;37;112;43", "wc_strengths": "46;16;32;89", "wc_weaknesses": "115;73;190;284", "wc_questions": "2;14;4;281", "wc_review": "211;140;338;697", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "289;166;299;584", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 3.75, 0.82915619758885 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 60.0, 30.273751006441206 ], "wc_strengths_avg": [ 45.75, 27.13277538328875 ], "wc_weaknesses_avg": [ 165.5, 80.23247472189799 ], "wc_questions_avg": [ 75.25, 118.87677443470612 ], "wc_review_avg": [ 346.5, 214.43239027721535 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 334.5, 153.2750795139249 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 8, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.9045340337332909, "gs_citation": 10, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12473608674129674084&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "aff_unique_index": "0;1;2;0;0", "aff_unique_norm": "Boston University;OMRON Corporation;Massachusetts Institute of Technology", "aff_unique_dep": ";;Lincoln Laboratory", "aff_unique_url": "https://www.bu.edu;https://www.omron.com;https://web.mit.edu", "aff_unique_abbr": "BU;OMRON;MIT", "aff_campus_unique_index": "1;2", "aff_campus_unique": ";Cambridge;Boston", "aff_country_unique_index": "0;1;0;0;0", "aff_country_unique": "United States;Japan" }, { "title": "Bootstrapping Variational Information Pursuit with Large Language and Vision Models for Interpretable Image Classification", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19290", "id": "9bmTbVaA2A", "author_site": "Aditya Chattopadhyay, Kwan Ho Ryan Chan, Rene Vidal", "tldr": "", "abstract": "Variational Information Pursuit (V-IP) is an interpretable-by-design framework that makes predictions by sequentially selecting a short chain of user-defined, interpretable queries about the data that are most informative for the task. The prediction is based solely on the obtained query answers, which also serve as a faithful explanation for the prediction. Applying the framework to any task requires (i) specification of a query set, and (ii) densely annotated data with query answers to train classifiers to answer queries at test time. This limits V-IP's application to small-scale tasks where manual data annotation is feasible. In this work, we focus on image classification tasks and propose to relieve this bottleneck by leveraging pretrained language and vision models. Specifically, following recent work, we propose to use GPT, a Large Language Model, to propose semantic concepts as queries for a given classification task. To answer these queries, we propose a light-weight Concept Question-Answering network (Concept-QA) which learns to answer binary queries about semantic concepts in images. We design pseudo-labels to train our Concept-QA model using GPT and CLIP (a Vision-Language Model). 
Empirically, we find our Concept-QA model to be competitive with state-of-the-art VQA models in terms of answering accuracy but with an order of magnitude fewer parameters. This allows for seamless integration of Concept-QA into the V-IP framework as a fast-answering mechanism. We name this method Concept-QA+V-IP. Finally, we show on several datasets that Concept-QA+V-IP produces shorter, interpretable query chains which are more accurate than V-IP trained with CLIP-based answering systems. Code available at https://github.com/adityac94/conceptqa_vip.", "keywords": "Interpretable ML;Explainable AI;Information Pursuit;Large Language Models;Large Multimodal Models;Vision Language Models", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "Aditya Chattopadhyay;Kwan Ho Ryan Chan;Rene Vidal", "authorids": "~Aditya_Chattopadhyay1;~Kwan_Ho_Ryan_Chan1;~Rene_Vidal1", "gender": "M;M;", "homepage": ";https://ryanchankh.github.io/;http://www.vision.jhu.edu", "dblp": "207/8574;267/5496;v/ReneVidal", "google_scholar": "aekzv1gAAAAJ;DBXWBqcAAAAJ;https://scholar.google.com/citations?hl=en", "orcid": ";;", "linkedin": ";ryanchankh/;rene-vidal-74844928/", "or_profile": "~Aditya_Chattopadhyay1;~Kwan_Ho_Ryan_Chan1;~Rene_Vidal1", "aff": "Johns Hopkins University;University of Pennsylvania ;Amazon", "aff_domain": "jhu.edu;seas.upenn.edu;amazon.com", "position": "PhD student;PhD student;Principal Researcher", "bibtex": "@inproceedings{\nchattopadhyay2024bootstrapping,\ntitle={Bootstrapping Variational Information Pursuit with Large Language and Vision Models for Interpretable Image Classification},\nauthor={Aditya Chattopadhyay and Kwan Ho Ryan Chan and Rene Vidal},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=9bmTbVaA2A}\n}", "github": "", "project": "", "reviewers": "ZeKa;3dNV;8mpd;8xTQ", "pdf_size": 20655217, "rating": "5;6;6;6", "confidence": "4;3;4;4", "soundness": "3;2;3;3", "contribution": "2;3;2;2", "presentation": "3;3;2;3", "wc_summary": "91;101;117;60", "wc_strengths": "152;77;78;41", "wc_weaknesses": "247;273;186;79", "wc_questions": "109;8;222;44", "wc_review": "599;459;603;224", "wc_reply_reviewers": "0;0;95;0", "wc_reply_authors": "1642;1527;1056;870", "reply_reviewers": "0;0;1;0", "reply_authors": "3;3;2;2", "rating_avg": [ 5.75, 0.4330127018922193 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 92.25, 20.801141795584204 ], "wc_strengths_avg": [ 87.0, 40.37945021913993 ], "wc_weaknesses_avg": [ 196.25, 74.69730584164331 ], "wc_questions_avg": [ 95.75, 81.38296811987138 ], "wc_review_avg": [ 471.25, 154.0785108313291 ], "wc_reply_reviewers_avg": [ 23.75, 41.13620667976084 ], "wc_reply_authors_avg": [ 1273.75, 320.22365231194277 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 2.5, 0.5 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.3333333333333333, "gs_citation": 9, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5154153297737871391&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 0, "openreview": "https://openreview.net/forum?id=9bmTbVaA2A", "pdf": "https://openreview.net/pdf?id=9bmTbVaA2A", "email": "jhu.edu;seas.upenn.edu;amazon.com", "author_num": 3, "aff_unique_index": "0;1;2", 
"aff_unique_norm": "Johns Hopkins University;University of Pennsylvania;Amazon", "aff_unique_dep": ";;Amazon.com, Inc.", "aff_unique_url": "https://www.jhu.edu;https://www.upenn.edu;https://www.amazon.com", "aff_unique_abbr": "JHU;UPenn;Amazon", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "title": "AGILE3D: Attention Guided Interactive Multi-object 3D Segmentation", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19289", "id": "9cQtXpRshE", "author_site": "Yuanwen Yue, Sabarinath Mahadevan, Jonas Schult, Francis Engelmann, Bastian Leibe, Konrad Schindler, Theodora Kontogianni", "tldr": "", "abstract": "During interactive segmentation, a model and a user work together to delineate objects of interest in a 3D point cloud. In an iterative process, the model assigns each data point to an object (or the background), while the user corrects errors in the resulting segmentation and feeds them back into the model. The current best practice formulates the problem as binary classification and segments objects one at a time. The model expects the user to provide positive clicks to indicate regions wrongly assigned to the background and negative clicks on regions wrongly assigned to the object. Sequentially visiting objects is wasteful since it disregards synergies between objects: a positive click for a given object can, by definition, serve as a negative click for nearby objects. Moreover, a direct competition between adjacent objects can speed up the identification of their common boundary. We introduce AGILE3D, an efficient, attention-based model that (1) supports simultaneous segmentation of multiple 3D objects, (2) yields more accurate segmentation masks with fewer user clicks, and (3) offers faster inference. Our core idea is to encode user clicks as spatial-temporal queries and enable explicit interactions between click queries as well as between them and the 3D scene through a click attention module. Every time new clicks are added, we only need to run a lightweight decoder that produces updated segmentation masks. In experiments with four different 3D point cloud datasets, AGILE3D sets a new state-of-the-art. Moreover, we also verify its practicality in real-world setups with real user studies. 
Project page: https://ywyue.github.io/AGILE3D.", "keywords": "interactive segmentation;3D instance segmentation;point cloud;attention", "primary_area": "applications to robotics, autonomy, planning", "supplementary_material": "/attachment/7f29a60c66bdc5881f680f613bc3c921576b6f6c.zip", "author": "Yuanwen Yue;Sabarinath Mahadevan;Jonas Schult;Francis Engelmann;Bastian Leibe;Konrad Schindler;Theodora Kontogianni", "authorids": "~Yuanwen_Yue1;~Sabarinath_Mahadevan1;~Jonas_Schult1;~Francis_Engelmann1;~Bastian_Leibe3;~Konrad_Schindler1;~Theodora_Kontogianni2", "gender": "M;M;M;;M;M;F", "homepage": "https://ywyue.github.io/;;https://www.vision.rwth-aachen.de/person/219/;;http://www.vision.rwth-aachen.de;https://igp.ethz.ch/personen/person-detail.html?persid=143986;", "dblp": "253/0221;220/3248;228/6936;;41/1228;73/488;191/4648", "google_scholar": "rO_8EHsAAAAJ;https://scholar.google.com/citations?hl=en;iW4T05IAAAAJ;;ZcULDB0AAAAJ;FZuNgqIAAAAJ;QVJIkWwAAAAJ", "orcid": ";;;;0000-0003-4225-0051;0000-0002-3172-9246;0000-0002-8754-8356", "linkedin": ";sabarinath-mahadevan-23b5b846?originalSubdomain=de;;;;konrad-schindler-5b0b22153/;", "or_profile": "~Yuanwen_Yue1;~Sabarinath_Mahadevan1;~Jonas_Schult1;~Francis_Engelmann1;~Bastian_Leibe3;~Konrad_Schindler1;~Theodora_Kontogianni2", "aff": "ETHZ - ETH Zurich;RWTH Aachen University;Rheinisch Westf\u00e4lische Technische Hochschule Aachen;;RWTH Aachen University;Swiss Federal Institute of Technology;ETHZ - ETH Zurich", "aff_domain": "ethz.ch;rwth-aachen.de;rwth-aachen.de;;rwth-aachen.de;ethz.ch;ethz.ch", "position": "Scientific Assistant;PhD student;PhD student;;Full Professor;Professor;Postdoc", "bibtex": "@inproceedings{\nyue2024agiled,\ntitle={{AGILE}3D: Attention Guided Interactive Multi-object 3D Segmentation},\nauthor={Yuanwen Yue and Sabarinath Mahadevan and Jonas Schult and Francis Engelmann and Bastian Leibe and Konrad Schindler and Theodora Kontogianni},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=9cQtXpRshE}\n}", "github": "", "project": "", "reviewers": "byjT;3vqw;Gxfu;PRcH", "pdf_size": 50509934, "rating": "3;5;6;8", "confidence": "4;4;3;3", "soundness": "2;2;3;4", "contribution": "2;2;3;3", "presentation": "3;3;3;4", "wc_summary": "69;52;50;78", "wc_strengths": "73;42;58;116", "wc_weaknesses": "365;106;31;57", "wc_questions": "76;5;1;14", "wc_review": "583;205;140;265", "wc_reply_reviewers": "263;0;0;0", "wc_reply_authors": "4041;859;483;204", "reply_reviewers": "3;0;0;0", "reply_authors": "8;3;2;2", "rating_avg": [ 5.5, 1.8027756377319946 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.75, 0.82915619758885 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 62.25, 11.712706775122479 ], "wc_strengths_avg": [ 72.25, 27.535204738661378 ], "wc_weaknesses_avg": [ 139.75, 132.80695576663143 ], "wc_questions_avg": [ 24.0, 30.389142798045487 ], "wc_review_avg": [ 298.25, 170.2400878171766 ], "wc_reply_reviewers_avg": [ 65.75, 113.88234059765368 ], "wc_reply_authors_avg": [ 1396.75, 1544.24939290906 ], "reply_reviewers_avg": [ 0.75, 1.299038105676658 ], "reply_authors_avg": [ 3.75, 2.48746859276655 ], "replies_avg": [ 25, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.8320502943378437, "gs_citation": 23, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14686933716165665768&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 6, "openreview": 
"https://openreview.net/forum?id=9cQtXpRshE", "pdf": "https://openreview.net/pdf?id=9cQtXpRshE", "email": "ethz.ch;rwth-aachen.de;rwth-aachen.de;;rwth-aachen.de;ethz.ch;ethz.ch", "author_num": 7, "aff_unique_index": "0;1;1;1;2;0", "aff_unique_norm": "ETH Zurich;RWTH Aachen University;Swiss Federal Institute of Technology", "aff_unique_dep": ";;", "aff_unique_url": "https://www.ethz.ch;https://www.rwth-aachen.de;https://www.ethz.ch", "aff_unique_abbr": "ETHZ;RWTH;ETH Zurich", "aff_campus_unique_index": "1;1;1", "aff_campus_unique": ";Aachen", "aff_country_unique_index": "0;1;1;1;0;0", "aff_country_unique": "Switzerland;Germany" }, { "id": "9ceadCJY4B", "title": "Ask Again, Then Fail: Large Language Models\u2019 Vacillations in Judgement", "track": "main", "status": "Reject", "tldr": "", "abstract": "With the emergence of generative conversational large language models (LLMs) like ChatGPT, serving as virtual assistants in various fields, the stability and reliability of their responses have become crucial. However, during usage, it has been observed that these models tend to waver in their judgements when confronted with follow-up questions from users expressing skepticism or disagreement. In this work, we draw inspiration from questioning strategies in education and propose a \\textsc{Follow-up Questioning Mechanism} along with two evaluation metrics to assess the judgement consistency of LLMs before and after exposure to disturbances. We evaluate the judgement consistency of ChatGPT, PaLM2-Bison, and Vicuna-13B under this mechanism across eight reasoning benchmarks. Empirical results show that even when the initial answers are correct, judgement consistency sharply decreases when LLMs face disturbances such as questioning, negation, or misleading. Additionally, we study these models' judgement consistency under various settings (sampling temperature and prompts) to validate this issue further, observing the impact of prompt tone and conducting an in-depth error analysis for deeper behavioral insights. 
Furthermore, we also explore several prompting methods to mitigate this issue and demonstrate their effectiveness.", "keywords": "Large Language Models;Uncertainty;Evaluation;In-Context Learning;Alignment;Multi-round dialogue;Robustness", "primary_area": "applications to neuroscience & cognitive science", "supplementary_material": "/attachment/7152853d31897128e3389fe7cc5498495d0d877f.pdf", "author": "Qiming Xie;Zengzhi Wang;Yi Feng;Rui Xia", "authorids": "~Qiming_Xie1;~Zengzhi_Wang1;~Yi_Feng8;~Rui_Xia1", "gender": ";M;M;M", "homepage": ";https://sinclaircoder.github.io/;https://github.com/mind-yi;http://www.nustm.cn/member/rxia/", "dblp": ";34/133;;", "google_scholar": "6YxHXgEAAAAJ;https://scholar.google.com/citations?hl=zh-CN;https://scholar.google.com/citations?hl=en;https://scholar.google.com.hk/citations?user=Znde6gwAAAAJ", "orcid": ";0000-0002-6146-6248;0009-0003-9827-6733;", "linkedin": ";;;", "or_profile": "~Qiming_Xie1;~Zengzhi_Wang1;~Yi_Feng8;~Rui_Xia1", "aff": "Nanjing University of Science and Technology;;Nanjing University of Science and Technology;Nanjing University of Science and Technology", "aff_domain": "njust.edu.cn;;njust.edu.cn;njust.edu.cn", "position": "PhD student;;MS student;Full Professor", "bibtex": "@misc{\nxie2024ask,\ntitle={Ask Again, Then Fail: Large Language Models{\\textquoteright} Vacillations in Judgement},\nauthor={Qiming Xie and Zengzhi Wang and Yi Feng and Rui Xia},\nyear={2024},\nurl={https://openreview.net/forum?id=9ceadCJY4B}\n}", "github": "", "project": "", "reviewers": "AVRR;3h1U;bqxm", "site": "https://openreview.net/forum?id=9ceadCJY4B", "pdf_size": 513500, "rating": "5;6;6", "confidence": "4;4;4", "soundness": "3;3;3", "contribution": "2;2;3", "presentation": "3;3;4", "wc_summary": "89;137;110", "wc_strengths": "76;41;76", "wc_weaknesses": "241;35;100", "wc_questions": "1;20;63", "wc_review": "407;233;349", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "1782;341;2842", "reply_reviewers": "0;0;0", "reply_authors": "4;1;7", "rating_avg": [ 5.666666666666667, 0.4714045207910317 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 3.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 112.0, 19.6468827043885 ], "wc_strengths_avg": [ 64.33333333333333, 16.49915822768611 ], "wc_weaknesses_avg": [ 125.33333333333333, 85.98578693921196 ], "wc_questions_avg": [ 28.0, 25.93581821856921 ], "wc_review_avg": [ 329.6666666666667, 72.33870947762954 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 1655.0, 1024.9705686831533 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 4.0, 2.449489742783178 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 13, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14812058383281440644&as_sdt=40005&sciodt=0,10&hl=en", "gs_version_total": 6, "aff_unique_index": "0;0;0", "aff_unique_norm": "Nanjing University of Science and Technology", "aff_unique_dep": "", "aff_unique_url": "http://www.nust.edu.cn/", "aff_unique_abbr": "NUST", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "China" }, { "id": "9cumTvvlHG", "title": "Implicit Chain of Thought Reasoning via Knowledge Distillation", "track": "main", "status": "Reject", "tldr": "", "abstract": "To augment language models with the ability to reason, researchers usually prompt or finetune them to produce chain of thought 
reasoning steps before producing the final answer. However, although people use natural language to reason effectively, it may be that LMs could reason more effectively with some intermediate computation that is not in natural language. In this work, we explore an alternative reasoning approach: instead of explicitly producing the chain of thought reasoning steps, we use the language model\u2019s internal hidden states to perform implicit reasoning. The implicit reasoning steps are distilled from a teacher model trained on explicit chain-of-thought reasoning, and instead of doing reasoning \u201chorizontally\u201d by producing intermediate words one-by-one, we distill it such that the reasoning\nhappens \u201cvertically\u201d among the hidden states in different layers. We conduct experiments on a multi-digit multiplication task and a grade school math problem dataset and find that this approach is able to outperform baselines that directly produce the answer by a large margin.", "keywords": "chain of thought;knowledge distillation", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Yuntian Deng;Kiran Prasad;Roland Fernandez;Paul Smolensky;Vishrav Chaudhary;Stuart Shieber", "authorids": "~Yuntian_Deng2;kiranprasad@microsoft.com;~Roland_Fernandez1;~Paul_Smolensky1;~Vishrav_Chaudhary1;~Stuart_Shieber1", "gender": ";;M;M;;M", "homepage": "https://yuntiandeng.com;;https://www.microsoft.com/en-us/research/people/rfernand/;http://cogsci.jhu.edu/directory/paul-smolensky/;;http://www.eecs.harvard.edu/~shieber/", "dblp": "166/1720;;http://dblp.uni-trier.de/pers/hd/f/Fernandez:Roland;48/1105;;", "google_scholar": "tk0e5lYAAAAJ;;4__jyWsAAAAJ;PRtkZzYAAAAJ;;", "orcid": ";;0000-0002-8032-6646;0000-0003-2420-182X;;0000-0002-7733-8195", "linkedin": ";;fernandezroland/;paul-smolensky-b1871183/;;", "or_profile": "~Yuntian_Deng2;kiranprasad@microsoft.com;~Roland_Fernandez1;~Paul_Smolensky1;~Vishrav_Chaudhary1;~Stuart_Shieber1", "aff": "Allen Institute for Artificial Intelligence;;Microsoft Research AI;Johns Hopkins University;;Harvard University", "aff_domain": "allenai.org;;microsoft.com;jhu.edu;;harvard.edu", "position": "Postdoc;;Senior Reseacher;Professor;;Full Professor", "bibtex": "@misc{\ndeng2024implicit,\ntitle={Implicit Chain of Thought Reasoning via Knowledge Distillation},\nauthor={Yuntian Deng and Kiran Prasad and Roland Fernandez and Paul Smolensky and Vishrav Chaudhary and Stuart Shieber},\nyear={2024},\nurl={https://openreview.net/forum?id=9cumTvvlHG}\n}", "github": "", "project": "", "reviewers": "XfmE;kRur;t8BA", "site": "https://openreview.net/forum?id=9cumTvvlHG", "pdf_size": 275248, "rating": "3;3;6", "confidence": "3;4;4", "soundness": "2;2;2", "contribution": "2;2;2", "presentation": "3;2;3", "wc_summary": "91;103;239", "wc_strengths": "41;9;81", "wc_weaknesses": "65;446;269", "wc_questions": "24;27;192", "wc_review": "221;585;781", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "246;580;707", "reply_reviewers": "0;0;0", "reply_authors": "1;1;1", "rating_avg": [ 4.0, 1.4142135623730951 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 144.33333333333334, 67.11846905948383 ], "wc_strengths_avg": [ 43.666666666666664, 29.4542960458327 ], "wc_weaknesses_avg": [ 260.0, 155.6727336433712 ], "wc_questions_avg": [ 81.0, 
78.49840762716146 ], "wc_review_avg": [ 529.0, 232.022987366913 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 511.0, 194.42393542634267 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 8, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.5, "gs_citation": 36, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14329277276992928160&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "aff_unique_index": "0;1;2;3", "aff_unique_norm": "Allen Institute for Artificial Intelligence;Microsoft;Johns Hopkins University;Harvard University", "aff_unique_dep": ";AI;;", "aff_unique_url": "https://allenai.org;https://www.microsoft.com/en-us/research;https://www.jhu.edu;https://www.harvard.edu", "aff_unique_abbr": "AI2;MSR;JHU;Harvard", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "id": "9g8h5HwZMy", "title": "Subgraph Diffusion for 3D Molecular Representation Learning: Combining Continuous and Discrete", "track": "main", "status": "Reject", "tldr": "", "abstract": "Molecular representation learning has shown great success in AI-based drug discovery. The 3D geometric structure contains crucial information about the underlying energy function, related to the physical and chemical properties. Recently, denoising diffusion probabilistic models have achieved impressive results in molecular conformation generation. However, the knowledge of pre-trained diffusion models has not been fully exploited in molecular representation learning. In this paper, we study the ability of representation learning inherent in the diffusion model for conformation generation. We introduce a new general diffusion model framework called MaskedDiff for molecular representation learning. Instead of adding noise to atoms like conventional diffusion models, MaskedDiff uses a discrete distribution to select a subset of the atoms to add continuous Gaussian noise at each step during the forward process. Further, we develop a novel subgraph diffusion model termed SUBGDIFF for enhancing the perception of molecular substructure in the denoising network (noise predictor), by incorporating auxiliary subgraph predictors during training. 
Experiments on molecular conformation generation and 3D molecular property prediction demonstrate the superior performance of our approach.", "keywords": "Diffusion model;Molecular representation learning;Subgraph;Masked vector", "primary_area": "applications to physical sciences (physics, chemistry, biology, etc.)", "supplementary_material": "/attachment/00780d42048704782dd30c09a50b5b27d5e58bd6.zip", "author": "Jiying Zhang;Zijing Liu;Yu Wang;Zhengyang Qi;Yu Li", "authorids": "~Jiying_Zhang1;~Zijing_Liu1;~Yu_Wang43;~Zhengyang_Qi2;~Yu_Li4", "gender": "M;;F;M;M", "homepage": "https://youjibiying.github.io/;https://github.com/zj-liu;https://github.com/rain305f;https://github.com/MiloQ/;https://yu-li.github.io/", "dblp": "287/9432;205/3211;;;34/2997-3", "google_scholar": "j90eZ0MAAAAJ;;lzsu-5MAAAAJ;;j9lwU7kAAAAJ", "orcid": ";0000-0002-0189-7409;;;", "linkedin": ";;;;", "or_profile": "~Jiying_Zhang1;~Zijing_Liu1;~Yu_Wang43;~Zhengyang_Qi2;~Yu_Li4", "aff": "IDEA;International Digital Economy Academy;Peking University;University of Science and Technology of China;International Digital Economy Academy", "aff_domain": "idea.edu.cn;idea.edu.cn;pku.edu.cn;ustc.edu.cn;idea.edu.cn", "position": "Researcher;Researcher;MS student;MS student;Principal Researcher", "bibtex": "@misc{\nzhang2024subgraph,\ntitle={Subgraph Diffusion for 3D Molecular Representation Learning: Combining Continuous and Discrete},\nauthor={Jiying Zhang and Zijing Liu and Yu Wang and Zhengyang Qi and Yu Li},\nyear={2024},\nurl={https://openreview.net/forum?id=9g8h5HwZMy}\n}", "github": "", "project": "", "reviewers": "yz4M;eamf;aJi2;7f3c", "site": "https://openreview.net/forum?id=9g8h5HwZMy", "pdf_size": 4601085, "rating": "3;5;6;6", "confidence": "5;4;4;3", "soundness": "2;2;3;3", "contribution": "2;2;3;2", "presentation": "2;2;2;3", "wc_summary": "52;78;73;49", "wc_strengths": "49;37;53;48", "wc_weaknesses": "318;99;110;40", "wc_questions": "13;170;104;33", "wc_review": "432;384;340;170", "wc_reply_reviewers": "68;79;0;0", "wc_reply_authors": "3115;3051;1688;1728", "reply_reviewers": "1;1;0;0", "reply_authors": "6;6;3;3", "rating_avg": [ 5.0, 1.224744871391589 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 63.0, 12.668859459319927 ], "wc_strengths_avg": [ 46.75, 5.931905258852336 ], "wc_weaknesses_avg": [ 141.75, 105.18168804502046 ], "wc_questions_avg": [ 80.0, 61.99596761080514 ], "wc_review_avg": [ 331.5, 98.75601247519059 ], "wc_reply_reviewers_avg": [ 36.75, 36.9552093756753 ], "wc_reply_authors_avg": [ 2395.5, 688.0176233207984 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 4.5, 1.5 ], "replies_avg": [ 27, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.8660254037844386, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:93SazIYRKncJ:scholar.google.com/&scioq=Subgraph+Diffusion+for+3D+Molecular+Representation+Learning:+Combining+Continuous+and+Discrete&hl=en&as_sdt=0,14", "gs_version_total": 0, "aff_unique_index": "0;1;2;3;1", "aff_unique_norm": "Institute of Electrical and Electronics Engineers;International Digital Economy Academy;Peking University;University of Science and Technology of China", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.ieee.org;;http://www.pku.edu.cn;http://www.ustc.edu.cn", "aff_unique_abbr": "IEEE;;Peking U;USTC", "aff_campus_unique_index": "", "aff_campus_unique": "", 
"aff_country_unique_index": "0;2;2", "aff_country_unique": "United States;;China" }, { "id": "9grjdFDiAj", "title": "Probabilistic Stability of Stochastic Gradient Descent", "track": "main", "status": "Reject", "tldr": "", "abstract": "Characterizing and understanding the stability of Stochastic Gradient Descent (SGD) remains an open problem in deep learning. A common method is to utilize the convergence of statistical moments, esp. the variance, of the parameters to quantify the stability. We revisit the definition of stability for SGD and propose using the \\textit{convergence in probability} condition to define the \\textit{probabilistic stability} of SGD. The probabilistic stability sheds light on a fundamental question in deep learning theory: how SGD selects a meaningful solution for a neural network from an enormous number of possible solutions that may severely overfit. We show that only through the lens of probabilistic stability does SGD exhibit rich and practically relevant phases of learning, such as the phases of the complete loss of stability, incorrect learning where the model captures incorrect data correlation, convergence to low-rank saddles, and correct learning where the model captures the correct correlation. These phase boundaries are precisely quantified by the Lyapunov exponents of the dynamics. The obtained phase diagrams imply that SGD prefers low-rank saddles in a neural network when the underlying gradient is noisy, thereby influencing the learning performance, for better or for worse.", "keywords": "stability;stochastic gradient descent", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Liu Ziyin;Botao Li;Tomer Galanti;Masahito Ueda", "authorids": "~Liu_Ziyin1;~Botao_Li1;~Tomer_Galanti1;~Masahito_Ueda1", "gender": ";M;M;M", "homepage": "https://www.mit.edu/~ziyinl/;;https://tomergalanti.github.io;http://cat.phys.s.u-tokyo.ac.jp/index-e.html", "dblp": ";;198/1490;", "google_scholar": "NpN9oRMAAAAJ;zRB_MlAAAAAJ;;https://scholar.google.co.jp/citations?user=Xpjx9CwAAAAJ", "orcid": ";0000-0003-1631-4373;;0000-0002-5367-1436", "linkedin": ";botao-li-33a0ab185;tomer-galanti-5880b1104/;", "or_profile": "~Liu_Ziyin1;~Botao_Li1;~Tomer_Galanti1;~Masahito_Ueda1", "aff": "Massachusetts Institute of Technology;Laboratoire de Probabilit\u00e9s, Statistique et Mod\u00e9lisation;Texas A&M University - College Station;The University of Tokyo", "aff_domain": "mit.edu;lpsm.paris;tamu.edu;u-tokyo.ac.jp", "position": "Postdoc;Postdoc;Assistant Professor;Full Professor", "bibtex": "@misc{\nziyin2024probabilistic,\ntitle={Probabilistic Stability of Stochastic Gradient Descent},\nauthor={Liu Ziyin and Botao Li and Tomer Galanti and Masahito Ueda},\nyear={2024},\nurl={https://openreview.net/forum?id=9grjdFDiAj}\n}", "github": "", "project": "", "reviewers": "Mfzw;PopN;My7s;bHzM", "site": "https://openreview.net/forum?id=9grjdFDiAj", "pdf_size": 2076494, "rating": "3;5;5;5", "confidence": "3;3;3;4", "soundness": "2;2;3;4", "contribution": "2;2;2;3", "presentation": "2;3;1;2", "wc_summary": "59;91;64;180", "wc_strengths": "39;50;25;62", "wc_weaknesses": "219;70;87;206", "wc_questions": "167;224;417;207", "wc_review": "484;435;593;655", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "1557;993;1438;1365", "reply_reviewers": "0;0;0;0", "reply_authors": "3;2;2;2", "rating_avg": [ 4.5, 0.8660254037844386 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 2.75, 
0.82915619758885 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.0, 0.7071067811865476 ], "wc_summary_avg": [ 98.5, 48.602983447521 ], "wc_strengths_avg": [ 44.0, 13.656500283747663 ], "wc_weaknesses_avg": [ 145.5, 67.4258852370512 ], "wc_questions_avg": [ 253.75, 96.49708544821445 ], "wc_review_avg": [ 541.75, 86.86591679133997 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 1338.25, 210.78113648996202 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 2.25, 0.4330127018922193 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.3333333333333333, "gs_citation": 8, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=8050913484983213429&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "aff_unique_index": "0;1;2;3", "aff_unique_norm": "Massachusetts Institute of Technology;Laboratoire de Probabilit\u00e9s, Statistique et Mod\u00e9lisation;Texas A&M University;University of Tokyo", "aff_unique_dep": ";Department of Probability, Statistics and Modeling;;", "aff_unique_url": "https://web.mit.edu;;https://www.tamu.edu;https://www.u-tokyo.ac.jp", "aff_unique_abbr": "MIT;;TAMU;UTokyo", "aff_campus_unique_index": "1", "aff_campus_unique": ";College Station", "aff_country_unique_index": "0;1;0;2", "aff_country_unique": "United States;France;Japan" }, { "id": "9gyDdCKTDJ", "title": "Gaitor: Learning a Unified Representation for Continuous Gait Transition and Terrain Traversal for Quadruped Robots", "track": "main", "status": "Reject", "tldr": "", "abstract": "The current state-of-the-art in quadruped locomotion is able to produce robust motion for terrain traversal but requires the segmentation of a desired trajectory into a discrete set of skills such as trot, crawl and pace. This misses the opportunity to leverage commonalities between individual gait types for efficient learning and are unable to smoothly transition between them. Here we present Gaitor, which creates a learnt representation capturing correlations across multiple distinct gait types resulting in the discovery of smooth transitions between motions. In particular, this representation is compact meaning that information common to all gait types is shared. The emerging structure is interpretable in that it encodes phase correlations between the different gait types which can be leveraged to produce smooth gait transitions. In addition, foot swing characteristics are disentangled and directly addressable. Together with a rudimentary terrain encoding and a learned planner operating in this structured latent representation, Gaitor is able to take motion commands including gait type and characteristics from a user while reacting to uneven terrain. We evaluate Gaitor in both simulated and real-world settings, such as climbing over raised platforms, on an ANYmal C platform. 
To the best of our knowledge, this is the first work learning an interpretable unified-latent representation for multiple gaits, resulting in smooth and natural looking gait transitions between trot and crawl on a real quadruped robot.", "keywords": "Representation Learning;Learning for Control;Quadruped Robots", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/46c3aaac74ab3f930d6e07d07f05685a0e77eacd.zip", "author": "Alexander Luis Mitchell;Wolfgang Merkt;Aristotelis Papatheodorou;Ioannis Havoutis;Ingmar Posner", "authorids": "~Alexander_Luis_Mitchell1;~Wolfgang_Merkt1;aristotelis@robots.ox.ac.uk;~Ioannis_Havoutis1;~Ingmar_Posner1", "gender": "M;;;;", "homepage": ";http://www.wolfgangmerkt.com/;;;", "dblp": "268/8155;;;;59/542", "google_scholar": "https://scholar.google.co.uk/citations?user=7YV2TGMAAAAJ;WzpoCwkAAAAJ;;;dPk-iwsAAAAJ", "orcid": ";0000-0003-3235-4906;;;0000-0001-6270-700X", "linkedin": ";;;;ingmar-posner-20b49a", "or_profile": "~Alexander_Luis_Mitchell1;~Wolfgang_Merkt1;aristotelis@robots.ox.ac.uk;~Ioannis_Havoutis1;~Ingmar_Posner1", "aff": "University of Oxford;University of Oxford, University of Oxford;;;University of Oxford", "aff_domain": "oxford.ac.uk;robots.ox.ac.uk;;;ox.ac.uk", "position": "Postdoc;Postdoc;;;Full Professor", "bibtex": "@misc{\nmitchell2024gaitor,\ntitle={Gaitor: Learning a Unified Representation for Continuous Gait Transition and Terrain Traversal for Quadruped Robots},\nauthor={Alexander Luis Mitchell and Wolfgang Merkt and Aristotelis Papatheodorou and Ioannis Havoutis and Ingmar Posner},\nyear={2024},\nurl={https://openreview.net/forum?id=9gyDdCKTDJ}\n}", "github": "", "project": "", "reviewers": "QD8G;keBn;A1WD;st69", "site": "https://openreview.net/forum?id=9gyDdCKTDJ", "pdf_size": 3909475, "rating": "3;5;5;5", "confidence": "5;2;3;4", "soundness": "3;4;2;2", "contribution": "3;3;2;2", "presentation": "1;3;2;2", "wc_summary": "118;102;37;160", "wc_strengths": "47;53;39;71", "wc_weaknesses": "327;58;21;320", "wc_questions": "57;3;364;3", "wc_review": "549;216;461;554", "wc_reply_reviewers": "136;36;55;0", "wc_reply_authors": "662;580;820;484", "reply_reviewers": "1;1;1;0", "reply_authors": "2;2;2;1", "rating_avg": [ 4.5, 0.8660254037844386 ], "confidence_avg": [ 3.5, 1.118033988749895 ], "soundness_avg": [ 2.75, 0.82915619758885 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.0, 0.7071067811865476 ], "wc_summary_avg": [ 104.25, 44.228808484968255 ], "wc_strengths_avg": [ 52.5, 11.779218989389747 ], "wc_weaknesses_avg": [ 181.5, 142.62275414533264 ], "wc_questions_avg": [ 106.75, 150.15054944954414 ], "wc_review_avg": [ 445.0, 137.28983939097606 ], "wc_reply_reviewers_avg": [ 56.75, 49.8366080306435 ], "wc_reply_authors_avg": [ 636.5, 123.25887391989268 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 1.75, 0.4330127018922193 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.7745966692414834, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:jEOifc3UKW4J:scholar.google.com/&scioq=Gaitor:+Learning+a+Unified+Representation+for+Continuous+Gait+Transition+and+Terrain+Traversal+for+Quadruped+Robots&hl=en&as_sdt=0,10", "gs_version_total": 0, "aff_unique_index": "0;0;0", "aff_unique_norm": "University of Oxford", "aff_unique_dep": "", "aff_unique_url": "https://www.ox.ac.uk", "aff_unique_abbr": "Oxford", "aff_campus_unique_index": "", 
"aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United Kingdom" }, { "title": "Machine Unlearning for Image-to-Image Generative Models", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19288", "id": "9hjVoPWPnh", "author_site": "Guihong Li, Hsiang Hsu, Chun-Fu Chen, Radu Marculescu", "tldr": "", "abstract": "Machine unlearning has emerged as a new paradigm to deliberately forget data samples from a given model in order to adhere to stringent regulations.\nHowever, existing machine unlearning methods have been primarily focused on classification models, leaving the landscape of unlearning for generative models relatively unexplored.\nThis paper serves as a bridge, addressing the gap by providing a unifying framework of machine unlearning for image-to-image generative models.\nWithin this framework, we propose a computationally-efficient algorithm, underpinned by rigorous theoretical analysis, that demonstrates negligible performance degradation on the retain samples, while effectively removing the information from the forget samples. \nEmpirical studies on two large-scale datasets, ImageNet-1K and Places-365, further show that our algorithm does not rely on the availability of the retain samples, which further complies with data retention policy.\nTo our best knowledge, this work is the first that represents systemic, theoretical, empirical explorations of machine unlearning specifically tailored for image-to-image generative models.", "keywords": "Machine Unlearning;Generative Models;Diffusion Models;GAN;Masked Autoencoder", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "Guihong Li;Hsiang Hsu;Chun-Fu Chen;Radu Marculescu", "authorids": "~Guihong_Li1;~Hsiang_Hsu1;~Chun-Fu_Chen1;~Radu_Marculescu2", "gender": "Unspecified;M;M;M", "homepage": "https://liguihong.github.io/;https://hsianghsu.github.io;;https://radum.ece.utexas.edu/", "dblp": "143/6649.html;;48/915;88/3494", "google_scholar": ";https://scholar.google.com.tw/citations?user=JRl3iYIAAAAJ;9gqd5cYAAAAJ;ZCmYP5cAAAAJ", "orcid": "0000-0001-8537-8632;0000-0001-8084-3929;;0000-0003-1826-7646", "linkedin": ";;;", "or_profile": "~Guihong_Li1;~Hsiang_Hsu1;~Chun-Fu_Chen1;~Radu_Marculescu2", "aff": "University of Texas, Austin;JP Morgan & Chase Bank;JPMorganChase, GTAR;University of Texas, Austin", "aff_domain": "utexas.edu;jpmchase.com;jpmchase.com;utexas.edu", "position": "PhD student;Researcher;Executive Director;Full Professor", "bibtex": "@inproceedings{\nli2024machine,\ntitle={Machine Unlearning for Image-to-Image Generative Models},\nauthor={Guihong Li and Hsiang Hsu and Chun-Fu Chen and Radu Marculescu},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=9hjVoPWPnh}\n}", "github": "", "project": "", "reviewers": "L8mN;uD61;4Xrc;hK5e", "pdf_size": 31020328, "rating": "5;5;6;8", "confidence": "3;4;4;4", "soundness": "2;2;3;3", "contribution": "2;2;3;3", "presentation": "2;3;3;3", "wc_summary": "79;90;74;106", "wc_strengths": "93;55;41;54", "wc_weaknesses": "253;593;48;56", "wc_questions": "49;33;21;202", "wc_review": "474;771;184;418", "wc_reply_reviewers": "0;270;0;0", "wc_reply_authors": "1349;3084;547;1057", "reply_reviewers": "0;1;0;0", "reply_authors": "3;5;2;2", "rating_avg": [ 6.0, 1.224744871391589 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.5, 0.5 
], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 87.25, 12.275483697190918 ], "wc_strengths_avg": [ 60.75, 19.421315609401955 ], "wc_weaknesses_avg": [ 237.5, 221.06164298674702 ], "wc_questions_avg": [ 76.25, 73.27815158694985 ], "wc_review_avg": [ 461.75, 209.0722064263923 ], "wc_reply_reviewers_avg": [ 67.5, 116.91342951089922 ], "wc_reply_authors_avg": [ 1509.25, 953.4113422337706 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 3.0, 1.224744871391589 ], "replies_avg": [ 21, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.4714045207910316, "gs_citation": 29, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=2939352183806994849&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=9hjVoPWPnh", "pdf": "https://openreview.net/pdf?id=9hjVoPWPnh", "email": "utexas.edu;jpmchase.com;jpmchase.com;utexas.edu", "author_num": 4, "aff_unique_index": "0;1;2;0", "aff_unique_norm": "University of Texas at Austin;JPMorgan Chase & Co.;JPMorgan Chase", "aff_unique_dep": ";;Global Technology, Analytics, and Research (GTAR)", "aff_unique_url": "https://www.utexas.edu;https://www.jpmorganchase.com;https://www.jpmorganchase.com", "aff_unique_abbr": "UT Austin;JPM;JPM", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Austin;", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "title": "Bayesian Optimization through Gaussian Cox Process Models for Spatio-temporal Data", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19287", "id": "9j1RD9LlWH", "author_site": "Yongsheng Mei, Mahdi Imani, Tian Lan", "tldr": "", "abstract": "Bayesian optimization (BO) has established itself as a leading strategy for efficiently optimizing expensive-to-evaluate functions. Existing BO methods mostly rely on Gaussian process (GP) surrogate models and are not applicable to (doubly-stochastic) Gaussian Cox processes, where the observation process is modulated by a latent intensity function modeled as a GP. In this paper, we propose a novel maximum *a posteriori* inference of Gaussian Cox processes. It leverages the Laplace approximation and change of kernel technique to transform the problem into a new reproducing kernel Hilbert space, where it becomes more tractable computationally. It enables us to obtain both a functional posterior of the latent intensity function and the covariance of the posterior, thus extending existing works that often focus on specific link functions or estimating the posterior mean. Using the result, we propose a BO framework based on the Gaussian Cox process model and further develop a Nystr\u00f6m approximation for efficient computation. 
Extensive evaluations on various synthetic and real-world datasets demonstrate significant improvement over state-of-the-art inference solutions for Gaussian Cox processes, as well as effective BO with a wide range of acquisition functions designed through the underlying Gaussian Cox process model.", "keywords": "Bayesian optimization;Gaussian Cox process", "primary_area": "probabilistic methods (Bayesian methods, variational inference, sampling, UQ, etc.)", "supplementary_material": "", "author": "Yongsheng Mei;Mahdi Imani;Tian Lan", "authorids": "~Yongsheng_Mei1;~Mahdi_Imani3;~Tian_Lan4", "gender": "M;M;M", "homepage": ";https://www2.seas.gwu.edu/~tlan/;https://imani.lab.northeastern.edu/", "dblp": "261/7750;;176/7532", "google_scholar": "y4Qyp24AAAAJ;;IwSVQXEAAAAJ", "orcid": "0000-0001-7606-8931;;0000-0001-9570-9909", "linkedin": "yongshengmei/;;mahdi-imani-2a362b25/", "or_profile": "~Yongsheng_Mei1;~Tian_Lan4;~Mahdi_Imani2", "aff": "George Washington University;George Washington University;Northeastern University", "aff_domain": "gwu.edu;gwu.edu;northeastern.edu", "position": "PhD student;Full Professor;Assistant Professor", "bibtex": "@inproceedings{\nmei2024bayesian,\ntitle={Bayesian Optimization through Gaussian Cox Process Models for Spatio-temporal Data},\nauthor={Yongsheng Mei and Mahdi Imani and Tian Lan},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=9j1RD9LlWH}\n}", "github": "", "project": "", "reviewers": "kMEd;dgpT;bJz1", "pdf_size": 10544913, "rating": "6;8;8", "confidence": "2;4;4", "soundness": "4;3;3", "contribution": "3;3;3", "presentation": "3;4;2", "wc_summary": "177;140;87", "wc_strengths": "87;134;65", "wc_weaknesses": "55;391;193", "wc_questions": "89;17;569", "wc_review": "408;682;914", "wc_reply_reviewers": "56;95;284", "wc_reply_authors": "920;1460;1701", "reply_reviewers": "1;1;3", "reply_authors": "3;3;4", "rating_avg": [ 7.333333333333333, 0.9428090415820634 ], "confidence_avg": [ 3.3333333333333335, 0.9428090415820634 ], "soundness_avg": [ 3.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 3.0, 0.816496580927726 ], "wc_summary_avg": [ 134.66666666666666, 36.935379004718804 ], "wc_strengths_avg": [ 95.33333333333333, 28.778850258865837 ], "wc_weaknesses_avg": [ 213.0, 137.8985134075056 ], "wc_questions_avg": [ 225.0, 245.01428529781688 ], "wc_review_avg": [ 668.0, 206.8107024954624 ], "wc_reply_reviewers_avg": [ 145.0, 99.56907150315303 ], "wc_reply_authors_avg": [ 1360.3333333333333, 326.53772965599074 ], "reply_reviewers_avg": [ 1.6666666666666667, 0.9428090415820634 ], "reply_authors_avg": [ 3.3333333333333335, 0.4714045207910317 ], "replies_avg": [ 21, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 1.0, "gs_citation": 10, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5833568390443611849&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=9j1RD9LlWH", "pdf": "https://openreview.net/pdf?id=9j1RD9LlWH", "email": "gwu.edu;gwu.edu;northeastern.edu", "author_num": 3, "aff_unique_index": "0;0;1", "aff_unique_norm": "George Washington University;Northeastern University", "aff_unique_dep": ";", "aff_unique_url": "https://www.gwu.edu;https://www.northeastern.edu", "aff_unique_abbr": "GWU;NEU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "9jMoHuqjfg", "title": 
"Learning to Reach Goals via Diffusion", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Diffusion models are a powerful class of generative models capable of mapping random noise in high-dimensional spaces to a target manifold through iterative denoising. In this work, we present a novel perspective on goal-conditioned reinforcement learning by framing it within the context of diffusion modeling. Analogous to the diffusion process, where Gaussian noise is used to create random trajectories that walk away from the data manifold, we construct trajectories that move away from potential goal states. We then learn a goal-conditioned policy analogous to the score function. This approach, which we call Merlin, can reach predefined or novel goals from an arbitrary initial state without learning a separate value function. We consider three choices for the noise model to replace Gaussian noise in diffusion - reverse play from the buffer, reverse dynamics model, and a novel non-parametric approach. We theoretically justify our approach and validate it on offline goal-reaching tasks. Empirical results are competitive with state-of-the-art methods, which suggests this perspective on diffusion for RL is a simple, scalable, and effective direction for sequential decision-making.", "keywords": "Goal-conditioned reinforcement learning;Offline reinforcement learning;Diffusion modeling", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Vineet Jain;Siamak Ravanbakhsh", "authorids": "~Vineet_Jain1;~Siamak_Ravanbakhsh1", "gender": ";", "homepage": ";", "dblp": "92/3653;", "google_scholar": "https://scholar.google.com/citations?hl=en;", "orcid": ";", "linkedin": ";", "or_profile": "~Vineet_Jain1;~Siamak_Ravanbakhsh1", "aff": "McGill University;", "aff_domain": "mcgill.ca;", "position": "PhD student;", "bibtex": "@misc{\njain2024learning,\ntitle={Learning to Reach Goals via Diffusion},\nauthor={Vineet Jain and Siamak Ravanbakhsh},\nyear={2024},\nurl={https://openreview.net/forum?id=9jMoHuqjfg}\n}", "github": "", "project": "", "reviewers": "5ke8;euBm;6Zbj;i457", "site": "https://openreview.net/forum?id=9jMoHuqjfg", "pdf_size": 11802882, "rating": "3;5;5;5", "confidence": "3;4;3;3", "soundness": "2;3;2;2", "contribution": "2;2;2;2", "presentation": "2;2;2;3", "wc_summary": "71;84;77;97", "wc_strengths": "33;89;37;12", "wc_weaknesses": "155;96;276;111", "wc_questions": "140;2;2;10", "wc_review": "399;271;392;230", "wc_reply_reviewers": "0;0;255;0", "wc_reply_authors": "641;450;1170;557", "reply_reviewers": "0;0;1;0", "reply_authors": "1;1;3;1", "rating_avg": [ 4.5, 0.8660254037844386 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 82.25, 9.67923034130297 ], "wc_strengths_avg": [ 42.75, 28.340562803162538 ], "wc_weaknesses_avg": [ 159.5, 70.67000778265134 ], "wc_questions_avg": [ 38.5, 58.69199263954155 ], "wc_review_avg": [ 323.0, 73.97634757136905 ], "wc_reply_reviewers_avg": [ 63.75, 110.41823898251593 ], "wc_reply_authors_avg": [ 704.5, 277.1502300197494 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.5, 0.8660254037844386 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.3333333333333333, "gs_citation": 5, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=17073276869658529521&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 6, 
"aff_unique_index": "0", "aff_unique_norm": "McGill University", "aff_unique_dep": "", "aff_unique_url": "https://www.mcgill.ca", "aff_unique_abbr": "McGill", "aff_country_unique_index": "0", "aff_country_unique": "Canada" }, { "id": "9jmUwjZi7j", "title": "DreamFuser: Value-guided Diffusion Policy for Offline Reinforcement Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "Recent advances in reinforcement learning have underscored the potential of diffusion models, particularly in the context of policy learning. While earlier applications were predominantly focused on single-timestep settings, trajectory-based diffusion policy learning promises significant superiority, especially for low-level control tasks. In this context, we introduce DreamFuser, a trajectory-based value optimization approach that seamlessly blends the merits of diffusion-based trajectory learning and efficient Q function learning over state and noisy action. To address the computational challenges associated with action sampling of diffusion policy during the training phase, we design the DreamFuser based on the Generalized Noisy Action Markov Decision Process (GNMDP), which views the diffusion denoising process as part of the MDP transition. Empirical tests reveal DreamFuser's advantages over existing diffusion policy algorithms, notably in low-level control tasks. When benchmarked against the standard benchmark of offline reinforcement learning D4RL, DreamFuser matches or even outperforms contemporary methods. This work also elucidates the parallels between the optimization process of DreamFuser over GNMDP and Diffusion Policy over MDP, demonstrating its computational and memory advantages.", "keywords": "Trajectory-based Reinforcement Learning; Diffusion Model; Offline Reinforcement Learning;", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/acb2e143858cab7aafa815293691c9f1f4874b5e.zip", "author": "Kairong Luo;CAIWEI XIAO;Zhiao Huang;Zhan Ling;Yunhao Fang;Hao Su", "authorids": "~Kairong_Luo1;~CAIWEI_XIAO1;~Zhiao_Huang1;~Zhan_Ling2;~Yunhao_Fang1;~Hao_Su1", "gender": "M;F;M;M;M;M", "homepage": "https://github.com/thu-yao-01-luo/thu-yao-01-luo;;;;https://seerkfang.github.io/;http://ai.ucsd.edu/~haosu", "dblp": ";;172/1410;254/1980;;09/4945-1", "google_scholar": ";;;vsRxnYAAAAAJ;;1P8Zu04AAAAJ", "orcid": ";;;;;", "linkedin": ";caiwei-xiao;;zhan-ling-069a59149/;yunhao-fang-8b318221a/;", "or_profile": "~Kairong_Luo1;~CAIWEI_XIAO1;~Zhiao_Huang1;~Zhan_Ling2;~Yunhao_Fang1;~Hao_Su1", "aff": "Tsinghua University;;University of California, San Diego, University of California, San Diego;University of California, San Diego;University of California, San Diego;University of California, San Diego", "aff_domain": "tsinghua.edu.cn;;eng.ucsd.edu;ucsd.edu;ucsd.edu;ucsd.edu", "position": "Undergrad student;;PhD student;PhD student;MS student;Associate Professor", "bibtex": "@misc{\nluo2024dreamfuser,\ntitle={DreamFuser: Value-guided Diffusion Policy for Offline Reinforcement Learning},\nauthor={Kairong Luo and CAIWEI XIAO and Zhiao Huang and Zhan Ling and Yunhao Fang and Hao Su},\nyear={2024},\nurl={https://openreview.net/forum?id=9jmUwjZi7j}\n}", "github": "", "project": "", "reviewers": "vgVx;pkRP;6WsC", "site": "https://openreview.net/forum?id=9jmUwjZi7j", "pdf_size": 544922, "rating": "3;3;6", "confidence": "4;3;3", "soundness": "2;2;3", "contribution": "2;2;2", "presentation": "3;1;3", "wc_summary": "54;29;47", "wc_strengths": "86;36;55", "wc_weaknesses": "250;579;203", 
"wc_questions": "9;2;363", "wc_review": "399;646;668", "wc_reply_reviewers": "186;0;218", "wc_reply_authors": "1156;1542;1487", "reply_reviewers": "1;0;1", "reply_authors": "2;4;3", "rating_avg": [ 4.0, 1.4142135623730951 ], "confidence_avg": [ 3.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.3333333333333335, 0.9428090415820634 ], "wc_summary_avg": [ 43.333333333333336, 10.530379332620875 ], "wc_strengths_avg": [ 59.0, 20.607442021431645 ], "wc_weaknesses_avg": [ 344.0, 167.27422594849054 ], "wc_questions_avg": [ 124.66666666666667, 168.55134397433784 ], "wc_review_avg": [ 571.0, 121.95354306729537 ], "wc_reply_reviewers_avg": [ 134.66666666666666, 96.11567105431988 ], "wc_reply_authors_avg": [ 1395.0, 170.4836258022062 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 3.0, 0.816496580927726 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.5, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:yQEgfy0z2sMJ:scholar.google.com/&scioq=DreamFuser:+Value-guided+Diffusion+Policy+for+Offline+Reinforcement+Learning&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1;1;1;1", "aff_unique_norm": "Tsinghua University;University of California, San Diego", "aff_unique_dep": ";", "aff_unique_url": "https://www.tsinghua.edu.cn;https://www.ucsd.edu", "aff_unique_abbr": "THU;UCSD", "aff_campus_unique_index": "1;1;1;1", "aff_campus_unique": ";San Diego", "aff_country_unique_index": "0;1;1;1;1", "aff_country_unique": "China;United States" }, { "title": "On the Learnability of Watermarks for Language Models", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19286", "id": "9k0krNzvlV", "author_site": "Chenchen Gu, XIANG LI, Percy Liang, Tatsunori Hashimoto", "tldr": "", "abstract": "Watermarking of language model outputs enables statistical detection of model-generated text, which can mitigate harms and misuses of language models. Existing watermarking strategies operate by altering the decoder of an existing language model. In this paper, we ask whether language models can directly learn to generate watermarked text, which would have significant implications for the real-world deployment of watermarks. First, learned watermarks could be used to build open models that naturally generate watermarked text, enabling watermarking for open models, where users can control the decoding procedure. Second, if watermarking is used to determine the provenance of generated text, an adversary can hurt the reputation of a victim model by spoofing its watermark and generating damaging watermarked text. To investigate the learnability of watermarks, we propose watermark distillation, which trains a student model to behave like a teacher model that uses decoding-based watermarking. We test our approach on three decoding-based watermarking strategies and various hyperparameter settings, finding that models can learn to generate watermarked text with high detectability. 
We also find limitations to learnability, including the loss of watermarking capabilities under fine-tuning on normal text and high sample complexity when learning low-distortion watermarks.", "keywords": "watermarking;large language models;distillation", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Chenchen Gu;Xiang Lisa Li;Percy Liang;Tatsunori Hashimoto", "authorids": "~Chenchen_Gu1;~Xiang_Lisa_Li1;~Percy_Liang1;~Tatsunori_Hashimoto1", "gender": "M;F;;M", "homepage": "https://chenchenygu.github.io/;https://xiangli1999.github.io;https://cs.stanford.edu/~pliang/;https://thashim.github.io", "dblp": ";40/1491-63;04/1701;", "google_scholar": "kHeBSVYAAAAJ;nzA4P0oAAAAJ;pouyVyUAAAAJ;5ygiTwsAAAAJ", "orcid": ";;;", "linkedin": "chenchen-gu/;;;", "or_profile": "~Chenchen_Gu1;~Xiang_Lisa_Li1;~Percy_Liang1;~Tatsunori_Hashimoto1", "aff": "Stanford University;Stanford University;Stanford University;Stanford University", "aff_domain": "stanford.edu;stanford.edu;stanford.edu;stanford.edu", "position": "Undergrad student;PhD student;Associate Professor;Assistant Professor", "bibtex": "@inproceedings{\ngu2024on,\ntitle={On the Learnability of Watermarks for Language Models},\nauthor={Chenchen Gu and Xiang Lisa Li and Percy Liang and Tatsunori Hashimoto},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=9k0krNzvlV}\n}", "github": "", "project": "", "reviewers": "2p7U;GhKC;hxrQ;metd", "pdf_size": 569282, "rating": "5;6;6;6", "confidence": "3;4;4;4", "soundness": "3;3;3;4", "contribution": "3;3;3;2", "presentation": "3;2;2;4", "wc_summary": "37;81;208;74", "wc_strengths": "14;94;121;72", "wc_weaknesses": "101;177;198;224", "wc_questions": "72;1;131;68", "wc_review": "224;353;658;438", "wc_reply_reviewers": "0;0;46;12", "wc_reply_authors": "820;655;1206;1032", "reply_reviewers": "0;0;1;1", "reply_authors": "2;2;2;2", "rating_avg": [ 5.75, 0.4330127018922193 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.82915619758885 ], "wc_summary_avg": [ 100.0, 64.55617708631762 ], "wc_strengths_avg": [ 75.25, 39.39146481155531 ], "wc_weaknesses_avg": [ 175.0, 45.8530260724415 ], "wc_questions_avg": [ 68.0, 46.02716589146023 ], "wc_review_avg": [ 418.25, 158.00375786670392 ], "wc_reply_reviewers_avg": [ 14.5, 18.83480820183736 ], "wc_reply_authors_avg": [ 928.25, 208.74191601113563 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 2.0, 0.0 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 1.0, "gs_citation": 44, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=4306363265805586600&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=9k0krNzvlV", "pdf": "https://openreview.net/pdf?id=9k0krNzvlV", "email": "stanford.edu;stanford.edu;stanford.edu;stanford.edu", "author_num": 4, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "Stanford University", "aff_unique_dep": "", "aff_unique_url": "https://www.stanford.edu", "aff_unique_abbr": "Stanford", "aff_campus_unique_index": "0;0;0;0", "aff_campus_unique": "Stanford", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "id": "9k27IITeAZ", "title": "ChunkAttention: Efficient Attention on KV Cache with Chunking Sharing and Batching", "track": "main", "status": "Reject", 
"tldr": "", "abstract": "Self-attention is an essential component of GPT-style models and a significant cause of LLM inference latency for long sequences. In multi-tenant LLM inference servers, the compute and memory operation cost of self-attention can be amortized by making use of the probability that sequences from users may share long prompt prefixes. This paper introduces ChunkAttention, a unique self-attention kernel built on chunking, sharing the KV cache, and batching the attention computation. ChunkAttention recognizes matching prompt prefixes across several sequences and shares their KV cache in memory by chunking the KV cache and structuring it into the auxiliary prefix tree. To significantly improve the memory reuse of KV cache and consequently the speed of self-attention for long shared prompts, we design an efficient computation kernel on this new storage structure, where two-phased partitioning is implemented to reduce memory operations on shared KV cache during self-attention. Experiments show that ChunkAttention can speed up self-attention of long shared prompts 1.6-3 times, with lengths ranging from 1024 to 8192.", "keywords": "large language model;model inference;self attention", "primary_area": "infrastructure, software libraries, hardware, etc.", "supplementary_material": "/attachment/34a6aefe728c3e9a526d796dc036dc6b0d6a9571.zip", "author": "Lu Ye;Ze Tao;Yong Huang;Yang Li", "authorids": "~Lu_Ye1;~Ze_Tao2;~Yong_Huang4;~Yang_Li83", "gender": "M;M;;M", "homepage": "https://scholar.google.com/citations?user=kRjMKvEAAAAJ&hl=en;https://github.com/Toudsour;https://www.linkedin.com/in/yong-huang-818698bb/;https://leon.github.io", "dblp": ";;;", "google_scholar": "kRjMKvEAAAAJ;;;", "orcid": ";;;", "linkedin": ";;;", "or_profile": "~Lu_Ye1;~Ze_Tao2;~Yong_Huang4;~Yang_Li83", "aff": ";Xi'an Jiaotong University;;", "aff_domain": ";xjtu.edu.cn;;", "position": ";MS student;;", "bibtex": "@misc{\nye2024chunkattention,\ntitle={ChunkAttention: Efficient Attention on {KV} Cache with Chunking Sharing and Batching},\nauthor={Lu Ye and Ze Tao and Yong Huang and Yang Li},\nyear={2024},\nurl={https://openreview.net/forum?id=9k27IITeAZ}\n}", "github": "", "project": "", "reviewers": "oC3j;ee1U;sEJt;FRg7", "site": "https://openreview.net/forum?id=9k27IITeAZ", "pdf_size": 566347, "rating": "3;5;5;5", "confidence": "5;3;5;3", "soundness": "2;3;3;2", "contribution": "3;2;4;2", "presentation": "2;3;3;2", "wc_summary": "91;94;67;44", "wc_strengths": "40;19;63;53", "wc_weaknesses": "111;145;204;69", "wc_questions": "102;9;28;166", "wc_review": "344;267;362;332", "wc_reply_reviewers": "54;0;20;32", "wc_reply_authors": "415;85;151;162", "reply_reviewers": "1;0;1;1", "reply_authors": "1;1;1;1", "rating_avg": [ 4.5, 0.8660254037844386 ], "confidence_avg": [ 4.0, 1.0 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.75, 0.82915619758885 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 74.0, 20.23610634484806 ], "wc_strengths_avg": [ 43.75, 16.452583383772897 ], "wc_weaknesses_avg": [ 132.25, 49.403314666123364 ], "wc_questions_avg": [ 76.25, 62.3873985673389 ], "wc_review_avg": [ 326.25, 35.83556194620087 ], "wc_reply_reviewers_avg": [ 26.5, 19.56399754651385 ], "wc_reply_authors_avg": [ 203.25, 125.75049701691043 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 2, "gs_cited_by_link": 
"https://scholar.google.com/scholar?cites=7802398420830154308&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 0, "aff_unique_index": "0", "aff_unique_norm": "Xi'an Jiao Tong University", "aff_unique_dep": "", "aff_unique_url": "https://www.xjtu.edu.cn", "aff_unique_abbr": "XJTU", "aff_country_unique_index": "0", "aff_country_unique": "China" }, { "id": "9k4Yvb75ED", "title": "EquiAV: Single-modal Equivariance Promotes Audio-Visual Contrastive Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "Advancements in audio-visual representation learning have showcased its effectiveness in acquiring rich and comprehensive representations by leveraging both auditory and visual modalities. Recent works have attempted to improve performance using contrastive learning or masked modeling techniques. However, the effort to maximize the impact of data augmentations for learning semantically rich representation has remained relatively narrow. Without a proper strategy for utilizing data augmentation, the model can be adversely affected or fail to achieve sufficient performance gains. To address this limitation, we present EquiAV, a novel framework that integrates single-modal equivariant contrastive learning with audio-visual contrastive learning. In the proposed framework, audio-visual correspondence and rich modality-specific representations are learned in separate latent spaces. In particular, augmentation-related and modality-specific information is learned in the intra-modal latent space by making the representations equivariant to data augmentation. Extensive ablation studies verify that our framework is the most suitable architecture for maximizing the benefits of the augmentation while ensuring model robustness to strong augmentation. 
EquiAV outperforms the existing audio-visual self-supervised pre-training methods on audio-visual event classification and zero-shot audio-visual retrieval tasks.", "keywords": "Audio-Visual Contrastive Learning;Multimodal Representation Learning;Equivariant Contrastive Learning", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Jongsuk Kim;Hyeongkeun Lee;Kyeongha Rho;Junmo Kim;Joon Son Chung", "authorids": "~Jongsuk_Kim1;~Hyeongkeun_Lee1;~Kyeongha_Rho1;~Junmo_Kim1;~Joon_Son_Chung1", "gender": "M;M;M;;M", "homepage": ";https://khrho325.github.io;https://siit.kaist.ac.kr/Faculty;https://mmai.io/joon/;https://siit.kaist.ac.kr/", "dblp": "325/1370;264/9498;40/240-2.html;160/2692.html;330/3774", "google_scholar": "rFmAVN4AAAAJ;;https://scholar.google.com.tw/citations?user=GdQtWNQAAAAJ;https://scholar.google.co.uk/citations?user=JJ_LQ0YAAAAJ;C1O5NFQAAAAJ", "orcid": ";;;0000-0001-7741-7275;", "linkedin": ";;;;", "or_profile": "~Hyeongkeun_Lee1;~Kyeongha_Rho1;~Junmo_Kim1;~Joon_Son_Chung1;~Jong_Suk_Kim1", "aff": "Korea Advanced Institute of Science & Technology;KAIST;Korea Advanced Institute of Science & Technology;KAIST;Korea Advanced Institute of Science & Technology", "aff_domain": "kaist.ac.kr;kaist.ac.kr;kaist.ac.kr;kaist.ac.kr;kaist.ac.kr", "position": "MS student;MS student;Associate Professor;Associate Professor;PhD student", "bibtex": "@misc{\nkim2024equiav,\ntitle={Equi{AV}: Single-modal Equivariance Promotes Audio-Visual Contrastive Learning},\nauthor={Jongsuk Kim and Hyeongkeun Lee and Kyeongha Rho and Junmo Kim and Joon Son Chung},\nyear={2024},\nurl={https://openreview.net/forum?id=9k4Yvb75ED}\n}", "github": "", "project": "", "reviewers": "4TFL;eQDc;3ZPL;A7KE", "site": "https://openreview.net/forum?id=9k4Yvb75ED", "pdf_size": 4747337, "rating": "3;3;3;6", "confidence": "4;5;2;3", "soundness": "3;2;3;3", "contribution": "1;2;1;3", "presentation": "3;3;3;3", "wc_summary": "137;121;58;90", "wc_strengths": "129;65;20;143", "wc_weaknesses": "387;156;295;47", "wc_questions": "29;65;5;336", "wc_review": "682;407;378;616", "wc_reply_reviewers": "140;0;0;7", "wc_reply_authors": "1687;1080;1053;981", "reply_reviewers": "2;0;0;1", "reply_authors": "3;2;2;2", "rating_avg": [ 3.75, 1.299038105676658 ], "confidence_avg": [ 3.5, 1.118033988749895 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 1.75, 0.82915619758885 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 101.5, 30.26962173533062 ], "wc_strengths_avg": [ 89.25, 49.630509769697106 ], "wc_weaknesses_avg": [ 221.25, 129.93532044829072 ], "wc_questions_avg": [ 108.75, 132.92925750187578 ], "wc_review_avg": [ 520.75, 130.7581259425203 ], "wc_reply_reviewers_avg": [ 36.75, 59.67987516742976 ], "wc_reply_authors_avg": [ 1200.25, 283.3455266984111 ], "reply_reviewers_avg": [ 0.75, 0.82915619758885 ], "reply_authors_avg": [ 2.25, 0.4330127018922193 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.2581988897471611, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:QCXIDQNANV8J:scholar.google.com/&scioq=EquiAV:+Single-modal+Equivariance+Promotes+Audio-Visual+Contrastive+Learning&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;0;0;0;0", "aff_unique_norm": "Korea Advanced Institute of Science and Technology", "aff_unique_dep": "", "aff_unique_url": "https://www.kaist.ac.kr", "aff_unique_abbr": "KAIST", "aff_campus_unique_index": "", 
"aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "South Korea" }, { "title": "Time Fairness in Online Knapsack Problems", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19285", "id": "9kG7TwgLYu", "author_site": "Adam Lechowicz, Rik Sengupta, Bo Sun, Shahin Kamali, Mohammad Hajiesmaili", "tldr": "", "abstract": "The online knapsack problem is a classic problem in the field of online algorithms. Its canonical version asks how to pack items of different values and weights arriving online into a capacity-limited knapsack so as to maximize the total value of the admitted items. Although optimal competitive algorithms are known for this problem, they may be fundamentally unfair, i.e., individual items may be treated inequitably in different ways. We formalize a practically-relevant notion of time fairness which effectively models a trade off between static and dynamic pricing in a motivating application such as cloud resource allocation, and show that existing algorithms perform poorly under this metric. We propose a parameterized deterministic algorithm where the parameter precisely captures the Pareto-optimal trade-off between fairness (static pricing) and competitiveness (dynamic pricing). We show that randomization is theoretically powerful enough to be simultaneously competitive and fair; however, it does not work well in experiments. To further improve the trade-off between fairness and competitiveness, we develop a nearly-optimal learning-augmented algorithm which is fair, consistent, and robust (competitive), showing substantial performance improvements in numerical experiments.", "keywords": "fairness;online knapsack;learning-augmented algorithm;Pareto-optimality;robustness;consistency", "primary_area": "optimization", "supplementary_material": "/attachment/6e62237334e258d8dddb48f6242a120848a5903b.pdf", "author": "Adam Lechowicz;Rik Sengupta;Bo Sun;Shahin Kamali;Mohammad Hajiesmaili", "authorids": "~Adam_Lechowicz1;~Rik_Sengupta1;~Bo_Sun8;~Shahin_Kamali1;~Mohammad_Hajiesmaili1", "gender": "Non-Binary;M;;M;M", "homepage": "https://adamlechowicz.github.io;https://people.cs.umass.edu/~rsengupta/;;https://www.eecs.yorku.ca/~kamalis/;https://groups.cs.umass.edu/hajiesmaili/", "dblp": "307/5199;151/8711;;59/577.html;49/7911", "google_scholar": "fZ2-jm0AAAAJ;hK7NUBIAAAAJ;;hQXlVLsAAAAJ;XCGuYKIAAAAJ", "orcid": "0000-0002-7774-9939;0000-0002-9238-5408;;0000-0003-1404-2212;", "linkedin": ";rik-sengupta-ab00bb224/;;shahin-kamali-4a3b376?originalSubdomain=ca;", "or_profile": "~Adam_Lechowicz1;~Rik_Sengupta1;~Bo_Sun8;~Shahin_Kamali1;~Mohammad_Hajiesmaili1", "aff": "University of Massachusetts Amherst;University of Massachusetts at Amherst;;York University;College of Information and Computer Science, University of Massachusetts, Amherst", "aff_domain": "cs.umass.edu;umass.edu;;yorku.ca;cics.umass.edu", "position": "PhD student;PhD student;;Assistant Professor;Assistant Professor", "bibtex": "@inproceedings{\nlechowicz2024time,\ntitle={Time Fairness in Online Knapsack Problems},\nauthor={Adam Lechowicz and Rik Sengupta and Bo Sun and Shahin Kamali and Mohammad Hajiesmaili},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=9kG7TwgLYu}\n}", "github": "", "project": "", "reviewers": "rQKw;zsDR;37F8", "pdf_size": 1607054, "rating": "6;6;8", "confidence": "3;4;2", "soundness": "3;3;3", "contribution": "3;3;3", "presentation": "3;3;4", "wc_summary": 
"60;178;153", "wc_strengths": "42;108;86", "wc_weaknesses": "40;155;79", "wc_questions": "30;4;22", "wc_review": "172;445;340", "wc_reply_reviewers": "34;55;14", "wc_reply_authors": "923;662;88", "reply_reviewers": "2;1;1", "reply_authors": "2;2;1", "rating_avg": [ 6.666666666666667, 0.9428090415820634 ], "confidence_avg": [ 3.0, 0.816496580927726 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 3.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 130.33333333333334, 50.769632218045025 ], "wc_strengths_avg": [ 78.66666666666667, 27.438820836342234 ], "wc_weaknesses_avg": [ 91.33333333333333, 47.75167245471327 ], "wc_questions_avg": [ 18.666666666666668, 10.873004286866726 ], "wc_review_avg": [ 319.0, 112.43664882946307 ], "wc_reply_reviewers_avg": [ 34.333333333333336, 16.73983937265296 ], "wc_reply_authors_avg": [ 557.6666666666666, 348.7791405587337 ], "reply_reviewers_avg": [ 1.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 1.6666666666666667, 0.4714045207910317 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.8660254037844385, "gs_citation": 6, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14561090357017339709&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=9kG7TwgLYu", "pdf": "https://openreview.net/pdf?id=9kG7TwgLYu", "email": "cs.umass.edu;umass.edu;;yorku.ca;cics.umass.edu", "author_num": 5, "aff_unique_index": "0;0;1;0", "aff_unique_norm": "University of Massachusetts Amherst;York University", "aff_unique_dep": ";", "aff_unique_url": "https://www.umass.edu;https://www.yorku.ca", "aff_unique_abbr": "UMass Amherst;York U", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Amherst;", "aff_country_unique_index": "0;0;1;0", "aff_country_unique": "United States;Canada" }, { "id": "9kLDrE5rsW", "title": "Temporal graph models fail to capture global temporal dynamics", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "A recently released Temporal Graph Benchmark is analyzed in the context of Dynamic Link Property Prediction. We outline our observations and propose a trivial optimization-free baseline of \"recently popular nodes\" outperforming other methods on medium and large-size datasets in the Temporal Graph Benchmark. We propose two measures based on Wasserstein distance which can quantify the strength of short-term and long-term global dynamics of datasets. By analyzing our unexpectedly strong baseline, we show how standard negative sampling evaluation can be unsuitable for datasets with strong temporal dynamics. We also show how simple negative-sampling can lead to model degeneration during training, resulting in impossible to rank, fully saturated predictions of temporal graph networks. We propose improved negative sampling schemes for both training and evaluation and prove their usefulness. We conduct a comparison with a model trained non-contrastively without negative sampling. Our results provide a challenging baseline and indicate that temporal graph network architectures need deep rethinking for usage in problems with significant global dynamics, such as social media, cryptocurrency markets or e-commerce. 
We open-source the code for baselines, measures and proposed negative sampling schemes.", "keywords": "temporal graph;dynamic graph;graph neural networks;temporal graph neural networks", "primary_area": "learning on graphs and other geometries & topologies", "supplementary_material": "", "author": "Michal Daniluk;Jacek Dabrowski", "authorids": "~Michal_Daniluk1;~Jacek_Dabrowski1", "gender": "M;M", "homepage": ";", "dblp": ";", "google_scholar": ";https://scholar.google.pl/citations?user=1rbW6yUAAAAJ", "orcid": ";", "linkedin": "https://pl.linkedin.com/in/michaldaniluk91;ponythewhite/", "or_profile": "~Michal_Daniluk1;~Jacek_Dabrowski1", "aff": ";Synerise S.A.", "aff_domain": ";synerise.com", "position": ";Principal Researcher", "bibtex": "@misc{\ndaniluk2024temporal,\ntitle={Temporal graph models fail to capture global temporal dynamics},\nauthor={Michal Daniluk and Jacek Dabrowski},\nyear={2024},\nurl={https://openreview.net/forum?id=9kLDrE5rsW}\n}", "github": "", "project": "", "reviewers": "mQmi;C9Fh;BqDA;Chai", "site": "https://openreview.net/forum?id=9kLDrE5rsW", "pdf_size": 473608, "rating": "1;3;3;6", "confidence": "2;4;4;3", "soundness": "1;1;2;3", "contribution": "2;1;2;3", "presentation": "1;1;2;3", "wc_summary": "60;81;78;82", "wc_strengths": "33;21;58;81", "wc_weaknesses": "608;230;208;22", "wc_questions": "126;2;144;100", "wc_review": "827;334;488;285", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 3.25, 1.7853571071357126 ], "confidence_avg": [ 3.25, 0.82915619758885 ], "soundness_avg": [ 1.75, 0.82915619758885 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 1.75, 0.82915619758885 ], "wc_summary_avg": [ 75.25, 8.926785535678562 ], "wc_strengths_avg": [ 48.25, 23.14492384951828 ], "wc_weaknesses_avg": [ 267.0, 212.81212371479216 ], "wc_questions_avg": [ 93.0, 54.817880294662984 ], "wc_review_avg": [ 483.5, 211.99351405172754 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.2955402316445243, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=15199979378178198245&as_sdt=40005&sciodt=0,10&hl=en", "gs_version_total": 4, "aff_unique_index": "0", "aff_unique_norm": "Synerise", "aff_unique_dep": "", "aff_unique_url": "https://www.synerise.com", "aff_unique_abbr": "Synerise", "aff_country_unique_index": "0", "aff_country_unique": "Poland" }, { "id": "9lvyCHhQix", "title": "Diversity-aware Continual Learning with Latent Knowledge Hypergraph", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Continual learning (CL) refers to the ability of models to learn from non-stationary data distribution while transferring and protecting past knowledge. Existing literature in CL has mainly focused on overcoming catastrophic forgetting. However, they often overlook a critical trade-off between parameter efficiency and capacity saturation. Almost all of the existing approaches including architecture-stable and architecture-growing methods struggle to balance parameter efficiency and capacity saturation. This makes them vulnerable to long-term task-incremental CL under storage constraints. 
In this paper, we propose a novel CL approach that addresses the trade-off between parameter efficiency and capacity saturation by dynamically expanding the model's weight space in proportion to the actual capacity increase needed by each new task. Specifically, our approach introduces a unique knowledge hypergraph structure that captures the latent knowledge across tasks and leverages it to measure task diversity and estimate the capacity increase required for each new task. Moreover, we introduce new constraints to ensure parameter efficiency during inference and a fine-grained parameter generator to create task-specific sub-networks that ensure a constant number of trainable parameters over time while accommodating the evolving complexities of tasks. Extensive experiment results show that the proposed approach achieves state-of-the-art results on several benchmark CL datasets, while maintaining low parameter counts.", "keywords": "continual learning;hypernetwork;hypergraph;diversity awareness", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "", "author": "Jiayi Chen;Kishlay Jha;Aidong Zhang", "authorids": "~Jiayi_Chen4;~Kishlay_Jha2;~Aidong_Zhang2", "gender": "F;M;F", "homepage": "https://jia-yi-chen.github.io/;https://engineering.uiowa.edu/people/kishlay-jha;https://engineering.virginia.edu/faculty/aidong-zhang", "dblp": "42/1159;177/7445;z/AidongZhang.html", "google_scholar": "f3Iz6qoAAAAJ;8GhLfu8AAAAJ;O8XxkE4AAAAJ", "orcid": "0000-0003-0217-6352;0000-0003-0826-445X;0000-0001-9723-3246", "linkedin": ";kishlayjha/;", "or_profile": "~Jiayi_Chen4;~Kishlay_Jha2;~Aidong_Zhang2", "aff": "University of Virginia;University of Iowa;University of Virginia", "aff_domain": "cs.virginia.edu;uiowa.edu;virginia.edu", "position": "PhD student;Assistant Professor;Full Professor", "bibtex": "@misc{\nchen2024diversityaware,\ntitle={Diversity-aware Continual Learning with Latent Knowledge Hypergraph},\nauthor={Jiayi Chen and Kishlay Jha and Aidong Zhang},\nyear={2024},\nurl={https://openreview.net/forum?id=9lvyCHhQix}\n}", "github": "", "project": "", "reviewers": "j4Dh;8ANK;RNxE;9KLn", "site": "https://openreview.net/forum?id=9lvyCHhQix", "pdf_size": 2600665, "rating": "3;3;5;5", "confidence": "5;3;4;4", "soundness": "1;2;3;3", "contribution": "2;2;3;2", "presentation": "3;1;3;2", "wc_summary": "93;112;44;63", "wc_strengths": "103;76;37;31", "wc_weaknesses": "410;241;109;135", "wc_questions": "127;101;131;4", "wc_review": "733;530;321;233", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.25, 0.82915619758885 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.25, 0.82915619758885 ], "wc_summary_avg": [ 78.0, 26.277366686941825 ], "wc_strengths_avg": [ 61.75, 29.422567868899545 ], "wc_weaknesses_avg": [ 223.75, 118.35407682036137 ], "wc_questions_avg": [ 90.75, 51.39248485916983 ], "wc_review_avg": [ 454.25, 193.74387087079683 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:L78khaq-8dQJ:scholar.google.com/&scioq=Diversity-aware+Continual+Learning+with+Latent+Knowledge+Hypergraph&hl=en&as_sdt=0,5", 
"gs_version_total": 0, "aff_unique_index": "0;1;0", "aff_unique_norm": "University of Virginia;University of Iowa", "aff_unique_dep": ";", "aff_unique_url": "https://www.virginia.edu;https://www.uiowa.edu", "aff_unique_abbr": "UVA;UIowa", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "title": "DataInf: Efficiently Estimating Data Influence in LoRA-tuned LLMs and Diffusion Models", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19284", "id": "9m02ib92Wz", "author_site": "Yongchan Kwon, Eric Wu, Kevin Wu, James Y Zou", "tldr": "", "abstract": "Quantifying the impact of training data points is crucial for understanding the outputs of machine learning models and for improving the transparency of the AI pipeline. The influence function is a principled and popular data attribution method, but its computational cost often makes it challenging to use. This issue becomes more pronounced in the setting of large language models and text-to-image models. In this work, we propose DataInf, an efficient influence approximation method that is practical for large-scale generative AI models. Leveraging an easy-to-compute closed-form expression, DataInf outperforms existing influence computation algorithms in terms of computational and memory efficiency. Our theoretical analysis shows that DataInf is particularly well-suited for parameter-efficient fine-tuning techniques such as LoRA. Through systematic empirical evaluations, we show that DataInf accurately approximates influence scores and is orders of magnitude faster than existing methods. In applications to RoBERTa-large, Llama-2-13B-chat, and stable-diffusion-v1.5 models, DataInf effectively identifies the most influential fine-tuning examples better than other approximate influence scores. 
Moreover, it can help to identify which data points are mislabeled.", "keywords": "Influence function;Data valuation", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/e078e037cea2844184989983823731a351cdeacf.zip", "author": "Yongchan Kwon;Eric Wu;Kevin Wu;James Zou", "authorids": "~Yongchan_Kwon1;~Eric_Wu3;~Kevin_Wu1;~James_Zou1", "gender": ";M;;", "homepage": ";;https://kevinwu.ai;", "dblp": ";;;", "google_scholar": ";6pIliiAAAAAJ;s4dCi5sAAAAJ;23ZXZvEAAAAJ", "orcid": ";;;", "linkedin": ";;;", "or_profile": "~Yongchan_Kwon1;~Eric_Wu3;~Kevin_Wu1;~James_Zou1", "aff": ";Stanford University;Stanford University;Stanford University", "aff_domain": ";stanford.edu;stanford.edu;stanford.edu", "position": ";PhD student;PhD student;Assistant Professor", "bibtex": "@inproceedings{\nkwon2024datainf,\ntitle={DataInf: Efficiently Estimating Data Influence in Lo{RA}-tuned {LLM}s and Diffusion Models},\nauthor={Yongchan Kwon and Eric Wu and Kevin Wu and James Zou},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=9m02ib92Wz}\n}", "github": "", "project": "", "reviewers": "kkF9;oMqQ;gXtX;NdTy", "pdf_size": 3982524, "rating": "6;6;6;6", "confidence": "3;2;3;3", "soundness": "3;3;3;2", "contribution": "3;3;3;3", "presentation": "3;2;3;3", "wc_summary": "56;27;275;23", "wc_strengths": "35;30;19;17", "wc_weaknesses": "134;26;69;108", "wc_questions": "109;13;70;37", "wc_review": "334;96;433;185", "wc_reply_reviewers": "10;10;0;0", "wc_reply_authors": "725;313;416;743", "reply_reviewers": "1;1;0;0", "reply_authors": "3;3;1;3", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 2.75, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 95.25, 104.55710162394519 ], "wc_strengths_avg": [ 25.25, 7.495832175282475 ], "wc_weaknesses_avg": [ 84.25, 40.81896005534683 ], "wc_questions_avg": [ 57.25, 36.08583517115822 ], "wc_review_avg": [ 262.0, 130.29773597419106 ], "wc_reply_reviewers_avg": [ 5.0, 5.0 ], "wc_reply_authors_avg": [ 549.25, 188.41228065070493 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 2.5, 0.8660254037844386 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 60, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=4678751591021020846&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=9m02ib92Wz", "pdf": "https://openreview.net/pdf?id=9m02ib92Wz", "email": ";stanford.edu;stanford.edu;stanford.edu", "author_num": 4, "aff_unique_index": "0;0;0", "aff_unique_norm": "Stanford University", "aff_unique_dep": "", "aff_unique_url": "https://www.stanford.edu", "aff_unique_abbr": "Stanford", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Stanford", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "9mX0AZVEet", "title": "Improving Diffusion Models for Inverse Problems Using Optimal Posterior Covariance", "track": "main", "status": "Reject", "tldr": "", "abstract": "Recent diffusion models provide a promising alternative zero-shot solution to noisy linear inverse problems without retraining for specific inverse problems. 
In this paper, we propose the first unified framework for diffusion-based zero-shot methods from the view of approximating conditional posterior mean for the reverse process. We reveal that recent diffusion-based zero-shot methods are equivalent to making isotropic Gaussian approximation to intractable posterior distributions over clean images given diffused noisy images, with only difference in handcrafted design of isotropic posterior covariances. Inspired by this finding, we develop the optimal posterior covariance of the posterior distribution via maximum likelihood estimation. We provide a general solution based on three approaches specifically designed for posterior covariance optimization, by training from scratch and using pre-trained models with and without reverse covariances. Remarkably, the proposed framework can be achieved in a plug-and-play fashion based on pre-trained unconditional diffusion models by converting reverse covariances or via Monte Carlo estimation without reverse covariances. Experimental results demonstrate that the proposed framework significantly outperforms existing zero-shot methods and enhances the robustness to hyper-parameters.", "keywords": "Generative models;Inverse problems;Diffusion models", "primary_area": "generative models", "supplementary_material": "/attachment/ebc9ae332842f7f74263d5ba0b69be7ce8767fab.zip", "author": "Xinyu Peng;Ziyang Zheng;Wenrui Dai;Nuoqian Xiao;Chenglin Li;Junni Zou;Hongkai Xiong", "authorids": "~Xinyu_Peng1;~Ziyang_Zheng2;~Wenrui_Dai1;~Nuoqian_Xiao1;~Chenglin_Li2;~Junni_Zou1;~Hongkai_Xiong1", "gender": "M;M;;;M;F;M", "homepage": "https://github.com/xypeng9903;;;;https://min.sjtu.edu.cn/En/FacultyShow/4?Vid=17;http://www.cs.sjtu.edu.cn/~zou-jn;http://min.sjtu.edu.cn", "dblp": ";;16/5135.html;;;91/4613;21/3569", "google_scholar": ";pcgDcMmDJbwC;Xg8MhyAAAAAJ;;ltW2JMcAAAAJ;https://scholar.google.com/citations?hl=zh-CN;bB16iN4AAAAJ", "orcid": ";0000-0001-9923-8016;;;;;0000-0003-4552-0029", "linkedin": "xinyu-peng-328918246/;;;;;;", "or_profile": "~Xinyu_Peng1;~Ziyang_Zheng2;~Wenrui_Dai1;~Nuoqian_Xiao1;~Chenglin_Li2;~Junni_Zou1;~Hongkai_Xiong1", "aff": "Shanghai Jiaotong University;Shanghai Jiaotong University;Shanghai Jiaotong University;;Shanghai Jiaotong University;Shanghai Jiaotong University;Shanghai Jiaotong University", "aff_domain": "sjtu.edu.cn;sjtu.edu.cn;sjtu.edu.cn;;sjtu.edu.cn;sjtu.edu.cn;sjtu.edu.cn", "position": "PhD student;PhD student;Associate Professor;;Full Professor;Full Professor;Full Professor", "bibtex": "@misc{\npeng2024improving,\ntitle={Improving Diffusion Models for Inverse Problems Using Optimal Posterior Covariance},\nauthor={Xinyu Peng and Ziyang Zheng and Wenrui Dai and Nuoqian Xiao and Chenglin Li and Junni Zou and Hongkai Xiong},\nyear={2024},\nurl={https://openreview.net/forum?id=9mX0AZVEet}\n}", "github": "", "project": "", "reviewers": "rzGL;8Q2y;FU6y", "site": "https://openreview.net/forum?id=9mX0AZVEet", "pdf_size": 40237100, "rating": "5;5;8", "confidence": "4;4;5", "soundness": "3;2;3", "contribution": "2;2;3", "presentation": "3;3;3", "wc_summary": "45;72;109", "wc_strengths": "35;68;247", "wc_weaknesses": "95;112;245", "wc_questions": "4;529;92", "wc_review": "179;781;693", "wc_reply_reviewers": "0;290;31", "wc_reply_authors": "1179;1688;1876", "reply_reviewers": "0;1;1", "reply_authors": "2;4;3", "rating_avg": [ 6.0, 1.4142135623730951 ], "confidence_avg": [ 4.333333333333333, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 
2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 75.33333333333333, 26.233989826601334 ], "wc_strengths_avg": [ 116.66666666666667, 93.13908357337905 ], "wc_weaknesses_avg": [ 150.66666666666666, 67.06381703687582 ], "wc_questions_avg": [ 208.33333333333334, 229.5740016252324 ], "wc_review_avg": [ 551.0, 265.4857183855031 ], "wc_reply_reviewers_avg": [ 107.0, 130.0179474790564 ], "wc_reply_authors_avg": [ 1581.0, 294.43618437051293 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 3.0, 0.816496580927726 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": 1.0, "gs_citation": 15, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14269481151172449337&as_sdt=5,48&sciodt=0,48&hl=en", "gs_version_total": 6, "aff_unique_index": "0;0;0;0;0;0", "aff_unique_norm": "Shanghai Jiao Tong University", "aff_unique_dep": "", "aff_unique_url": "https://www.sjtu.edu.cn", "aff_unique_abbr": "SJTU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "China" }, { "id": "9n9q0R9Gyw", "title": "Retrieval-augmented Text-to-3D Generation", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Text-to-3D generation using neural networks has been confronted with a fundamental difficulty regarding the scale and quality of 3D data. Score distillation sampling based on 2D diffusion models addresses this issue effectively; however, it also introduces 3D inconsistencies that plague generated 3D scenes due to a lack of robust 3D prior knowledge and awareness. In this study, we propose a novel framework for retrieval-augmented text-to-3D generation that is capable of generating superior-quality 3D objects with decent geometry. After we employ a particle-based variational inference framework, we augment the conventional target distribution in SDS-based techniques with an empirical distribution of retrieved 3D assets. Furthermore, based on the retrieved 3D assets, we propose the two effective methods: a lightweight adaptation of a 2D prior model for reducing its inherent bias toward certain camera viewpoints, and delta distillation to regularize artifacts of generated 3D contents. 
Our experimental results show that our method not only exhibits state-of-the-art quality in text-to-3D generation but also significantly enhances the geometry compared to the baseline.", "keywords": "diffusion models;NeRF;3d synthesis", "primary_area": "generative models", "supplementary_material": "/attachment/c39a7cc106e4888a0676c8fdf37ee17c7c231196.zip", "author": "Junyoung Seo;Susung Hong;Wooseok Jang;Min-Seop Kwak;Hyeonsu Kim;Doyup Lee;Seungryong Kim", "authorids": "~Junyoung_Seo1;~Susung_Hong1;~Wooseok_Jang2;~Min-Seop_Kwak1;~Hyeonsu_Kim2;~Doyup_Lee1;~Seungryong_Kim1", "gender": "M;M;;M;F;M;M", "homepage": "https://j0seo.github.io;https://susunghong.github.io/;https://github.com/woo1726;;https://ines-hyeonsu-kim.github.io;;https://cvlab.korea.ac.kr/members/faculty", "dblp": "209/9340;330/5127;30/4458;338/9125;367/9344;205/2368;141/9955", "google_scholar": "orJRvmEAAAAJ;HigIHvUAAAAJ;;;tBcqfncAAAAJ;https://scholar.google.co.kr/citations?user=5rAj44kAAAAJ;cIK1hS8AAAAJ", "orcid": ";;;;0009-0003-3695-0243;;", "linkedin": ";;;matthewmatics96;;;", "or_profile": "~Junyoung_Seo1;~Susung_Hong1;~Wooseok_Jang2;~Min-Seop_Kwak1;~Hyeonsu_Kim2;~Doyup_Lee1;~Seungryong_Kim1", "aff": "Korea University;Korea University;Korea University;Korea Advanced Institute of Science & Technology;Korea University;Runway;Korea University", "aff_domain": "korea.ac.kr;korea.ac.kr;korea.ac.kr;kaist.ac.kr;korea.ac.kr;runwayml.com;korea.ac.kr", "position": "PhD student;Undergrad student;MS student;PhD student;Undergrad student;Researcher;Assistant Professor", "bibtex": "@misc{\nseo2024retrievalaugmented,\ntitle={Retrieval-augmented Text-to-3D Generation},\nauthor={Junyoung Seo and Susung Hong and Wooseok Jang and Min-Seop Kwak and Hyeonsu Kim and Doyup Lee and Seungryong Kim},\nyear={2024},\nurl={https://openreview.net/forum?id=9n9q0R9Gyw}\n}", "github": "", "project": "", "reviewers": "aEzM;U742;3ZvE", "site": "https://openreview.net/forum?id=9n9q0R9Gyw", "pdf_size": 18814750, "rating": "5;5;5", "confidence": "5;4;4", "soundness": "2;2;3", "contribution": "2;3;3", "presentation": "2;2;3", "wc_summary": "67;163;97", "wc_strengths": "55;104;51", "wc_weaknesses": "161;658;155", "wc_questions": "43;37;2", "wc_review": "326;962;305", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 5.0, 0.0 ], "confidence_avg": [ 4.333333333333333, 0.4714045207910317 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 109.0, 40.099875311526844 ], "wc_strengths_avg": [ 70.0, 24.097026095903757 ], "wc_weaknesses_avg": [ 324.6666666666667, 235.71498797394185 ], "wc_questions_avg": [ 27.333333333333332, 18.080068829760823 ], "wc_review_avg": [ 531.0, 304.8835843399903 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 3, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:7d0dYifEf7EJ:scholar.google.com/&scioq=Retrieval-augmented+Text-to-3D+Generation&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;0;1;0;2;0", "aff_unique_norm": "Korea University;Korea Advanced Institute of Science and Technology;Runway", "aff_unique_dep": ";;", "aff_unique_url": 
"https://www.korea.ac.kr;https://www.kaist.ac.kr;https://www.runwayml.com", "aff_unique_abbr": "KU;KAIST;Runway", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;1;0", "aff_country_unique": "South Korea;United States" }, { "id": "9nT8ouPui8", "title": "On Memorization in Diffusion Models", "track": "main", "status": "Reject", "tldr": "", "abstract": "Due to their capacity to generate novel and high-quality samples, diffusion models have attracted significant research interest in recent years. Notably, the typical training objective of diffusion models, i.e., denoising score matching, has a closed-form optimal solution that can only generate training-data replicating samples. This indicates that a memorization behavior is theoretically expected, which contradicts the common generalization ability of state-of-the-art diffusion models, and thus calls for a deeper understanding. Looking into this, we first observe that memorization behaviors tend to occur on smaller-sized datasets, which motivates our definition of effective model memorization (EMM), a metric measuring the maximum size of training data at which a model approximates its theoretical optimum. Then, we quantify the impact of the influential factors on these memorization behaviors in terms of EMM, focusing primarily on data distribution, model configuration, and training procedure. Besides comprehensive empirical results identifying the influential factors, we surprisingly find that conditioning training data on uninformative random labels can significantly trigger the memorization in diffusion models. Our study holds practical significance for diffusion model users and offers clues to theoretical research in deep generative models.", "keywords": "Diffusion Models;Memorization", "primary_area": "generative models", "supplementary_material": "/attachment/036527d261d51e762ec07f0af264526133fba1c5.zip", "author": "Xiangming Gu;Chao Du;Tianyu Pang;Chongxuan Li;Min Lin;Ye Wang", "authorids": "~Xiangming_Gu1;~Chao_Du1;~Tianyu_Pang1;~Chongxuan_Li1;~Min_Lin1;~Ye_Wang3", "gender": "M;M;M;M;M;M", "homepage": "https://guxm2021.github.io;https://duchao0726.github.io/;https://p2333.github.io/;http://ml.cs.tsinghua.edu.cn/~chongxuan;https://linmin.me;https://smcnus.comp.nus.edu.sg/", "dblp": "276/5844;75/7523;202/2550;161/9965;;44/6292-7", "google_scholar": "BkxEuIoAAAAJ;QOp7xW0AAAAJ;wYDbtFsAAAAJ;UKMcQn4AAAAJ;BGONmkIAAAAJ;https://scholar.google.com.sg/citations?user=CdgLLL8AAAAJ", "orcid": ";0000-0003-1244-6336;0000-0003-0639-6176;0000-0002-0912-9076;;0000-0002-0123-1260", "linkedin": "xiangming-gu/;duchao/;%E5%A4%A9%E5%AE%87-%E5%BA%9E-b3999017a/;;min-lin-08a3a422/;", "or_profile": "~Xiangming_Gu1;~Chao_Du1;~Tianyu_Pang1;~Chongxuan_Li1;~Min_Lin1;~Ye_Wang3", "aff": "National University of Singapore;Sea AI Lab;Sea AI Lab;Renmin University of China;Sea AI Lab;National University of Singapore", "aff_domain": "nus.edu.sg;sea.com;sea.com;ruc.edu.cn;sea.com;nus.edu.sg", "position": "PhD student;Senior Research Scientist;Senior Research Scientist;Associate Professor;Principal Researcher;Associate Professor", "bibtex": "@misc{\ngu2024on,\ntitle={On Memorization in Diffusion Models},\nauthor={Xiangming Gu and Chao Du and Tianyu Pang and Chongxuan Li and Min Lin and Ye Wang},\nyear={2024},\nurl={https://openreview.net/forum?id=9nT8ouPui8}\n}", "github": "", "project": "", "reviewers": "gEHa;MQLD;sac3;p3eW;QP3y", "site": "https://openreview.net/forum?id=9nT8ouPui8", "pdf_size": 1226281, "rating": "3;5;5;5;6", 
"confidence": "4;4;2;4;3", "soundness": "3;3;2;3;3", "contribution": "1;3;2;2;2", "presentation": "3;4;2;3;3", "wc_summary": "24;74;79;93;100", "wc_strengths": "74;37;51;170;126", "wc_weaknesses": "236;11;101;334;268", "wc_questions": "56;19;98;4;204", "wc_review": "390;141;329;601;698", "wc_reply_reviewers": "0;36;111;0;0", "wc_reply_authors": "856;534;1500;770;1297", "reply_reviewers": "0;1;1;0;0", "reply_authors": "2;2;3;2;2", "rating_avg": [ 4.8, 0.9797958971132712 ], "confidence_avg": [ 3.4, 0.8 ], "soundness_avg": [ 2.8, 0.39999999999999997 ], "contribution_avg": [ 2.0, 0.6324555320336759 ], "presentation_avg": [ 3.0, 0.6324555320336759 ], "wc_summary_avg": [ 74.0, 26.69082239272518 ], "wc_strengths_avg": [ 91.6, 49.53624935337758 ], "wc_weaknesses_avg": [ 190.0, 117.38654096616017 ], "wc_questions_avg": [ 76.2, 71.69490916376141 ], "wc_review_avg": [ 431.8, 198.17709252080573 ], "wc_reply_reviewers_avg": [ 29.4, 43.116586135732035 ], "wc_reply_authors_avg": [ 991.4, 354.5789615868375 ], "reply_reviewers_avg": [ 0.4, 0.48989794855663565 ], "reply_authors_avg": [ 2.2, 0.39999999999999997 ], "replies_avg": [ 22, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.4082482904638631, "gs_citation": 48, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=2503430110501581051&as_sdt=80000005&sciodt=0,23&hl=en", "gs_version_total": 4, "aff_unique_index": "0;1;1;2;1;0", "aff_unique_norm": "National University of Singapore;Sea AI Lab;Renmin University of China", "aff_unique_dep": ";;", "aff_unique_url": "https://www.nus.edu.sg;;http://www.ruc.edu.cn", "aff_unique_abbr": "NUS;;RUC", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;2;0", "aff_country_unique": "Singapore;;China" }, { "id": "9nXgWT12tb", "title": "Correlated Attention in Transformers for Multivariate Time Series", "track": "main", "status": "Reject", "tldr": "", "abstract": "Multivariate time series (MTS) analysis prevail in real-world applications such as finance, climate science and healthcare. The various self-attention mechanisms, the backbone of the state-of-the-art Transformer-based models, efficiently discover the temporal dependencies, yet cannot well capture the intricate cross-correlation between different features of MTS data, which inherently stems from complex dynamical systems in practice. To this end, we propose a novel correlated attention mechanism, which not only efficiently captures feature-wise dependencies, but can also be seamlessly integrated within the encoder blocks of existing well-known Transformers to gain efficiency improvement. In particular, correlated attention operates across feature channels to compute cross-covariance matrices between queries and keys with different lag values, and selectively aggregate representations at the sub-series level. This architecture facilitates automated discovery and representation learning of not only instantaneous but also lagged cross-correlations, while inherently capturing time series auto-correlation. When combined with prevalent Transformer baselines, correlated attention mechanism constitutes a better alternative for encoder-only architectures, which are suitable for a wide range of tasks including imputation, anomaly detection and classification. 
Extensive experiments on the aforementioned tasks consistently underscore the advantages of correlated attention mechanism in enhancing base Transformer models, and demonstrate our state-of-the-art results in imputation, anomaly detection and classification.", "keywords": "Transformer;multivariate time series;deep learning", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/f2e5b20ec68fc0d5845f952195abc8b9ee7348d2.pdf", "author": "Quang Minh Nguyen;Lam M. Nguyen;Subhro Das", "authorids": "~Quang_Minh_Nguyen1;~Lam_M._Nguyen1;~Subhro_Das1", "gender": "M;;", "homepage": ";;", "dblp": ";;", "google_scholar": ";;", "orcid": ";;", "linkedin": "quang-m-nguyen-191122b3/;;", "or_profile": "~Quang_Minh_Nguyen1;~Lam_M._Nguyen1;~Subhro_Das1", "aff": "Massachusetts Institute of Technology;;", "aff_domain": "mit.edu;;", "position": "PhD student;;", "bibtex": "@misc{\nnguyen2024correlated,\ntitle={Correlated Attention in Transformers for Multivariate Time Series},\nauthor={Quang Minh Nguyen and Lam M. Nguyen and Subhro Das},\nyear={2024},\nurl={https://openreview.net/forum?id=9nXgWT12tb}\n}", "github": "", "project": "", "reviewers": "KQRi;rWhs;mjBo;M5Eq", "site": "https://openreview.net/forum?id=9nXgWT12tb", "pdf_size": 749721, "rating": "5;6;6;6", "confidence": "3;2;3;3", "soundness": "2;3;2;3", "contribution": "2;3;1;2", "presentation": "3;3;3;3", "wc_summary": "73;170;16;132", "wc_strengths": "77;270;33;104", "wc_weaknesses": "69;210;111;318", "wc_questions": "427;197;44;82", "wc_review": "646;847;204;636", "wc_reply_reviewers": "89;0;137;20", "wc_reply_authors": "2240;1155;1584;1406", "reply_reviewers": "1;0;1;1", "reply_authors": "7;5;5;6", "rating_avg": [ 5.75, 0.4330127018922193 ], "confidence_avg": [ 2.75, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 97.75, 58.49946580952684 ], "wc_strengths_avg": [ 121.0, 89.6799866190891 ], "wc_weaknesses_avg": [ 177.0, 96.16392254894764 ], "wc_questions_avg": [ 187.5, 149.30924284852563 ], "wc_review_avg": [ 583.25, 234.58194197337525 ], "wc_reply_reviewers_avg": [ 61.5, 54.68317840067456 ], "wc_reply_authors_avg": [ 1596.25, 401.7028597110058 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 5.75, 0.82915619758885 ], "replies_avg": [ 32, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.3333333333333333, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=17876364347666406101&as_sdt=8005&sciodt=0,7&hl=en", "gs_version_total": 3, "aff_unique_index": "0", "aff_unique_norm": "Massachusetts Institute of Technology", "aff_unique_dep": "", "aff_unique_url": "https://web.mit.edu", "aff_unique_abbr": "MIT", "aff_country_unique_index": "0", "aff_country_unique": "United States" }, { "id": "9nddtu94uX", "title": "PlatoLM: Teaching LLMs via a Socratic Questioning User Simulator", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "The unparalleled performance of closed-sourced ChatGPT has sparked efforts towards its democratization, with notable strides made by leveraging real user and ChatGPT conversations, as evidenced by Vicuna. However, due to challenges in gathering conversations involving human participation, current endeavors like Baize and UltraChat aim to automatically generate conversational data. 
They primarily rely on ChatGPT conducting roleplay to simulate human behaviors based on instructions rather than genuine learning from humans, resulting in limited scope, diminished diversity, and an absence of genuine multi-round conversational dynamics. To address the above issues, we target human questions extracted from genuine human-machine conversations as a learning goal and train a user simulator called Socratic to produce a high-quality human-centric synthetic conversation dataset. Subsequently, this dataset was used to train our assistant model, named PlatoLM. PlatoLM achieves the SOTA performance among 7B models (including LLaMA-2-7B-chat and Vicuna-7B) in both Vicuna-Bench and pairwise comparison in MT-Bench; the effectiveness of PlatoLM is also evidenced by manual evaluation.", "keywords": "Large Language Model;User Simulation;Human Computer Interaction", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/65555c22ee2606bad7996d1fe101f345329957b8.zip", "author": "Chuyi Kong;Yaxin FAN;Xiang Wan;Feng Jiang;Benyou Wang", "authorids": "~Chuyi_Kong1;~Yaxin_FAN2;~Xiang_Wan1;~Feng_Jiang4;~Benyou_Wang2", "gender": "Not Specified;M;M;M;M", "homepage": ";https://fanyaxin.top/;http://www.sribd.cn/teacher/28;;https://wabyking.github.io/old.html", "dblp": ";234/9447;;75/1693-7;169/1793", "google_scholar": "w5vcgWYAAAAJ;N0oiLQwAAAAJ;;zrxpiWYAAAAJ;Jk4vJU8AAAAJ", "orcid": ";;;0000-0002-3465-311X;0000-0002-1501-9914", "linkedin": ";;;;", "or_profile": "~Chuyi_Kong1;~Yaxin_FAN2;~Xiang_Wan1;~Feng_Jiang4;~Benyou_Wang2", "aff": "Hong Kong Baptist University;Soochow University;Shenzhen Research Institute of Big Data;The Chinese University of Hong Kong, Shenzhen;The Chinese University of Hong Kong, Shenzhen", "aff_domain": "hkbu.edu.hk;suda.edu.cn;sribd.cn;cuhk.edu.cn;cuhk.edu.cn", "position": "PhD student;PhD student;Principal Researcher;Postdoc;Assistant Professor", "bibtex": "@misc{\nanonymous2024platolm,\ntitle={Plato{LM}: Teaching {LLM}s via a Socratic Questioning User Simulator},\nauthor={Anonymous},\nyear={2024},\nurl={https://openreview.net/forum?id=9nddtu94uX}\n}", "github": "", "project": "", "reviewers": "GXfd;FWRq;Z8HQ;6WiD", "site": "https://openreview.net/forum?id=9nddtu94uX", "pdf_size": 2136631, "rating": "6;6;6;8", "confidence": "5;3;4;3", "soundness": "2;3;2;3", "contribution": "1;3;2;3", "presentation": "3;3;3;3", "wc_summary": "96;81;44;69", "wc_strengths": "14;129;77;104", "wc_weaknesses": "230;113;61;59", "wc_questions": "17;69;244;31", "wc_review": "357;392;426;263", "wc_reply_reviewers": "0;0;27;109", "wc_reply_authors": "822;932;1300;1181", "reply_reviewers": "0;0;1;2", "reply_authors": "2;3;3;4", "rating_avg": [ 6.5, 0.8660254037844386 ], "confidence_avg": [ 3.75, 0.82915619758885 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.25, 0.82915619758885 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 72.5, 19.03286631067428 ], "wc_strengths_avg": [ 81.0, 42.83106349368411 ], "wc_weaknesses_avg": [ 115.75, 69.42396920372674 ], "wc_questions_avg": [ 90.25, 90.78374028426015 ], "wc_review_avg": [ 359.5, 60.82146002851296 ], "wc_reply_reviewers_avg": [ 34.0, 44.68221122549778 ], "wc_reply_authors_avg": [ 1058.75, 190.56675339628367 ], "reply_reviewers_avg": [ 0.75, 0.82915619758885 ], "reply_authors_avg": [ 3.0, 0.7071067811865476 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.5222329678670935, "gs_citation": 4, "gs_cited_by_link": 
"https://scholar.google.com/scholar?cites=7100133306028201699&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 0, "aff_unique_index": "0;1;2;3;3", "aff_unique_norm": "Hong Kong Baptist University;Soochow University;Shenzhen Research Institute of Big Data;Chinese University of Hong Kong", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.hkbu.edu.hk;https://www.soochow.edu.cn;http://www.sribd.cn;https://www.cuhk.edu.cn", "aff_unique_abbr": "HKBU;Soochow U;;CUHK", "aff_campus_unique_index": "0;2;2", "aff_campus_unique": "Hong Kong SAR;;Shenzhen", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "China" }, { "title": "Mastering Symbolic Operations: Augmenting Language Models with Compiled Neural Networks", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19283", "id": "9nsNyN0vox", "author_site": "Yixuan Weng, Minjun Zhu, Fei Xia, Bin Li, Shizhu He, Kang Liu, Jun Zhao", "tldr": "", "abstract": "Language models' (LMs) proficiency in handling deterministic symbolic reasoning and rule-based tasks remains limited due to their dependency implicit learning on textual data. To endow LMs with genuine rule comprehension abilities, we propose \"Neural Comprehension\" - a framework that synergistically integrates compiled neural networks (CoNNs) into the standard transformer architecture. CoNNs are neural modules designed to explicitly encode rules through artificially generated attention weights. By incorporating CoNN modules, the Neural Comprehension framework enables LMs to accurately and robustly execute rule-intensive symbolic tasks. Extensive experiments demonstrate the superiority of our approach over existing techniques in terms of length generalization, efficiency, and interpretability for symbolic operations. Furthermore, it can be applied to LMs across different model scales, outperforming tool-calling methods in arithmetic reasoning tasks while maintaining superior inference efficiency. Our work highlights the potential of seamlessly unifying explicit rule learning via CoNNs and implicit pattern learning in LMs, paving the way for true symbolic comprehension capabilities. 
The code is released at: \\url{https://github.com/wengsyx/Neural-Comprehension}.", "keywords": "Language Models;Compiled Neural Networks;Neural Comprehension;Symbolic Operations;Length Generalization", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/973363d708001b999bd7968b8230071cc264af34.zip", "author": "Yixuan Weng;Minjun Zhu;Fei Xia;Bin Li;Shizhu He;Kang Liu;Jun Zhao", "authorids": "~Yixuan_Weng1;~Minjun_Zhu2;~Fei_Xia4;~Bin_Li14;~Shizhu_He2;~Kang_Liu1;~Jun_Zhao4", "gender": "M;F;M;M;M;M;M", "homepage": "https://wengsyx.github.io/;;https://github.com/Alex0xf;https://libincn.top;https://heshizhu.github.io/;http://www.nlpr.ia.ac.cn/cip/~liukang/index.html;http://nlpr-web.ia.ac.cn/cip/english/~junzhao/index.html", "dblp": "298/8205;271/6029;79/1081;89/6764-83;136/8650;42/4903.html;https://dblp.uni-trier.de/pid/47/2026-1.html", "google_scholar": "O1XsDEMAAAAJ;cm2ub2kAAAAJ;;2ZIBEWgAAAAJ;zBPIt3QAAAAJ;DtZCfl0AAAAJ;https://scholar.google.com.hk/citations?user=HljRttwAAAAJ", "orcid": "0000-0002-9720-8689;;0009-0002-4609-9950;0000-0002-6508-5071;;;", "linkedin": ";;;;;;", "or_profile": "~Yixuan_Weng1;~Minjun_Zhu2;~Fei_Xia4;~Bin_Li14;~Shizhu_He2;~Kang_Liu1;~Jun_Zhao4", "aff": "Institute of Automation, Chinese Academy of Sciences;Westlake University;;Hunan University;Institute of Automation, Chinese Academy of Sciences;Institute of Automation, Chinese Academy of Sciences;Institute of automation, Chinese academy of science", "aff_domain": "ia.ac.cn;westlake.edu;;hnu.edu.cn;ia.ac.cn;ia.ac.cn;nlpr.ia.ac.cn", "position": "MS student;PhD student;;PhD student;Associate Researcher;Professor;Full Professor", "bibtex": "@inproceedings{\nweng2024mastering,\ntitle={Mastering Symbolic Operations: Augmenting Language Models with Compiled Neural Networks},\nauthor={Yixuan Weng and Minjun Zhu and Fei Xia and Bin Li and Shizhu He and Kang Liu and Jun Zhao},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=9nsNyN0vox}\n}", "github": "", "project": "", "reviewers": "68he;uMuv;M9Rq;NkHa", "pdf_size": 2344693, "rating": "5;6;6;8", "confidence": "3;4;3;4", "soundness": "3;3;3;3", "contribution": "3;3;2;3", "presentation": "2;2;2;3", "wc_summary": "77;140;105;72", "wc_strengths": "97;80;42;81", "wc_weaknesses": "75;166;161;40", "wc_questions": "153;2;2;106", "wc_review": "402;388;310;299", "wc_reply_reviewers": "0;0;47;33", "wc_reply_authors": "1336;1673;1819;1165", "reply_reviewers": "0;0;1;1", "reply_authors": "3;3;4;3", "rating_avg": [ 6.25, 1.0897247358851685 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 98.5, 27.060118255469618 ], "wc_strengths_avg": [ 75.0, 20.211382931407737 ], "wc_weaknesses_avg": [ 110.5, 54.45410911951457 ], "wc_questions_avg": [ 65.75, 65.88009942311866 ], "wc_review_avg": [ 349.75, 45.68574723039998 ], "wc_reply_reviewers_avg": [ 20.0, 20.603397778036516 ], "wc_reply_authors_avg": [ 1498.25, 260.19163610692794 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 3.25, 0.4330127018922193 ], "replies_avg": [ 22, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": 0.6882472016116854, "gs_citation": 5, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11908960632930766199&as_sdt=400005&sciodt=0,14&hl=en", "gs_version_total": 5, "openreview": 
"https://openreview.net/forum?id=9nsNyN0vox", "pdf": "https://openreview.net/pdf?id=9nsNyN0vox", "email": "ia.ac.cn;westlake.edu;;hnu.edu.cn;ia.ac.cn;ia.ac.cn;nlpr.ia.ac.cn", "author_num": 7, "aff_unique_index": "0;1;2;0;0;0", "aff_unique_norm": "Chinese Academy of Sciences;Westlake University;Hunan University", "aff_unique_dep": "Institute of Automation;;", "aff_unique_url": "http://www.ia.cas.cn;https://www.westlake.edu.cn;http://www.hunu.edu.cn/", "aff_unique_abbr": "CAS;WU;HNU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "China" }, { "id": "9o7KuFcsps", "title": "Unified Anomaly Detection via Multi-Scale Contrasted Memory", "track": "main", "status": "Reject", "tldr": "", "abstract": "Deep anomaly detection (AD) aims to provide robust and efficient classifiers for one-class (OC) and outlier-exposure (OE) settings. However current models still struggle on edge-case normal samples and are often unable to keep high performance over different scales of anomalies. Additionally, there is a lack of a unified framework that efficiently addresses both OC and OE settings. To address these limitations, we present a novel two-stage method which leverages multi-scale normal prototypes during training to compute an anomaly deviation score. First, we employ a novel memory-augmented contrastive learning (CL) to jointly learn representations and memory modules across multiple scales. This allows us to effectively capture subtle features of normal data while adapting to varying levels of anomaly complexity.\nThen, we train an efficient anomaly distance-based detector that computes spatial deviation maps between the learned prototypes and incoming observations.\nOur model outperforms the state-of-the-art on a wide range of anomalies, including object, style, and local anomalies, as well as face presentation attacks. 
Notably, it stands as the first model capable of maintaining exceptional performance across both OC and OE settings.", "keywords": "anomaly detection;self-supervised learning;unbalanced outlier-exposure;hopfield memory", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/36e1233ea52b1e5835a2a33d2cc49fa24bbc71d5.pdf", "author": "Lo\u00efc J\u00e9z\u00e9quel;Ngoc-Son Vu;Jean Beaudet;Aymeric Histace", "authorids": "~Lo\u00efc_J\u00e9z\u00e9quel1;~Ngoc-Son_Vu2;~Jean_Beaudet1;~Aymeric_Histace1", "gender": "M;M;;M", "homepage": ";;;https://aymeric.histace.free.fr", "dblp": "290/7143;11/8109;;72/6341", "google_scholar": "sq4F5egAAAAJ;Fw14qXwAAAAJ;;https://scholar.google.fr/citations?user=y0MU8CAAAAAJ", "orcid": "0000-0002-4896-0081;;;", "linkedin": ";;;", "or_profile": "~Lo\u00efc_J\u00e9z\u00e9quel1;~Ngoc-Son_Vu2;~Jean_Beaudet1;~Aymeric_Histace1", "aff": "Ecole Nationale Sup\u00e9rieure de l'Electronique et de ses Applications;Ecole Nationale Sup\u00e9rieure de l'Electronique et de ses Applications;;ETIS", "aff_domain": "ensea.fr;ensea.fr;;ensea.fr", "position": "PhD student;Associate Professor;;Full Professor", "bibtex": "@misc{\nj{\\'e}z{\\'e}quel2024unified,\ntitle={Unified Anomaly Detection via Multi-Scale Contrasted Memory},\nauthor={Lo{\\\"\\i}c J{\\'e}z{\\'e}quel and Ngoc-Son Vu and Jean Beaudet and Aymeric Histace},\nyear={2024},\nurl={https://openreview.net/forum?id=9o7KuFcsps}\n}", "github": "", "project": "", "reviewers": "t6Z1;9JQe;xRL9", "site": "https://openreview.net/forum?id=9o7KuFcsps", "pdf_size": 1108844, "rating": "5;5;6", "confidence": "5;4;3", "soundness": "2;2;3", "contribution": "2;2;2", "presentation": "3;2;3", "wc_summary": "89;88;100", "wc_strengths": "35;103;69", "wc_weaknesses": "315;501;72", "wc_questions": "116;8;72", "wc_review": "555;700;313", "wc_reply_reviewers": "29;0;14", "wc_reply_authors": "1167;1411;677", "reply_reviewers": "1;0;1", "reply_authors": "2;3;1", "rating_avg": [ 5.333333333333333, 0.4714045207910317 ], "confidence_avg": [ 4.0, 0.816496580927726 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 92.33333333333333, 5.436502143433363 ], "wc_strengths_avg": [ 69.0, 27.760883751542686 ], "wc_weaknesses_avg": [ 296.0, 175.65306715227035 ], "wc_questions_avg": [ 65.33333333333333, 44.34210439550904 ], "wc_review_avg": [ 522.6666666666666, 159.63778444410403 ], "wc_reply_reviewers_avg": [ 14.333333333333334, 11.841546445554407 ], "wc_reply_authors_avg": [ 1085.0, 305.21249428335443 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 2.0, 0.816496580927726 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.8660254037844385, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:yUIhXttEPQcJ:scholar.google.com/&scioq=Unified+Anomaly+Detection+via+Multi-Scale+Contrasted+Memory&hl=en&as_sdt=0,44", "gs_version_total": 0, "aff_unique_index": "0;0;1", "aff_unique_norm": "Ecole Nationale Sup\u00e9rieure de l'Electronique et de ses Applications;ETIS", "aff_unique_dep": ";", "aff_unique_url": "https://www.enssea.fr;", "aff_unique_abbr": "ENSEA;", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "France;" }, { "title": "Video Language Planning", "status": "Poster", "track": 
"main", "site": "https://iclr.cc/virtual/2024/poster/19282", "id": "9pKtcJcMP3", "author_site": "Yilun Du, Sherry Yang, Pete Florence, Fei Xia, Ayzaan Wahid, brian ichter, Pierre Sermanet, Tianhe Yu, Pieter Abbeel, Joshua B Tenenbaum, Leslie Kaelbling, Andy Zeng, Jonathan Tompson", "tldr": "", "abstract": "We are interested in enabling visual planning for complex long-horizon tasks in the space of generated videos and language, leveraging recent advances in large generative models pretrained on Internet-scale data. To this end, we present video language planning (VLP), an algorithm that consists of a tree search procedure, where we train (i) vision-language models to serve as both policies and value functions, and (ii) text-to-video models as dynamics models. VLP takes as input a long-horizon task instruction and current image observation, and outputs a long video plan that provides detailed multimodal (video and language) specifications that describe how to complete the final task. VLP scales with increasing computation budget where more computation time results in improved video plans, and is able to synthesize long-horizon video plans across different robotics domains -- from multi-object rearrangement, to multi-camera bi-arm dexterous manipulation. Generated video plans can be translated into real robot actions via goal-conditioned policies, conditioned on each intermediate frame of the generated video. Experiments show that VLP substantially improves long-horizon task success rates compared to prior methods on both simulated and real robots (across 3 hardware platforms).", "keywords": "Planning;Hierarchical Planning;Language Models;Video Models;Long-Horizon Planning", "primary_area": "applications to robotics, autonomy, planning", "supplementary_material": "", "author": "Yilun Du;Sherry Yang;Pete Florence;Fei Xia;Ayzaan Wahid;brian ichter;Pierre Sermanet;Tianhe Yu;Pieter Abbeel;Joshua B. 
Tenenbaum;Leslie Pack Kaelbling;Andy Zeng;Jonathan Tompson", "authorids": "~Yilun_Du1;~Sherry_Yang1;~Pete_Florence1;~Fei_Xia1;~Ayzaan_Wahid1;~brian_ichter1;~Pierre_Sermanet1;~Tianhe_Yu1;~Pieter_Abbeel2;~Joshua_B._Tenenbaum1;~Leslie_Pack_Kaelbling1;~Andy_Zeng3;~Jonathan_Tompson1", "gender": ";F;;M;M;;;M;M;;F;M;M", "homepage": "https://yilundu.github.io;https://sherryy.github.io;http://www.peteflorence.com/;;https://ayzaan.com;;https://sermanet.github.io/;https://cs.stanford.edu/~tianheyu/;https://people.eecs.berkeley.edu/~pabbeel/;;http://people.csail.mit.edu/lpk/;http://jonathantompson.com;http://andyzeng.github.io/", "dblp": "204/4379;;;;;;28/6457;192/1797;;t/JoshuaBTenenbaum;k/LesliePackKaelbling;139/0769;http://dblp.uni-trier.de/pers/hd/z/Zeng:Andy", "google_scholar": ";7c1B_fIAAAAJ;;pqP5_PgAAAAJ;;-w5DuHgAAAAJ;0nPi5YYAAAAJ;;https://scholar.google.com.tw/citations?user=vtwH6GkAAAAJ;;IcasIiwAAAAJ;U_Jw8DUAAAAJ;q7nFtUcAAAAJ", "orcid": ";;;0000-0003-4343-1444;;;;;;;0000-0001-6054-7145;;", "linkedin": ";;;;;;sermanet/;;;;;;", "or_profile": "~Yilun_Du1;~Sherry_Yang1;~Pete_Florence1;~Fei_Xia1;~Ayzaan_Wahid1;~brian_ichter1;~Pierre_Sermanet1;~Tianhe_Yu1;~Pieter_Abbeel2;~Joshua_B._Tenenbaum1;~Leslie_Pack_Kaelbling1;~Jonathan_Tompson1;~Andy_Zeng1", "aff": "Massachusetts Institute of Technology;University of California, Berkeley;Google;Google;Robotics at Google;Google;Google;Google Brain;Covariant;Massachusetts Institute of Technology;Massachusetts Institute of Technology;Google DeepMind;Google", "aff_domain": "mit.edu;berkeley.edu;google.com;google.com;google.com;google.com;google.com;google.com;covariant.ai;mit.edu;mit.edu;google.com;google.com", "position": "PhD student;Student;Research Scientist;Researcher;Software Engineer;Research Scientist;Research Scientist;Research Scientist;Founder;Professor;Full Professor;Researcher;Research Scientist", "bibtex": "@inproceedings{\ndu2024video,\ntitle={Video Language Planning},\nauthor={Yilun Du and Sherry Yang and Pete Florence and Fei Xia and Ayzaan Wahid and brian ichter and Pierre Sermanet and Tianhe Yu and Pieter Abbeel and Joshua B. 
Tenenbaum and Leslie Pack Kaelbling and Andy Zeng and Jonathan Tompson},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=9pKtcJcMP3}\n}", "github": "", "project": "", "reviewers": "AYpb;MAiq;4qts;uBLi", "pdf_size": 5468375, "rating": "6;6;8;8", "confidence": "4;4;3;3", "soundness": "2;2;3;3", "contribution": "2;3;4;3", "presentation": "3;4;3;4", "wc_summary": "73;93;83;135", "wc_strengths": "20;66;126;119", "wc_weaknesses": "353;91;88;147", "wc_questions": "70;22;280;137", "wc_review": "516;272;577;538", "wc_reply_reviewers": "274;0;34;0", "wc_reply_authors": "850;367;407;403", "reply_reviewers": "1;0;1;0", "reply_authors": "2;1;1;1", "rating_avg": [ 7.0, 1.0 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 3.0, 0.7071067811865476 ], "presentation_avg": [ 3.5, 0.5 ], "wc_summary_avg": [ 96.0, 23.600847442411894 ], "wc_strengths_avg": [ 82.75, 43.01961761801237 ], "wc_weaknesses_avg": [ 169.75, 108.37752303868179 ], "wc_questions_avg": [ 127.25, 97.18892683840068 ], "wc_review_avg": [ 475.75, 119.64609270678253 ], "wc_reply_reviewers_avg": [ 77.0, 114.58184847522752 ], "wc_reply_authors_avg": [ 506.75, 198.78678904796465 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 13, 0 ], "corr_rating_confidence": -1.0, "gs_citation": -1, "gs_cited_by_link": "", "gs_version_total": -1, "openreview": "https://openreview.net/forum?id=9pKtcJcMP3", "pdf": "https://openreview.net/pdf?id=9pKtcJcMP3", "email": "mit.edu;berkeley.edu;google.com;google.com;google.com;google.com;google.com;google.com;covariant.ai;mit.edu;mit.edu;google.com;google.com", "author_num": 13, "aff_unique_index": "0;1;2;2;2;2;2;2;3;0;0;2;2", "aff_unique_norm": "Massachusetts Institute of Technology;University of California, Berkeley;Google;Covariant", "aff_unique_dep": ";;Google;", "aff_unique_url": "https://web.mit.edu;https://www.berkeley.edu;https://www.google.com;", "aff_unique_abbr": "MIT;UC Berkeley;Google;", "aff_campus_unique_index": "1;2;2;2;2;2;2;2", "aff_campus_unique": ";Berkeley;Mountain View", "aff_country_unique_index": "0;0;0;0;0;0;0;0;0;0;2;0", "aff_country_unique": "United States;;United Kingdom" }, { "id": "9pe38WpsbX", "title": "MuDreamer: Learning Predictive World Models without Reconstruction", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "The DreamerV3 agent recently demonstrated state-of-the-art performance in diverse domains, learning powerful world models in latent space using a pixel reconstruction loss. However, while the reconstruction loss is essential to Dreamer's performance, it also necessitates modeling unnecessary information. Consequently, Dreamer sometimes fails to perceive crucial elements which are necessary for task-solving, significantly limiting its potential. In this paper, we present MuDreamer, a reinforcement learning agent that builds upon the DreamerV3 algorithm by learning a predictive world model without the need for reconstructing input signals. Rather than relying on pixel reconstruction, hidden representations are instead learned by predicting the environment value function and previously selected actions. Similar to predictive self-supervised methods for images, we find that the use of batch normalization is crucial to prevent learning collapse. 
We also study the effect of KL balancing between model posterior and prior losses on convergence speed and learning stability. We evaluate MuDreamer on the widely used DeepMind Visual Control Suite and achieves performance comparable to DreamerV3. MuDreamer also demonstrates promising results on the Atari100k benchmark. Research code will be made available publicly.", "keywords": "Model-Based Reinforcement Learning;Dreamer;Reconstruction-Free", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/c218d7d4916d4f567814e4bbc29379c6061b3190.pdf", "author": "Maxime Burchi;Radu Timofte", "authorids": "~Maxime_Burchi1;~Radu_Timofte1", "gender": ";M", "homepage": "https://burchim.github.io/;https://www.informatik.uni-wuerzburg.de/computervision/", "dblp": "302/0270;24/8616", "google_scholar": "7S_l2eAAAAAJ;https://scholar.google.ch/citations?user=u3MwH5kAAAAJ", "orcid": ";0000-0002-1478-0402", "linkedin": ";https://ch.linkedin.com/in/radutimofte", "or_profile": "~Maxime_Burchi1;~Radu_Timofte1", "aff": "Bayerische Julius-Maximilians-Universit\u00e4t W\u00fcrzburg;Bayerische Julius-Maximilians-Universit\u00e4t W\u00fcrzburg", "aff_domain": "uni-wuerzburg.de;uni-wuerzburg.de", "position": "PhD student;Full Professor", "bibtex": "@misc{\nburchi2024mudreamer,\ntitle={MuDreamer: Learning Predictive World Models without Reconstruction},\nauthor={Maxime Burchi and Radu Timofte},\nyear={2024},\nurl={https://openreview.net/forum?id=9pe38WpsbX}\n}", "github": "", "project": "", "reviewers": "QumB;5xED;8AeP", "site": "https://openreview.net/forum?id=9pe38WpsbX", "pdf_size": 3319017, "rating": "3;5;5", "confidence": "5;3;4", "soundness": "2;3;3", "contribution": "2;2;1", "presentation": "2;3;4", "wc_summary": "65;60;85", "wc_strengths": "58;34;76", "wc_weaknesses": "168;224;217", "wc_questions": "17;5;159", "wc_review": "308;323;537", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "282;615;593", "reply_reviewers": "0;0;0", "reply_authors": "1;1;1", "rating_avg": [ 4.333333333333333, 0.9428090415820634 ], "confidence_avg": [ 4.0, 0.816496580927726 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 1.6666666666666667, 0.4714045207910317 ], "presentation_avg": [ 3.0, 0.816496580927726 ], "wc_summary_avg": [ 70.0, 10.801234497346433 ], "wc_strengths_avg": [ 56.0, 17.204650534085253 ], "wc_weaknesses_avg": [ 203.0, 24.91318258807306 ], "wc_questions_avg": [ 60.333333333333336, 69.93965653015144 ], "wc_review_avg": [ 389.3333333333333, 104.59551721857979 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 496.6666666666667, 152.05773757213265 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 7, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.8660254037844385, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=7866069089508150540&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "aff_unique_index": "0;0", "aff_unique_norm": "University of W\u00fcrzburg", "aff_unique_dep": "", "aff_unique_url": "https://www.uni-wuerzburg.de", "aff_unique_abbr": "JMU", "aff_campus_unique_index": "0;0", "aff_campus_unique": "W\u00fcrzburg", "aff_country_unique_index": "0;0", "aff_country_unique": "Germany" }, { "id": "9qtswuW5ux", "title": "Unsupervised graph neural networks with recurrent features for solving combinatorial optimization problems", "track": "main", "status": "Reject", "tldr": "", "abstract": "In recent years, graph neural networks (GNNs) have gained 
considerable attention as a promising approach to tackle combinatorial optimization problems.\nWe introduce a novel algorithm, dubbed QRF-GNN in the following, that leverages the power of GNNs to efficiently solve combinatorial problems which have quadratic unconstrained binary optimization (QUBO) formulation.\nIt relies on unsupervised learning and minimizes the loss function derived from QUBO relaxation.\nThe key components of the architecture are the recurrent use of intermediate GNN predictions, parallel convolutional layers and combination of artificial node features as input.\nThe performance of the algorithm was evaluated on benchmark datasets for maximum cut and graph coloring problems.\nResults of experiments show that QRF-GNN surpasses existing graph neural network based approaches and is comparable to the state-of-the-art conventional heuristics.", "keywords": "graph neural networks;combinatorial optimization;recurrent neural networks;maximum cut problem;graph coloring problem", "primary_area": "learning on graphs and other geometries & topologies", "supplementary_material": "", "author": "Daria Pugacheva;Yuriy Zotov;Andrei Ermakov;Igor Lyskov", "authorids": "~Daria_Pugacheva1;~Yuriy_Zotov1;~Andrei_Ermakov1;~Igor_Lyskov1", "gender": "F;M;M;M", "homepage": ";;;", "dblp": "383/6092;;;", "google_scholar": "https://scholar.google.ru/citations?hl=ru;;;", "orcid": "0000-0002-4285-1001;;;0000-0002-6111-2060", "linkedin": ";https://linkedin.com/in/yura-zotov-75a84193/;andrey-ermakov-8a2848202;", "or_profile": "~Daria_Pugacheva1;~Yuriy_Zotov1;~Andrei_Ermakov1;~Igor_Lyskov1", "aff": "AIRI;;National Research University Higher School of Economics;", "aff_domain": "airi.net;;edu.hse;", "position": "Researcher;;MS student;", "bibtex": "@misc{\npugacheva2024unsupervised,\ntitle={Unsupervised graph neural networks with recurrent features for solving combinatorial optimization problems},\nauthor={Daria Pugacheva and Yuriy Zotov and Andrei Ermakov and Igor Lyskov},\nyear={2024},\nurl={https://openreview.net/forum?id=9qtswuW5ux}\n}", "github": "", "project": "", "reviewers": "VZaD;oXir;vpKg;Nnir", "site": "https://openreview.net/forum?id=9qtswuW5ux", "pdf_size": 689549, "rating": "3;3;5;6", "confidence": "4;4;2;2", "soundness": "2;2;3;2", "contribution": "2;2;2;2", "presentation": "2;3;3;2", "wc_summary": "101;31;73;54", "wc_strengths": "40;37;42;78", "wc_weaknesses": "219;94;4;21", "wc_questions": "230;5;192;13", "wc_review": "590;167;311;166", "wc_reply_reviewers": "111;107;192;18", "wc_reply_authors": "2789;887;1153;204", "reply_reviewers": "1;1;2;1", "reply_authors": "6;3;2;2", "rating_avg": [ 4.25, 1.299038105676658 ], "confidence_avg": [ 3.0, 1.0 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 64.75, 25.674647027758727 ], "wc_strengths_avg": [ 49.25, 16.69393602479655 ], "wc_weaknesses_avg": [ 84.5, 84.69504117715512 ], "wc_questions_avg": [ 110.0, 101.92889678594584 ], "wc_review_avg": [ 308.5, 172.89953730418137 ], "wc_reply_reviewers_avg": [ 107.0, 61.567036634874675 ], "wc_reply_authors_avg": [ 1258.25, 949.1499815624504 ], "reply_reviewers_avg": [ 1.25, 0.4330127018922193 ], "reply_authors_avg": [ 3.25, 1.6393596310755 ], "replies_avg": [ 26, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.9622504486493761, "gs_citation": 0, "gs_cited_by_link": 
"https://scholar.google.com/scholar?q=related:OND0PEK0xVIJ:scholar.google.com/&scioq=Unsupervised+graph+neural+networks+with+recurrent+features+for+solving+combinatorial+optimization+problems&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;1", "aff_unique_norm": "Artificial Intelligence Research Institute;National Research University Higher School of Economics", "aff_unique_dep": ";", "aff_unique_url": "https://www.airi.jp;https://hse.ru", "aff_unique_abbr": "AIRI;HSE", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1", "aff_country_unique": "Japan;Russian Federation" }, { "title": "Domain-Agnostic Molecular Generation with Chemical Feedback", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19281", "id": "9rPyHyjfwP", "author_site": "Yin Fang, Ningyu Zhang, Zhuo Chen, Lingbing Guo, Xiaohui Fan, Huajun Chen", "tldr": "", "abstract": "The generation of molecules with desired properties has become increasingly popular, revolutionizing the way scientists design molecular structures and providing valuable support for chemical and drug design. However, despite the potential of language models in molecule generation, they face challenges such as generating syntactically or chemically flawed molecules, having narrow domain focus, and struggling to create diverse and feasible molecules due to limited annotated data or external molecular databases.\nTo tackle these challenges, we introduce MolGen, a pre-trained molecular language model tailored specifically for molecule generation. Through the reconstruction of over 100 million molecular SELFIES, MolGen internalizes structural and grammatical insights. This is further enhanced by domain-agnostic molecular prefix tuning, fostering robust knowledge transfer across diverse domains. Importantly, our chemical feedback paradigm steers the model away from \"molecular hallucinations\", ensuring alignment between the model's estimated probabilities and real-world chemical preferences. Extensive experiments on well-known benchmarks underscore MolGen's optimization capabilities in properties such as penalized logP, QED, and molecular docking. 
Additional analyses confirm its proficiency in accurately capturing molecule distributions, discerning intricate structural patterns, and efficiently exploring the chemical space (https://github.com/zjunlp/MolGen).", "keywords": "molecule generation;pre-trained language models;SELFIES;natural products;self-feedback", "primary_area": "applications to physical sciences (physics, chemistry, biology, etc.)", "supplementary_material": "/attachment/3227006229cb78a850fdd90e59f6767a967b5a45.zip", "author": "Yin Fang;Ningyu Zhang;Zhuo Chen;Lingbing Guo;Xiaohui Fan;Huajun Chen", "authorids": "~Yin_Fang1;~Ningyu_Zhang1;~Zhuo_Chen3;~Lingbing_Guo1;~Xiaohui_Fan1;~Huajun_Chen1", "gender": "F;M;;M;;M", "homepage": "https://github.com/Fangyinfff;https://person.zju.edu.cn/en/ningyu;;https://guolingbing.github.io/;https://person.zju.edu.cn/en/fanxh;", "dblp": "231/7716;139/4181-1.html;;228/2586;133/8797;94/5089", "google_scholar": "4rWspjsAAAAJ;xQDOPvsAAAAJ;;og4v8cMAAAAJ;;", "orcid": "0000-0001-9538-848X;0000-0002-1970-0678;;;0000-0002-6336-3007;", "linkedin": ";ningyuzhang/;;;;", "or_profile": "~Yin_Fang1;~Ningyu_Zhang1;~Zhuo_Chen3;~Lingbing_Guo1;~Xiaohui_Fan1;~Huajun_Chen1", "aff": "Zhejiang University;Zhejiang University;;Zhejiang University;Zhejiang University;Zhejiang University", "aff_domain": "zju.edu.cn;zju.edu.cn;;zju.edu.cn;zju.edu.cn;zju.edu.cn", "position": "PhD student;Associate Professor;;PhD student;Full Professor;Full Professor", "bibtex": "@inproceedings{\nfang2024domainagnostic,\ntitle={Domain-Agnostic Molecular Generation with Chemical Feedback},\nauthor={Yin Fang and Ningyu Zhang and Zhuo Chen and Lingbing Guo and Xiaohui Fan and Huajun Chen},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=9rPyHyjfwP}\n}", "github": "", "project": "", "reviewers": "Hnvb;Vj81;13gf;A1g6", "pdf_size": 9422963, "rating": "6;6;8;8", "confidence": "4;4;4;4", "soundness": "2;2;3;3", "contribution": "2;2;3;3", "presentation": "1;3;3;3", "wc_summary": "80;63;91;116", "wc_strengths": "28;67;35;89", "wc_weaknesses": "578;143;256;11", "wc_questions": "23;145;107;2", "wc_review": "709;418;489;218", "wc_reply_reviewers": "157;14;20;0", "wc_reply_authors": "1266;838;932;113", "reply_reviewers": "2;1;1;0", "reply_authors": "4;3;3;1", "rating_avg": [ 7.0, 1.0 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.5, 0.8660254037844386 ], "wc_summary_avg": [ 87.5, 19.241881404893856 ], "wc_strengths_avg": [ 54.75, 24.641174890820444 ], "wc_weaknesses_avg": [ 247.0, 209.8535203421663 ], "wc_questions_avg": [ 69.25, 58.789348525051714 ], "wc_review_avg": [ 458.5, 175.47150765865095 ], "wc_reply_reviewers_avg": [ 47.75, 63.49163330707441 ], "wc_reply_authors_avg": [ 787.25, 420.51835572302906 ], "reply_reviewers_avg": [ 1.0, 0.7071067811865476 ], "reply_authors_avg": [ 2.75, 1.0897247358851685 ], "replies_avg": [ 23, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 16, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=4693474697199891995&as_sdt=4005&sciodt=0,6&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=9rPyHyjfwP", "pdf": "https://openreview.net/pdf?id=9rPyHyjfwP", "email": "zju.edu.cn;zju.edu.cn;;zju.edu.cn;zju.edu.cn;zju.edu.cn", "author_num": 6, "aff_unique_index": "0;0;0;0;0", "aff_unique_norm": "Zhejiang University", "aff_unique_dep": "", "aff_unique_url": "https://www.zju.edu.cn", 
"aff_unique_abbr": "ZJU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "China" }, { "id": "9rV9cp7KRH", "title": "Incentivized Collaborative Learning: Architectural Design and Insights", "track": "main", "status": "Reject", "tldr": "", "abstract": "Collaborations among various entities, such as companies, research labs, AI agents, and edge devices, have become increasingly crucial for achieving machine learning tasks that cannot be accomplished by a single entity alone. This is likely due to factors such as security constraints, privacy concerns, and limitations in computation resources. As a result, collaborative learning (CL) research has been gaining momentum. However, a significant challenge in practical applications of CL is how to effectively incentivize multiple entities to collaborate before any collaboration occurs. In this study, we propose ICL, an architectural framework for incentivized collaborative learning, and provide insights into the critical issue of when and why incentives can improve collaboration performance. Then, we apply the concepts of ICL to specific use cases in federated learning, assisted learning, and multi-armed bandit, corroborated with both theoretical and experimental results.", "keywords": "collaborative learning;incentive;modeling", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/7704433bb6b4da5ea843eae61b49570b845eac49.zip", "author": "Xinran Wang;Qi Le;Ahmad Faraz Khan;Jie Ding;Ali Anwar", "authorids": "~Xinran_Wang3;~Qi_Le1;~Ahmad_Faraz_Khan1;~Jie_Ding2;~Ali_Anwar1", "gender": "F;M;M;M;M", "homepage": "https://wang8740.github.io;https://www.linkedin.com/in/qi-le-60a8811a0/;https://afkd98.github.io/;http://jding.org;https://chalianwar.github.io/", "dblp": ";;;94/1825-2;69/9027-1", "google_scholar": "u8gID6EAAAAJ;;VjGylKsAAAAJ;ZyqvoqcAAAAJ;o3eOVbgAAAAJ", "orcid": ";;0009-0009-3867-5656;;", "linkedin": "wang-xinran;;ahmadfarazkhandurrani/;;", "or_profile": "~Xinran_Wang3;~Qi_Le1;~Ahmad_Faraz_Khan1;~Jie_Ding2;~Ali_Anwar1", "aff": "University of Minnesota - Twin Cities;University of Minnesota - Twin Cities;Virginia Polytechnic Institute and State University;University of Minnesota - Twin Cities;University of Minnesota", "aff_domain": "umn.edu;umn.edu;vt.edu;umn.edu;umn.edu", "position": "PhD student;PhD student;PhD student;Associate Professor;Assistant Professor", "bibtex": "@misc{\nwang2024incentivized,\ntitle={Incentivized Collaborative Learning: Architectural Design and Insights},\nauthor={Xinran Wang and Qi Le and Ahmad Faraz Khan and Jie Ding and Ali Anwar},\nyear={2024},\nurl={https://openreview.net/forum?id=9rV9cp7KRH}\n}", "github": "", "project": "", "reviewers": "npuS;R699;cras", "site": "https://openreview.net/forum?id=9rV9cp7KRH", "pdf_size": 9443415, "rating": "3;5;5", "confidence": "4;4;4", "soundness": "2;3;2", "contribution": "2;2;2", "presentation": "2;2;1", "wc_summary": "96;99;76", "wc_strengths": "77;67;59", "wc_weaknesses": "355;52;153", "wc_questions": "3;562;39", "wc_review": "531;780;327", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "917;1837;537", "reply_reviewers": "0;0;0", "reply_authors": "2;3;1", "rating_avg": [ 4.333333333333333, 0.9428090415820634 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 1.6666666666666667, 0.4714045207910317 ], "wc_summary_avg": [ 90.33333333333333, 
10.208928554075703 ], "wc_strengths_avg": [ 67.66666666666667, 7.363574011458175 ], "wc_weaknesses_avg": [ 186.66666666666666, 125.96913202138936 ], "wc_questions_avg": [ 201.33333333333334, 255.4529745808849 ], "wc_review_avg": [ 546.0, 185.24038436582882 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 1097.0, 545.7716250105594 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 2.0, 0.816496580927726 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:z3pPZleR0L8J:scholar.google.com/&scioq=Incentivized+Collaborative+Learning:+Architectural+Design+and+Insights&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;1;0;0", "aff_unique_norm": "University of Minnesota;Virginia Tech", "aff_unique_dep": ";", "aff_unique_url": "https://www.minnesota.edu;https://www.vt.edu", "aff_unique_abbr": "UMN;VT", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Twin Cities;", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "9rXBGpLMxV", "title": "xMLP: Revolutionizing Private Inference with Exclusive Square Activation", "track": "main", "status": "Reject", "tldr": "", "abstract": "Private Inference (PI) enables deep neural networks (DNNs) to work on private data without leaking sensitive information by exploiting cryptographic primitives such as multi-party computation (MPC) and homomorphic encryption (HE).\nHowever, the use of non-linear activations such as ReLU in DNNs can lead to impractically high PI latency in existing PI systems, as ReLU requires the use of costly MPC computations, such as Garbled Circuits.\nSince square activations can be processed by Beaver's triples hundreds of times faster compared to ReLU, they are more friendly to PI tasks, but using them leads to a notable drop in model accuracy.\nThis paper starts by exploring the reason for such an accuracy drop after using square activations, and concludes that this is due to an ``information compounding\u2019\u2019 effect. Leveraging this insight, we propose xMLP, a novel DNN architecture that uses square activations exclusively while maintaining parity in both accuracy and efficiency with ReLU-based DNNs. \nOur experiments on CIFAR-100 and ImageNet show that xMLP models consistently achieve better performance than ResNet models with fewer activation layers and parameters while maintaining consistent performance with its ReLU-based variants.\nRemarkably, when compared to state-of-the-art PI Models, xMLP demonstrates superior performance, achieving a 0.58\\% increase in accuracy with 7$\\times$ faster PI speed. 
Moreover, it delivers a significant accuracy improvement of 4.96\\% while maintaining the same PI latency.\nWhen offloading PI to the GPU, xMLP is up to 700$\\times$ faster than the previous state-of-the-art PI model with comparable accuracy.", "keywords": "Privacy Preserving Machine Learning;Private Inference;Multi-Party Computation;Deep Learning", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "Jiajie Li;Jinjun Xiong", "authorids": "~Jiajie_Li2;~Jinjun_Xiong1", "gender": "M;", "homepage": "https://jiajie.li;https://www.xlab-ub.com", "dblp": ";81/1130", "google_scholar": "oMCzOmoAAAAJ;tRt1xPYAAAAJ", "orcid": ";0000-0002-2620-4859", "linkedin": "li-jia-jie/;jinjun-xiong-314774/", "or_profile": "~Jiajie_Li2;~Jinjun_Xiong1", "aff": "State University of New York at Buffalo;State University of New York at Buffalo", "aff_domain": "buffalo.edu;buffalo.edu", "position": "PhD student;Professor", "bibtex": "@misc{\nli2024xmlp,\ntitle={x{MLP}: Revolutionizing Private Inference with Exclusive Square Activation},\nauthor={Jiajie Li and Jinjun Xiong},\nyear={2024},\nurl={https://openreview.net/forum?id=9rXBGpLMxV}\n}", "github": "", "project": "", "reviewers": "Bz3S;9z1L;gNjC;TxCL", "site": "https://openreview.net/forum?id=9rXBGpLMxV", "pdf_size": 758534, "rating": "3;3;5;5", "confidence": "5;5;3;4", "soundness": "2;3;2;2", "contribution": "2;2;2;1", "presentation": "3;3;3;3", "wc_summary": "52;71;100;38", "wc_strengths": "11;111;89;25", "wc_weaknesses": "260;600;70;119", "wc_questions": "5;42;3;46", "wc_review": "328;824;262;228", "wc_reply_reviewers": "93;170;114;0", "wc_reply_authors": "314;722;356;372", "reply_reviewers": "1;1;2;0", "reply_authors": "2;2;3;1", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 4.25, 0.82915619758885 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 65.25, 23.23117517475171 ], "wc_strengths_avg": [ 59.0, 42.02380277890139 ], "wc_weaknesses_avg": [ 262.25, 207.0994628191971 ], "wc_questions_avg": [ 24.0, 20.062402647738878 ], "wc_review_avg": [ 410.5, 241.42648984732392 ], "wc_reply_reviewers_avg": [ 94.25, 61.26326386995717 ], "wc_reply_authors_avg": [ 441.0, 163.61234672236688 ], "reply_reviewers_avg": [ 1.0, 0.7071067811865476 ], "reply_authors_avg": [ 2.0, 0.7071067811865476 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.9045340337332909, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:hBmZs37tiWMJ:scholar.google.com/&scioq=xMLP:+Revolutionizing+Private+Inference+with+Exclusive+Square+Activation&hl=en&as_sdt=0,5", "gs_version_total": 3, "aff_unique_index": "0;0", "aff_unique_norm": "State University of New York at Buffalo", "aff_unique_dep": "", "aff_unique_url": "https://www.buffalo.edu", "aff_unique_abbr": "SUNY Buffalo", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Buffalo", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "id": "9rzEPbs4Wg", "title": "Improving Generalization and Safety of Deep Neural Networks with Masked Anchoring", "track": "main", "status": "Reject", "tldr": "", "abstract": "Anchoring is a recent architecture and task-agnostic technique that can produce state-of-the-art epistemic uncertainty estimates, and improve extrapolation capabilities. 
However, the differences between anchored models and non-anchored variants is not well studied -- as there is little insight into the kinds of functions anchoring induces and how they behave under distribution shifts. In this paper, we analyze and improve anchoring as a training protocol for deep neural networks, evaluating them on important tasks of out of distribution generalization, task adaptation, anomaly detection and calibration. We pinpoint the impact of anchoring on generalization as being inversely related to the sensitivity of the model to the distribution of residuals. We further improve this sensitivity using a new technique called Random Anchor Masking (RAM) that significantly improves the quality of anchored models. We build evidence for the superiority of RAM-training using a range of benchmarks of varying size, using neural networks of varying complexity and scale.", "keywords": "Anomaly Detection;OOD Generalization;ML Safety;Anchoring;Deep Neural Networks", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/ba233f79a4e1de1dd6a5cc117e4384bbbffd0376.pdf", "author": "Vivek Narayanaswamy;Kowshik Thopalli;Rushil Anirudh;Jayaraman J. Thiagarajan", "authorids": "~Vivek_Narayanaswamy1;~Kowshik_Thopalli1;~Rushil_Anirudh1;~Jayaraman_J._Thiagarajan3", "gender": "M;M;M;M", "homepage": ";https://kowshikthopalli.github.io/;https://rushila.com/;https://jjthiagarajan.com", "dblp": "230/4531;224/0052;136/5391;16/7803", "google_scholar": "7h2Ui6YAAAAJ;https://scholar.google.com/citations?hl=en;WkoIlpQAAAAJ;cMz65_oAAAAJ", "orcid": ";;0000-0002-4186-3502;", "linkedin": ";;rushilanirudh/;", "or_profile": "~Vivek_Narayanaswamy1;~Kowshik_Thopalli1;~Rushil_Anirudh1;~Jayaraman_J._Thiagarajan2", "aff": "Lawrence Livermore National Labs;Lawrence Livermore National Labs;Amazon;Lawrence Livermore National Labs", "aff_domain": "llnl.gov;llnl.gov;amazon.com;llnl.gov", "position": "Researcher;Postdoc;Applied Scientist;Computer Scientist", "bibtex": "@misc{\nnarayanaswamy2024improving,\ntitle={Improving Generalization and Safety of Deep Neural Networks with Masked Anchoring},\nauthor={Vivek Narayanaswamy and Kowshik Thopalli and Rushil Anirudh and Jayaraman J. 
Thiagarajan},\nyear={2024},\nurl={https://openreview.net/forum?id=9rzEPbs4Wg}\n}", "github": "", "project": "", "reviewers": "auhR;8fzY;GTiz;rVkq;BVnY;LRUp", "site": "https://openreview.net/forum?id=9rzEPbs4Wg", "pdf_size": 794700, "rating": "5;6;6;6;6;8", "confidence": "4;3;4;3;3;3", "soundness": "2;3;3;3;3;4", "contribution": "2;3;3;3;3;4", "presentation": "2;3;3;3;3;3", "wc_summary": "73;33;94;102;59;355", "wc_strengths": "81;31;94;71;37;239", "wc_weaknesses": "323;36;92;207;81;367", "wc_questions": "44;8;5;5;66;238", "wc_review": "521;108;285;385;243;1199", "wc_reply_reviewers": "404;0;23;120;75;58", "wc_reply_authors": "792;575;740;1285;783;714", "reply_reviewers": "1;0;1;1;2;1", "reply_authors": "2;2;2;3;2;2", "rating_avg": [ 6.166666666666667, 0.8975274678557507 ], "confidence_avg": [ 3.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 3.0, 0.5773502691896257 ], "contribution_avg": [ 3.0, 0.5773502691896257 ], "presentation_avg": [ 2.8333333333333335, 0.3726779962499649 ], "wc_summary_avg": [ 119.33333333333333, 107.79713457333744 ], "wc_strengths_avg": [ 92.16666666666667, 69.42722008613687 ], "wc_weaknesses_avg": [ 184.33333333333334, 125.3763224146498 ], "wc_questions_avg": [ 61.0, 82.38527376499597 ], "wc_review_avg": [ 456.8333333333333, 355.2053005735635 ], "wc_reply_reviewers_avg": [ 113.33333333333333, 135.44207453947075 ], "wc_reply_authors_avg": [ 814.8333333333334, 222.06561843042903 ], "reply_reviewers_avg": [ 1.0, 0.5773502691896257 ], "reply_authors_avg": [ 2.1666666666666665, 0.3726779962499649 ], "replies_avg": [ 29, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.5252257314388904, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:Umc_zKTaF2kJ:scholar.google.com/&scioq=Improving+Generalization+and+Safety+of+Deep+Neural+Networks+with+Masked+Anchoring&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;1;0", "aff_unique_norm": "Lawrence Livermore National Laboratory;Amazon", "aff_unique_dep": ";Amazon.com, Inc.", "aff_unique_url": "https://www.llnl.gov;https://www.amazon.com", "aff_unique_abbr": "LLNL;Amazon", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "id": "9tNhV5kTSc", "title": "How do agents invest strategically under persistent improvement?", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "This paper studies algorithmic decision-making under human's strategic behavior, where a decision-maker uses an algorithm to make decisions about human agents, and the latter with information about the algorithm may exert effort strategically and improve to receive favorable decisions. Unlike prior works that assume agents benefit from their efforts immediately, we consider realistic scenarios where the impacts of these efforts are persistent and agents benefit from efforts by making improvements gradually. However, the agent's utility also diminishes as time goes on. We first develop a dynamic model to characterize persistent improvements and based on this construct a Stackelberg game to model the interplay between agents and the decision-maker. We analytically characterize the equilibrium strategies and identify conditions under which agents have incentives to improve. With the dynamics, we then study how the decision-maker can design an optimal policy to incentivize the largest improvements inside the agent population. 
We also extend the model to settings where (1) agents may be dishonest and game the algorithm into making favorable but erroneous decisions; (2) honest efforts are forgettable and not sufficient to guarantee persistent improvements. With the extended models, we further examine conditions under which agents prefer honest efforts over dishonest behavior and the impacts of forgettable efforts.", "keywords": "Strategic Classification;Stackelberg Game;Population Dynamics", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/ee27e133776715e834b3a5e5aab05b904ae56f69.zip", "author": "Tian Xie;Xuwei Tan;Xueru Zhang", "authorids": "~Tian_Xie4;~Xuwei_Tan1;~Xueru_Zhang2", "gender": "M;M;F", "homepage": "https://www.linkedin.com/in/tianxie1999/;https://engineering.osu.edu/people/tan.1206;https://xueruzhang.github.io/", "dblp": ";308/6151;", "google_scholar": ";IpTmmIYAAAAJ;PNBO_a4AAAAJ", "orcid": ";;", "linkedin": "tianxie1999/;;", "or_profile": "~Tian_Xie4;~Xuwei_Tan1;~Xueru_Zhang2", "aff": "Ohio State University, Columbus;Ohio State University, Columbus;Ohio State University", "aff_domain": "osu.edu;osu.edu;osu.edu", "position": "PhD student;PhD student;Assistant Professor", "bibtex": "@misc{\nxie2024how,\ntitle={How do agents invest strategically under persistent improvement?},\nauthor={Tian Xie and Xuwei Tan and Xueru Zhang},\nyear={2024},\nurl={https://openreview.net/forum?id=9tNhV5kTSc}\n}", "github": "", "project": "", "reviewers": "6GuR;m2xs;gzfu", "site": "https://openreview.net/forum?id=9tNhV5kTSc", "pdf_size": 386779, "rating": "1;5;5", "confidence": "3;5;2", "soundness": "1;3;2", "contribution": "1;2;2", "presentation": "2;3;3", "wc_summary": "208;79;52", "wc_strengths": "50;73;47", "wc_weaknesses": "341;206;94", "wc_questions": "52;84;25", "wc_review": "651;442;218", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 3.6666666666666665, 1.8856180831641267 ], "confidence_avg": [ 3.3333333333333335, 1.247219128924647 ], "soundness_avg": [ 2.0, 0.816496580927726 ], "contribution_avg": [ 1.6666666666666667, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 113.0, 68.07348970047003 ], "wc_strengths_avg": [ 56.666666666666664, 11.61416759345623 ], "wc_weaknesses_avg": [ 213.66666666666666, 100.98294685517727 ], "wc_questions_avg": [ 53.666666666666664, 24.115462996914562 ], "wc_review_avg": [ 437.0, 176.80686261190957 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 3, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.18898223650461363, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:u8ubvAys_KkJ:scholar.google.com/&scioq=How+do+agents+invest+strategically+under+persistent+improvement%3F&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;0", "aff_unique_norm": "Ohio State University", "aff_unique_dep": "", "aff_unique_url": "https://www.osu.edu", "aff_unique_abbr": "OSU", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Columbus;", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "9tQfBNxX16", "title": "Towards efficient deep spiking neural networks construction with spiking activity based pruning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Spiking neural networks (SNNs) 
drawing inspiration from the biological nervous system possess the distinctive advantage of being biologically interpretable and energy-efficient. In recent years, there has been a rise in deep and large-scale SNNs structures that exhibit high performance across various complex datasets. However, within these structures, a significant number of redundant structural units are often present, compelling the need to compress the network models of SNNs to more effectively harness their low-power advantage. Currently, most model compression techniques for SNNs are based on unstructured pruning of individual connections, which requires specific hardware support. Receptive field cells in the biological visual system have influenced a crucial concept in deep learning: convolutional kernels. Hence, we propose a structured pruning approach based on the activity levels of convolutional kernels named Spiking Channel Activity-based (SCA) network pruning framework. Inspired by synaptic plasticity mechanisms, our method dynamically adjusts the network's structure by pruning and regenerating convolutional kernels during training, enhancing the model's adaptation to the current target task. While maintaining model performance, this approach refines the network architecture, ultimately reducing computational load and accelerating the inference process. We conducted experiments on static datasets including CIFAR10, CIFAR100 and DVS-CIFAR10. Experimental results demonstrate that this method incurs only about 2% accuracy loss while retaining 20% of the channels. This indicates that structured dynamic sparse learning methods can better facilitate the application of deep SNNs in low-power and high-efficiency scenarios.", "keywords": "spiking neural networks;pruning;network structure;power consumption", "primary_area": "applications to neuroscience & cognitive science", "supplementary_material": "/attachment/d51c7b629ced13c4a3eaf3b2cf04a3420803818d.zip", "author": "Yaxin Li;Jiangrong Shen;Hongming Xu;Long Chen;Gang Pan;Qiang Zhang;Qi Xu", "authorids": "~Yaxin_Li4;~Jiangrong_Shen1;~Hongming_Xu3;~Long_Chen18;~Gang_Pan1;~Qiang_Zhang13;~Qi_Xu1", "gender": ";F;M;M;;M;M", "homepage": ";;https://xhm1014.github.io/index.html;https://iris.ucl.ac.uk/iris/browse/profile?upi=LCHEI54;;https://faculty.dlut.edu.cn/2017022144/en/index.htm;https://www.researchgate.net/profile/Qi_Xu43", "dblp": "143/0251-3;208/3564;150/7585-2;64/5725-19.html;;72/3527-8;", "google_scholar": ";3XK6COkAAAAJ;nErn9W8AAAAJ;J_v0xb8AAAAJ;;https://scholar.google.de/citations?hl=de;dGEcAuYAAAAJ", "orcid": "0000-0003-0160-8950;;0000-0002-1305-0010;0000-0001-8552-859X;;0000-0003-0609-0337;0000-0001-9245-5544", "linkedin": ";;;;;;", "or_profile": "~Yaxin_Li4;~Jiangrong_Shen1;~Hongming_Xu3;~Long_Chen18;~Gang_Pan1;~Qiang_Zhang13;~Qi_Xu1", "aff": "Dalian University of Technology;Zhejiang University;Dalian University of Technology;Imperial College London;;Dalian University of Technology;School of Computer Science and Technology", "aff_domain": "dlut.edu.cn;zju.edu.cn;dlut.edu.cn;ic.ac.uk;;dlut.edu.cn;dlut.edu.cn", "position": "MS student;Postdoc;Associate Professor;Postdoc;;Full Professor;Associate Professor", "bibtex": "@misc{\nli2024towards,\ntitle={Towards efficient deep spiking neural networks construction with spiking activity based pruning},\nauthor={Yaxin Li and Jiangrong Shen and Hongming Xu and Long Chen and Gang Pan and Qiang Zhang and Qi Xu},\nyear={2024},\nurl={https://openreview.net/forum?id=9tQfBNxX16}\n}", "github": "", "project": "", "reviewers": 
"AYqQ;JMPU;vHij;zKkP", "site": "https://openreview.net/forum?id=9tQfBNxX16", "pdf_size": 886686, "rating": "3;3;5;5", "confidence": "4;4;5;4", "soundness": "2;3;3;2", "contribution": "2;2;2;2", "presentation": "3;3;4;2", "wc_summary": "75;40;83;70", "wc_strengths": "40;17;53;44", "wc_weaknesses": "196;137;183;115", "wc_questions": "37;289;123;86", "wc_review": "348;483;442;315", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 67.0, 16.263455967290593 ], "wc_strengths_avg": [ 38.5, 13.275918047351754 ], "wc_weaknesses_avg": [ 157.75, 33.0104150231408 ], "wc_questions_avg": [ 133.75, 94.68203367059667 ], "wc_review_avg": [ 397.0, 68.09184973254875 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": 0.5773502691896257, "gs_citation": 9, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=8902417123251783381&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 7, "aff_unique_index": "0;1;0;2;0;3", "aff_unique_norm": "Dalian University of Technology;Zhejiang University;Imperial College London;School of Computer Science and Technology", "aff_unique_dep": ";;;Computer Science and Technology", "aff_unique_url": "http://www.dlut.edu.cn/;https://www.zju.edu.cn;https://www.imperial.ac.uk;", "aff_unique_abbr": "DUT;ZJU;ICL;", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;1;0", "aff_country_unique": "China;United Kingdom;" }, { "id": "9ux2cgxw6O", "title": "LOVECon: Text-driven Training-free Long Video Editing with ControlNet", "track": "main", "status": "Reject", "tldr": "", "abstract": "Leveraging pre-trained conditional diffusion models for video editing without further tuning has gained increasing attention due to its promise in film production, advertising, etc. Yet, seminal works in this line fall short in generation length, temporal coherence, or fidelity to the source video. This paper aims to bridge the gap, establishing a simple and effective baseline for training-free diffusion model-based long video editing. As suggested by prior arts, we build the pipeline upon ControlNet, which excels at various image editing tasks based on text prompts. To break down the length constraints caused by limited computational memory, we split the long video into consecutive windows and develop a novel cross-window attention mechanism to ensure the consistency of global style and maximize the smoothness among windows. To achieve more accurate control, we extract the information from the source video via DDIM inversion and integrate the outcomes into the latent feature maps of the generations. We also incorporate a video frame interpolation model to mitigate frame-level flickering issues further. Extensive empirical studies verify the superior efficacy of our method over competing baselines across scenarios, including replacing attributes of foreground objects, style transfer, and background replacement. 
In particular, our method manages to edit videos with up to 128 frames according to user requirements.", "keywords": "Video editing;Diffusion models;Training-free", "primary_area": "generative models", "supplementary_material": "/attachment/dc950b2a21404113366bc65150acc9194a6c097c.zip", "author": "Zhenyi Liao;Zhijie Deng", "authorids": "~Zhenyi_Liao1;~Zhijie_Deng1", "gender": "M;M", "homepage": "https://github.com/L-Justice1998;https://thudzj.github.io/", "dblp": "359/1044;209/4959", "google_scholar": ";J3dR0sUAAAAJ", "orcid": ";0000-0002-0932-1631", "linkedin": ";", "or_profile": "~Zhenyi_Liao1;~Zhijie_Deng1", "aff": "Shanghai Jiaotong University;Shanghai Jiaotong University", "aff_domain": "sjtu.edu.cn;sjtu.edu.cn", "position": "MS student;Assistant Professor", "bibtex": "@misc{\nliao2024lovecon,\ntitle={{LOVEC}on: Text-driven Training-free Long Video Editing with ControlNet},\nauthor={Zhenyi Liao and Zhijie Deng},\nyear={2024},\nurl={https://openreview.net/forum?id=9ux2cgxw6O}\n}", "github": "", "project": "", "reviewers": "WhZ8;59Nz;EDK1", "site": "https://openreview.net/forum?id=9ux2cgxw6O", "pdf_size": 20544191, "rating": "5;5;5", "confidence": "5;4;4", "soundness": "3;2;2", "contribution": "2;2;2", "presentation": "3;3;3", "wc_summary": "64;80;92", "wc_strengths": "55;2;67", "wc_weaknesses": "144;89;241", "wc_questions": "69;2;1", "wc_review": "332;173;401", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "533;340;433", "reply_reviewers": "0;0;0", "reply_authors": "2;2;2", "rating_avg": [ 5.0, 0.0 ], "confidence_avg": [ 4.333333333333333, 0.4714045207910317 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 78.66666666666667, 11.469767022723502 ], "wc_strengths_avg": [ 41.333333333333336, 28.241026106633512 ], "wc_weaknesses_avg": [ 158.0, 62.838417124134075 ], "wc_questions_avg": [ 24.0, 31.822423959633664 ], "wc_review_avg": [ 302.0, 95.46727187890099 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 435.3333333333333, 78.80919292118712 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 2.0, 0.0 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 7, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=9923968201600933195&as_sdt=400005&sciodt=0,14&hl=en", "gs_version_total": 3, "aff_unique_index": "0;0", "aff_unique_norm": "Shanghai Jiao Tong University", "aff_unique_dep": "", "aff_unique_url": "https://www.sjtu.edu.cn", "aff_unique_abbr": "SJTU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "China" }, { "id": "9v5uZPWZoV", "title": "Not Just Pretty Pictures: Toward Interventional Data Augmentation Using Text-to-Image Generators", "track": "main", "status": "Reject", "tldr": "", "abstract": "Neural image classifiers are known to undergo severe performance degradation when exposed to inputs that exhibit covariate shift with respect to the training distribution. A general interventional data augmentation (IDA) mechanism that simulates arbitrary interventions over spurious variables has often been conjectured as a theoretical solution to this problem and approximated to varying degrees of success. In this work, we study how well modern Text-to-Image (T2I) generators and associated image editing techniques can solve the problem of IDA. 
We experiment across a diverse collection of benchmarks in domain generalization, ablating across key dimensions of T2I generation, including interventional prompts, conditioning mechanisms, and post-hoc filtering, showing that it substantially outperforms previously state-of-the-art image augmentation techniques independently of how each dimension is configured. We discuss the comparative advantages of using T2I for image editing versus synthesis, also finding that a simple retrieval baseline presents a surprisingly effective alternative, which raises interesting questions about how generative models should be evaluated in the context of domain generalization.", "keywords": "Text-to-Image Generators;Diffusion Models;Synthetic Data;Distribution Shift;Domain Generalization", "primary_area": "generative models", "supplementary_material": "", "author": "Jianhao Yuan;Francesco Pinto;Adam Davies;Philip Torr", "authorids": "~Jianhao_Yuan2;~Francesco_Pinto1;~Adam_Davies2;~Philip_Torr1", "gender": "M;Non-Binary;;M", "homepage": ";https://ahdavies6.github.io/;http://www.robots.ox.ac.uk/~tvg/;https://yuanjianhao508.github.io/", "dblp": "281/7477;;;", "google_scholar": "rqAdo2MAAAAJ;vqkOH7gAAAAJ;;BUJPCegAAAAJ", "orcid": ";0000-0002-0610-2732;;", "linkedin": "francesco-pinto-42a389b1?lipi=urn%3Ali%3Apage%3Ad_flagship3_profile_view_base_contact_details%3BishkY8oUQ8OTPPeV0SSCdw%3D%3D;adamhdavies/;;", "or_profile": "~Francesco_Pinto1;~Adam_Davies2;~Philip_Torr1;~JIANHAO_YUAN1", "aff": "University of Oxford;University of Illinois, Urbana Champaign;University of Oxford;University of Oxford", "aff_domain": "ox.ac.uk;illinois.edu;ox.ac.uk;robots.ox.ac.uk", "position": "PhD student;PhD student;Full Professor;PhD student", "bibtex": "@misc{\nyuan2024not,\ntitle={Not Just Pretty Pictures: Toward Interventional Data Augmentation Using Text-to-Image Generators},\nauthor={Jianhao Yuan and Francesco Pinto and Adam Davies and Philip Torr},\nyear={2024},\nurl={https://openreview.net/forum?id=9v5uZPWZoV}\n}", "github": "", "project": "", "reviewers": "3cd6;MWyF;nrcC;bsQg", "site": "https://openreview.net/forum?id=9v5uZPWZoV", "pdf_size": 49054750, "rating": "5;5;6;6", "confidence": "4;4;5;4", "soundness": "3;3;2;2", "contribution": "2;2;3;2", "presentation": "3;3;3;3", "wc_summary": "218;39;92;118", "wc_strengths": "59;17;94;37", "wc_weaknesses": "146;309;13;11", "wc_questions": "10;82;12;344", "wc_review": "433;447;211;510", "wc_reply_reviewers": "66;71;0;400", "wc_reply_authors": "1186;1173;446;1490", "reply_reviewers": "1;1;0;1", "reply_authors": "2;4;2;4", "rating_avg": [ 5.5, 0.5 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 116.75, 65.0206697904597 ], "wc_strengths_avg": [ 51.75, 28.560243346302215 ], "wc_weaknesses_avg": [ 119.75, 122.19528427889514 ], "wc_questions_avg": [ 112.0, 137.04743704279917 ], "wc_review_avg": [ 400.25, 113.04727993189398 ], "wc_reply_reviewers_avg": [ 134.25, 155.96854650858293 ], "wc_reply_authors_avg": [ 1073.75, 383.9872230947275 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 3.0, 1.0 ], "replies_avg": [ 23, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.5773502691896257, "gs_citation": 8, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=4464747621104770790&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 7, "aff_unique_index": "0;1;0;0", "aff_unique_norm": "University of 
Oxford;University of Illinois Urbana-Champaign", "aff_unique_dep": ";", "aff_unique_url": "https://www.ox.ac.uk;https://illinois.edu", "aff_unique_abbr": "Oxford;UIUC", "aff_campus_unique_index": "1", "aff_campus_unique": ";Urbana-Champaign", "aff_country_unique_index": "0;1;0;0", "aff_country_unique": "United Kingdom;United States" }, { "id": "9vZ8UjP2Mz", "title": "Exploring the Generalization Capabilities of AID-based Bi-level Optimization", "track": "main", "status": "Reject", "tldr": "", "abstract": "Bi-level optimization has achieved considerable success in contemporary machine learning applications, especially for given proper hyperparameters. However, due to the two-level optimization structure, commonly, researchers focus on two types of bi-level optimization methods: approximate implicit differentiation (AID)-based and iterative differentiation (ITD)-based approaches. ITD-based methods can be readily transformed into single-level optimization problems, facilitating the study of their generalization capabilities. In contrast, AID-based methods cannot be easily transformed similarly but must stay in the two-level structure, leaving their generalization properties enigmatic. In this paper, although the outer-level function is nonconvex, we ascertain the uniform stability of AID-based methods, which achieves similar results to a single-level nonconvex problem. We conduct a convergence analysis for a carefully chosen step size to maintain stability. Combining the convergence and stability results, we give the generalization ability of AID-based bi-level optimization methods. Furthermore, we carry out an ablation study of the parameters and assess the performance of these methods on real-world tasks. Our experimental results corroborate the theoretical findings, demonstrating the effectiveness and potential applications of these methods.", "keywords": "Generalization; Bi-level Optimization", "primary_area": "learning theory", "supplementary_material": "/attachment/6fdfb91e52c0d916612146d0aeb4faa8622af831.pdf", "author": "Congliang Chen;Li Shen;zhiqiang xu;Wei Liu;Zhi-Quan Luo;Peilin Zhao", "authorids": "~Congliang_Chen1;~Li_Shen1;~zhiqiang_xu1;~Wei_Liu3;~Zhi-Quan_Luo1;~Peilin_Zhao2", "gender": "M;M;M;M;M;", "homepage": ";https://sites.google.com/site/mathshenli/home;https://scholar.google.com/citations?user=0R20iBMAAAAJ&hl=en;https://sites.google.com/view/cuweiliu;;", "dblp": "205/7138;91/3680-8;72/51-3.html;49/3283-5;;84/8411", "google_scholar": "O1P1-EAAAAAJ;yVhgENIAAAAJ;;AjxoEpIAAAAJ;dW3gcXoAAAAJ;https://scholar.google.com.hk/citations?user=HPeX_YcAAAAJ", "orcid": ";;0000-0002-5693-8933;0000-0002-3865-8145;;0000-0001-8543-3953", "linkedin": ";;;;;", "or_profile": "~Congliang_Chen1;~Li_Shen1;~zhiqiang_xu1;~Wei_Liu3;~Zhi-Quan_Luo1;~Peilin_Zhao2", "aff": "The Chinese University of Hong Kong(Shenzhen);JD Explore Academy;Mohamed bin Zayed University of Artificial Intelligence;Tencent;The Chinese University of Hong Kong, Shenzhen;Tencent", "aff_domain": "cuhk.edu.cn;jd.com;mbzuai.ac.ae;tencent.com;cuhk.edu.cn;tencent.com", "position": "PhD student;Researcher;Assistant Professor;Distinguished Scientist;Full Professor;Researcher", "bibtex": "@misc{\nchen2024exploring,\ntitle={Exploring the Generalization Capabilities of {AID}-based Bi-level Optimization},\nauthor={Congliang Chen and Li Shen and zhiqiang xu and Wei Liu and Zhi-Quan Luo and Peilin Zhao},\nyear={2024},\nurl={https://openreview.net/forum?id=9vZ8UjP2Mz}\n}", "github": "", "project": "", "reviewers": "FTaq;R6J2;JTQs;CjiH", 
"site": "https://openreview.net/forum?id=9vZ8UjP2Mz", "pdf_size": 1156955, "rating": "3;3;6;8", "confidence": "3;3;3;3", "soundness": "2;2;3;3", "contribution": "3;2;3;3", "presentation": "3;2;3;3", "wc_summary": "159;80;35;98", "wc_strengths": "133;48;28;101", "wc_weaknesses": "724;149;109;135", "wc_questions": "6;421;109;71", "wc_review": "1022;698;281;405", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "1148;804;203;600", "reply_reviewers": "0;0;0;0", "reply_authors": "2;2;1;1", "rating_avg": [ 5.0, 2.1213203435596424 ], "confidence_avg": [ 3.0, 0.0 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 93.0, 44.48033273256845 ], "wc_strengths_avg": [ 77.5, 41.692325432865935 ], "wc_weaknesses_avg": [ 279.25, 257.17734639738393 ], "wc_questions_avg": [ 151.75, 159.75508599102565 ], "wc_review_avg": [ 601.5, 286.12278832696984 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 688.75, 342.0609412078497 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:-O-IdThMmvMJ:scholar.google.com/&scioq=Exploring+the+Generalization+Capabilities+of+AID-based+Bi-level+Optimization&hl=en&as_sdt=0,33", "gs_version_total": 3, "aff_unique_index": "0;1;2;3;0;3", "aff_unique_norm": "Chinese University of Hong Kong;JD;Mohamed bin Zayed University of Artificial Intelligence;Tencent", "aff_unique_dep": ";JD Explore Academy;;Tencent Holdings Limited", "aff_unique_url": "https://www.cuhk.edu.cn;;https://mbzuai.ac.ae;https://www.tencent.com", "aff_unique_abbr": "CUHK;;MBZUAI;Tencent", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Shenzhen;", "aff_country_unique_index": "0;2;0;0;0", "aff_country_unique": "China;;United Arab Emirates" }, { "id": "9vkgAaCI3F", "title": "Balancing Stability and Plasticity in Continual Learning: the readout-decomposition of activation change (RDAC) framework", "track": "main", "status": "Reject", "tldr": "", "abstract": "Continual learning (CL) algorithms strive to equip neural networks with the ability to acquire new knowledge while preserving prior information. However, the stability-plasticity trade-off remains a central challenge in CL. This paper introduces a framework that dissects this trade-off, offering valuable insights into CL algorithms.\nThe framework first addresses the stability-plasticity dilemma and its relation to catastrophic forgetting. It presents the Readout-Decomposition of Activation Change (RDAC) framework that relates learning-induced activation changes in the range of prior readouts to the degree of stability, and changes in the null space to the degree of plasticity. \nIn deep non-linear networks tackling split-CIFAR-110 tasks, the framework was used to explain the stability-plasticity trade-offs of the popular regularization algorithms Synaptic intelligence (SI), Elastic-weight consolidation (EWC), and learning without Forgetting (LwF) and replay based algorithms Gradient episodic memory (GEM), and data replay. GEM and data replay excelled in preserving both stability and plasticity, while SI, EWC, and LwF traded off plasticity for stability. The inability of the regularization algorithms to maintain plasticity was linked to them restricting the change of activations in the null space of the prior readout. 
For one-hidden-layer linear neural networks, we additionally derived a gradient decomposition algorithm to restrict activation change only in the range of the prior readouts, to maintain high stability while not further sacrificing plasticity. \nResults demonstrate that the algorithm maintains stability without significant plasticity loss.\nThe RDAC framework not only informs the behavior of existing CL algorithms but also paves the way for novel CL approaches. Finally, it sheds light on the connection between learning-induced activation/representation changes and the stability-plasticity dilemma, also offering insights into representational drift in biological systems.", "keywords": "continual learning;stability-plasticity trade-off;representational drift;task-incremental learning;readout misalignment;interpretability", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "/attachment/56cf2b801fb4c69f3519ab8aa6637ac9c2dffced.zip", "author": "Daniel Anthes;Sushrut Thorat;Peter K\u00f6nig;Tim C Kietzmann", "authorids": "~Daniel_Anthes1;~Sushrut_Thorat1;~Peter_K\u00f6nig1;~Tim_C_Kietzmann1", "gender": ";M;M;M", "homepage": ";https://sushrutthorat.com/;https://www.ikw.uni-osnabrueck.de/en/research_groups/neurobiopsychology.html;https://www.kietzmannlab.org", "dblp": ";169/0786;;", "google_scholar": "YPdEhboAAAAJ;https://scholar.google.it/citations?user=MPFzJQgAAAAJ;Ieubd0EAAAAJ;JXcWFkgAAAAJ", "orcid": ";0000-0003-2276-5621;0000-0003-3654-5267;0000-0001-8076-6062", "linkedin": ";;;", "or_profile": "~Daniel_Anthes1;~Sushrut_Thorat1;~Peter_K\u00f6nig1;~Tim_C_Kietzmann1", "aff": "University of Osnabr\u00fcck;University of Osnabr\u00fcck;Universit\u00e4t Osnabr\u00fcck;Universit\u00e4t Osnabr\u00fcck", "aff_domain": "uos.de;uos.de;uni-osnabrueck.de;uni-osnabrueck.de", "position": "PhD student;Postdoc;Full Professor;Full Professor", "bibtex": "@misc{\nanthes2024balancing,\ntitle={Balancing Stability and Plasticity in Continual Learning: the readout-decomposition of activation change ({RDAC}) framework},\nauthor={Daniel Anthes and Sushrut Thorat and Peter K{\\\"o}nig and Tim C Kietzmann},\nyear={2024},\nurl={https://openreview.net/forum?id=9vkgAaCI3F}\n}", "github": "", "project": "", "reviewers": "gbcF;RvDh;a3Rp;djfe", "site": "https://openreview.net/forum?id=9vkgAaCI3F", "pdf_size": 1329158, "rating": "5;5;5;6", "confidence": "5;5;2;1", "soundness": "2;2;3;3", "contribution": "2;3;2;3", "presentation": "3;2;3;3", "wc_summary": "134;176;69;71", "wc_strengths": "81;79;59;83", "wc_weaknesses": "54;132;324;31", "wc_questions": "104;262;50;4", "wc_review": "373;649;502;189", "wc_reply_reviewers": "0;44;0;0", "wc_reply_authors": "329;577;523;95", "reply_reviewers": "0;1;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 5.25, 0.4330127018922193 ], "confidence_avg": [ 3.25, 1.7853571071357126 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 112.5, 45.0249930594109 ], "wc_strengths_avg": [ 75.5, 9.630680142129112 ], "wc_weaknesses_avg": [ 135.25, 115.22450911156011 ], "wc_questions_avg": [ 105.0, 97.30878685915265 ], "wc_review_avg": [ 428.25, 169.16171996051588 ], "wc_reply_reviewers_avg": [ 11.0, 19.05255888325765 ], "wc_reply_authors_avg": [ 381.0, 189.12958520548815 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.7276068751089989, "gs_citation": 
0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:db2DrzxzUXAJ:scholar.google.com/&scioq=Balancing+Stability+and+Plasticity+in+Continual+Learning:+the+readout-decomposition+of+activation+change+(RDAC)+framework&hl=en&as_sdt=0,33", "gs_version_total": 2, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "University of Osnabr\u00fcck", "aff_unique_dep": "", "aff_unique_url": "https://www.uni-osnabrueck.de", "aff_unique_abbr": "UOS", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "Germany" }, { "title": "Entropy is not Enough for Test-Time Adaptation: From the Perspective of Disentangled Factors", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19280", "id": "9w3iw8wDuE", "author_site": "Jonghyun Lee, Dahuin Jung, Saehyung Lee, Junsung Park, Juhyeon Shin, Uiwon Hwang, Sungroh Yoon", "tldr": "", "abstract": "Test-time adaptation (TTA) fine-tunes pre-trained deep neural networks for unseen test data. The primary challenge of TTA is limited access to the entire test dataset during online updates, causing error accumulation. To mitigate it, TTA methods have utilized the model output's entropy as a confidence metric that aims to determine which samples have a lower likelihood of causing error. Through experimental studies, however, we observed the unreliability of entropy as a confidence metric for TTA under biased scenarios and theoretically revealed that it stems from the neglect of the influence of latent disentangled factors of data on predictions. Building upon these findings, we introduce a novel TTA method named Destroy Your Object (DeYO), which leverages a newly proposed confidence metric named Pseudo-Label Probability Difference (PLPD). PLPD quantifies the influence of the shape of an object on prediction by measuring the difference between predictions before and after applying an object-destructive transformation. DeYO consists of sample selection and sample weighting, which employ entropy and PLPD concurrently. For robust adaptation, DeYO prioritizes samples that dominantly incorporate shape information when making predictions. Our extensive experiments demonstrate the consistent superiority of DeYO over baseline methods across various scenarios, including biased and wild. 
Project page is publicly available at https://whitesnowdrop.github.io/DeYO/.", "keywords": "Test-time adaptation;Robustness", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "", "author": "Jonghyun Lee;Dahuin Jung;Saehyung Lee;Junsung Park;Juhyeon Shin;Uiwon Hwang;Sungroh Yoon", "authorids": "~Jonghyun_Lee1;~Dahuin_Jung2;~Saehyung_Lee1;~Junsung_Park1;~Juhyeon_Shin1;~Uiwon_Hwang1;~Sungroh_Yoon1", "gender": "M;F;M;M;F;M;", "homepage": ";https://hai.ssu.ac.kr/;;http://data.snu.ac.kr/;https://github.com/newjh12;https://sites.google.com/view/uiwon-hwang;http://ailab.snu.ac.kr", "dblp": ";224/0158;260/0442;;;207/8512;99/1474", "google_scholar": ";https://scholar.google.co.kr/citations?user=wleS-UQAAAAJ;nS24h74AAAAJ;;;https://scholar.google.co.kr/citations?user=CJ8-pGIAAAAJ;Bphl_fIAAAAJ", "orcid": ";;;;;0000-0001-5054-2236;0000-0002-2367-197X", "linkedin": "jonghyun-lee-0886061a3/;;;;;uiwon-hwang/;", "or_profile": "~Jonghyun_Lee1;~Dahuin_Jung2;~Saehyung_Lee1;~Junsung_Park1;~Juhyeon_Shin1;~Uiwon_Hwang1;~Sungroh_Yoon1", "aff": "Seoul National University;Seoul National University;Adobe Systems;Seoul National University;Seoul National University;Yonsei University - Mirae Campus;Seoul National University", "aff_domain": "snu.ac.kr;snu.ac.kr;adobe.com;snu.ac.kr;snu.ac.kr;yonsei.ac.kr;snu.ac.kr", "position": "PhD student;PhD student;Intern;PhD student;PhD student;Assistant Professor;Full Professor", "bibtex": "@inproceedings{\nlee2024entropy,\ntitle={Entropy is not Enough for Test-Time Adaptation: From the Perspective of Disentangled Factors},\nauthor={Jonghyun Lee and Dahuin Jung and Saehyung Lee and Junsung Park and Juhyeon Shin and Uiwon Hwang and Sungroh Yoon},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=9w3iw8wDuE}\n}", "github": "", "project": "", "reviewers": "7TAy;xMUg;NrgV;M673", "pdf_size": 1515837, "rating": "6;6;8;8", "confidence": "3;5;5;4", "soundness": "3;3;2;4", "contribution": "3;3;2;3", "presentation": "3;3;2;3", "wc_summary": "55;38;100;71", "wc_strengths": "46;70;16;57", "wc_weaknesses": "107;44;494;74", "wc_questions": "86;13;10;4", "wc_review": "294;165;620;206", "wc_reply_reviewers": "14;5;274;0", "wc_reply_authors": "1452;612;2861;1179", "reply_reviewers": "1;1;2;0", "reply_authors": "4;3;6;4", "rating_avg": [ 7.0, 1.0 ], "confidence_avg": [ 4.25, 0.82915619758885 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 66.0, 22.83637449333847 ], "wc_strengths_avg": [ 47.25, 19.942103700462496 ], "wc_weaknesses_avg": [ 179.75, 182.79547997694036 ], "wc_questions_avg": [ 28.25, 33.49906715119094 ], "wc_review_avg": [ 321.25, 178.66921251295648 ], "wc_reply_reviewers_avg": [ 73.25, 116.01158347337562 ], "wc_reply_authors_avg": [ 1526.0, 828.1766115992409 ], "reply_reviewers_avg": [ 1.0, 0.7071067811865476 ], "reply_authors_avg": [ 4.25, 1.0897247358851685 ], "replies_avg": [ 28, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": 0.30151134457776363, "gs_citation": 38, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=4357779222588905269&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=9w3iw8wDuE", "pdf": "https://openreview.net/pdf?id=9w3iw8wDuE", "email": "snu.ac.kr;snu.ac.kr;adobe.com;snu.ac.kr;snu.ac.kr;yonsei.ac.kr;snu.ac.kr", "author_num": 7,
"aff_unique_index": "0;0;1;0;0;2;0", "aff_unique_norm": "Seoul National University;Adobe;Yonsei University", "aff_unique_dep": ";Adobe Systems Incorporated;", "aff_unique_url": "https://www.snu.ac.kr;https://www.adobe.com;https://www.yonsei.ac.kr", "aff_unique_abbr": "SNU;Adobe;Yonsei", "aff_campus_unique_index": "1", "aff_campus_unique": ";Mirae", "aff_country_unique_index": "0;0;1;0;0;0;0", "aff_country_unique": "South Korea;United States" }, { "id": "9wSWiavGwU", "title": "SwapTransformer: Highway Overtaking Tactical Planner Model via Imitation Learning on OSHA Dataset", "track": "main", "status": "Reject", "tldr": "", "abstract": "This paper investigates the high-level decision-making problem in highway scenarios regarding lane changing and over-taking other slower vehicles. In particular, this paper aims to improve the Travel Assist feature for automatic overtaking and lane changes on highways. About 9 million samples including lane images and other dynamic objects are collected in simulation. This data; Overtaking on Simulated HighwAys (OSHA) dataset is released to tackle this challenge. To solve this problem, an architecture called SwapTransformer is designed and implemented as an imitation learning approach on the OSHA dataset. Moreover, auxiliary tasks such as future points and car distance network predictions are proposed to aid the model in better understanding the surrounding environment. The performance of the proposed solution is compared with a multi-layer perceptron (MLP) and multi-head self-attention networks as baselines in a simulation environment. We also demonstrate the performance of the model with and without auxiliary tasks. All models are evaluated based on different metrics such as time to finish each lap, number of overtakes, and speed difference with speed limit. 
The evaluation shows that the SwapTransformer model outperforms other models in different traffic densities in the inference phase.", "keywords": "Autonomous driving;Imitation learning;highway;overtaking;machine learning;transformer", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/22416a94694b96b41ac47558d98e24683a8a1bcc.zip", "author": "Alireza Shamsoshoara;Safin B Salih;Pedram Aghazadeh", "authorids": "~Alireza_Shamsoshoara1;safin.salih@vw.com;pedram.aghazadeh@vw.com", "gender": "M;;", "homepage": "https://alirezashamsoshoara.github.io/;;", "dblp": ";;", "google_scholar": "1IDrN5QAAAAJ;;", "orcid": "0000-0003-4087-8304;;", "linkedin": "alireza-shamsoshoara/;;", "or_profile": "~Alireza_Shamsoshoara1;safin.salih@vw.com;pedram.aghazadeh@vw.com", "aff": ";;", "aff_domain": ";;", "position": ";;", "bibtex": "@misc{\nshamsoshoara2024swaptransformer,\ntitle={SwapTransformer: Highway Overtaking Tactical Planner Model via Imitation Learning on {OSHA} Dataset},\nauthor={Alireza Shamsoshoara and Safin B Salih and Pedram Aghazadeh},\nyear={2024},\nurl={https://openreview.net/forum?id=9wSWiavGwU}\n}", "github": "", "project": "", "reviewers": "kokN;Qxdb;8dui", "site": "https://openreview.net/forum?id=9wSWiavGwU", "pdf_size": 14859760, "rating": "5;5;5", "confidence": "3;3;3", "soundness": "2;2;2", "contribution": "2;2;2", "presentation": "2;2;3", "wc_summary": "185;286;160", "wc_strengths": "32;129;39", "wc_weaknesses": "61;218;295", "wc_questions": "25;72;209", "wc_review": "303;705;703", "wc_reply_reviewers": "10;0;373", "wc_reply_authors": "377;1187;2238", "reply_reviewers": "1;0;2", "reply_authors": "1;2;5", "rating_avg": [ 5.0, 0.0 ], "confidence_avg": [ 3.0, 0.0 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 210.33333333333334, 54.46915538989832 ], "wc_strengths_avg": [ 66.66666666666667, 44.16886786967591 ], "wc_weaknesses_avg": [ 191.33333333333334, 97.37327947417378 ], "wc_questions_avg": [ 102.0, 78.05553578489271 ], "wc_review_avg": [ 570.3333333333334, 189.0349761875358 ], "wc_reply_reviewers_avg": [ 127.66666666666667, 173.52489414746486 ], "wc_reply_authors_avg": [ 1267.3333333333333, 761.8706510221331 ], "reply_reviewers_avg": [ 1.0, 0.816496580927726 ], "reply_authors_avg": [ 2.6666666666666665, 1.699673171197595 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=18112353373146535003&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4 }, { "title": "Provably Efficient CVaR RL in Low-rank MDPs", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19279", "id": "9x6yrFAPnx", "author_site": "Yulai Zhao, Wenhao Zhan, Xiaoyan Hu, Ho-fung Leung, Farzan Farnia, Wen Sun, Jason Lee", "tldr": "", "abstract": "We study risk-sensitive Reinforcement Learning (RL), where we aim to maximize\nthe Conditional Value at Risk (CVaR) with a fixed risk tolerance $\\tau$. \nPrior theoretical work studying risk-sensitive RL focuses on the tabular Markov Decision Processes (MDPs) setting. \nTo extend CVaR RL to settings where state space is large, function approximation must be deployed. \nWe study CVaR RL in low-rank MDPs with nonlinear function approximation. 
Low-rank MDPs assume the underlying transition kernel admits a low-rank decomposition, but unlike prior linear models, low-rank MDPs do not assume the feature or state-action representation is known. \nWe propose a novel Upper Confidence Bound (UCB) bonus-driven algorithm to carefully balance the interplay between exploration, exploitation, and representation learning in CVaR RL. \nWe prove that our algorithm achieves a sample complexity of $\\tilde{O}\\left(\\frac{H^7 A^2 d^4}{\\tau^2 \\epsilon^2}\\right)$ to yield an $\\epsilon$-optimal CVaR, where $H$ is the length of each episode, $A$ is the capacity of action space, and $d$ is the dimension of representations.\nComputational-wise, we design a novel discretized Least-Squares Value Iteration (LSVI) algorithm for the CVaR objective as the planning oracle and show that we can find the near-optimal policy in a polynomial running time with a Maximum Likelihood Estimation oracle. \nTo our knowledge, this is the first provably efficient CVaR RL algorithm in low-rank MDPs.", "keywords": "reinforment learning theory;risk-sensitive reinforment learning;Conditional Value at Risk", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Yulai Zhao;Wenhao Zhan;Xiaoyan Hu;Ho-fung Leung;Farzan Farnia;Wen Sun;Jason D. Lee", "authorids": "~Yulai_Zhao1;~Wenhao_Zhan1;~Xiaoyan_Hu2;~Ho-fung_Leung1;~Farzan_Farnia1;~Wen_Sun1;~Jason_D._Lee1", "gender": "M;M;M;M;M;;M", "homepage": "https://yulaizhao.com/;;https://yannxiaoyanhu.github.io;http://www.cse.cuhk.edu.hk/~lhf/;https://www.cse.cuhk.edu.hk/~farnia/;https://wensun.github.io;https://jasondlee88.github.io/", "dblp": "64/6357-2;275/3558;;l/HofungLeung;132/7757;;88/3262", "google_scholar": "r-mWYj0AAAAJ;;https://scholar.google.com/citations?hl=en;https://scholar.google.com.hk/citations?user=JDErdKcAAAAJ;GYPCqcYAAAAJ;iOLC30YAAAAJ;GR_DsT0AAAAJ", "orcid": "0000-0002-6930-3590;;0000-0002-5766-1059;0000-0003-4914-2934;0000-0002-6049-9232;;", "linkedin": "yulaizhao/;;xiaoyan-hu-9a26661b9/;ho-fung-leung-1a73135/;farzan-farnia-00798335;;", "or_profile": "~Yulai_Zhao1;~Wenhao_Zhan1;~Xiaoyan_Hu2;~Ho-fung_Leung1;~Farzan_Farnia1;~Wen_Sun1;~Jason_D._Lee1", "aff": "Princeton University;Princeton University;The Chinese University of Hong Kong; ;The Chinese University of Hong Kong;Cornell University;Princeton University", "aff_domain": "princeton.edu;princeton.edu;cse.cuhk.edu.hk;outlook.com;cuhk.edu.hk;cornell.edu;princeton.edu", "position": "PhD student;PhD student;PhD student;Independent Researcher;Assistant Professor;Assistant Professor;Assistant Professor", "bibtex": "@inproceedings{\nzhao2024provably,\ntitle={Provably Efficient {CV}aR {RL} in Low-rank {MDP}s},\nauthor={Yulai Zhao and Wenhao Zhan and Xiaoyan Hu and Ho-fung Leung and Farzan Farnia and Wen Sun and Jason D. 
Lee},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=9x6yrFAPnx}\n}", "github": "", "project": "", "reviewers": "hVSJ;yZ3N;i64s;htXD", "pdf_size": 491888, "rating": "6;6;6;6", "confidence": "4;3;3;2", "soundness": "3;3;3;3", "contribution": "2;2;2;3", "presentation": "3;3;3;3", "wc_summary": "69;110;63;81", "wc_strengths": "45;47;93;31", "wc_weaknesses": "301;194;145;20", "wc_questions": "35;25;168;24", "wc_review": "450;376;469;156", "wc_reply_reviewers": "145;47;0;0", "wc_reply_authors": "1188;826;874;476", "reply_reviewers": "1;1;0;0", "reply_authors": "2;2;2;1", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 3.0, 0.7071067811865476 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 80.75, 18.08832496390973 ], "wc_strengths_avg": [ 54.0, 23.345235059857504 ], "wc_weaknesses_avg": [ 165.0, 100.94800641914628 ], "wc_questions_avg": [ 63.0, 60.774172145739676 ], "wc_review_avg": [ 362.75, 124.32090532167146 ], "wc_reply_reviewers_avg": [ 48.0, 59.198817555758666 ], "wc_reply_authors_avg": [ 841.0, 252.46187831036985 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.75, 0.4330127018922193 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 4, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=9310462942782500564&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=9x6yrFAPnx", "pdf": "https://openreview.net/pdf?id=9x6yrFAPnx", "email": "princeton.edu;princeton.edu;cse.cuhk.edu.hk;outlook.com;cuhk.edu.hk;cornell.edu;princeton.edu", "author_num": 7, "aff_unique_index": "0;0;1;1;2;0", "aff_unique_norm": "Princeton University;Chinese University of Hong Kong;Cornell University", "aff_unique_dep": ";;", "aff_unique_url": "https://www.princeton.edu;https://www.cuhk.edu.hk;https://www.cornell.edu", "aff_unique_abbr": "Princeton;CUHK;Cornell", "aff_campus_unique_index": "1;1", "aff_campus_unique": ";Hong Kong SAR", "aff_country_unique_index": "0;0;1;1;0;0", "aff_country_unique": "United States;China" }, { "id": "9yKzVMxlkw", "title": "TiG-BEV: Multi-view BEV 3D Object Detection via Target Inner-Geometry Learning", "track": "main", "status": "Desk Reject", "tldr": "", "abstract": "To achieve accurate multi-view 3D object detection, existing methods propose to benefit camera-based detectors with spatial cues provided by the LiDAR modality, e.g., depth supervision and bird-eye-view (BEV) feature distillation. However, they employ a direct point-to-point mimicry from LiDAR to camera, which suffers from the modality gap between 2D-3D features. In this paper, we propose the Target Inner-Geometry learning scheme to enhance camera-based BEV detectors from both depth and BEV feature by leveraging the LiDAR modality, termed as TiG-BEV. Firstly, we introduce an inner-depth supervision module to learn the low-level relative depth relations in each object. This equips camera-based detectors with a deeper understanding of object-level spatial structures. Secondly, we design an inner-feature BEV distillation module to imitate the high-level semantics of different keypoints within foreground targets. To further alleviate the domain gap between two modalities, we incorporate both inter-channel and inter-keypoint distillation to model feature similarity.
With our target inner-geometry learning, TiG-BEV effectively boosts BEVDepth by +2.3% NDS on nuScenes val set, and achieves leading performance with 61.9% NDS on nuScenes leaderboard.", "keywords": "BEV;3D Object Detection", "primary_area": "applications to robotics, autonomy, planning", "supplementary_material": "/attachment/996fe1e8b83459367b0e6f2f1f7f132aff8d39ae.pdf", "author": "Peixiang Huang;Li Liu;Renrui Zhang;Jiaming Liu;Mingjie Pan;Rui Xu;Xinli Xu;Yongqiang Qin", "authorids": "~Peixiang_Huang1;~Li_Liu19;~Renrui_Zhang1;~Jiaming_Liu2;~Mingjie_Pan1;~Rui_Xu11;~Xinli_Xu1;~Yongqiang_Qin1", "gender": "M;M;M;M;M;M;M;M", "homepage": ";;;https://github.com/liujiaming1996;https://github.com/xray-pku;;;https://github.com/pmj110119", "dblp": "250/5451;;244/1748;;;;65/8354;335/1213", "google_scholar": ";zO5iemAAAAAJ;YlL3xN4AAAAJ;cPki5sUAAAAJ;;https://scholar.google.com.sg/citations?user=lrgPuBUAAAAJ;kBc-zJYAAAAJ;QdUeY3IAAAAJ", "orcid": ";;;0000-0002-6770-4390;;0000-0002-7866-6027;;", "linkedin": ";;;;;;yongqiang-qin/;", "or_profile": "~Peixiang_Huang1;~Li_Liu19;~Renrui_Zhang1;~Jiaming_Liu2;~Rui_Xu11;~Xinli_Xu1;~Yongqiang_Qin1;~Pan_Mingjie1", "aff": "Peking University;Xiaomi;MMLab of CUHK & Shanghai AI Laboratory;Peking University;Peking University;Hong Kong University of Science and Technology;NIO;Peking University", "aff_domain": "pku.edu.cn;xiaomi.com;pjlab.org.cn;pku.edu.cn;pku.edu.cn;hkust.edu;nio.com;pku.edu.cn", "position": "MS student;Researcher;PhD student;PhD student;MS student;PhD student;Researcher;MS student", "bibtex": "@misc{\nhuang2024tigbev,\ntitle={TiG-{BEV}: Multi-view {BEV} 3D Object Detection via Target Inner-Geometry Learning},\nauthor={Peixiang Huang and Li Liu and Renrui Zhang and Jiaming Liu and Mingjie Pan and Rui Xu and Xinli Xu and Yongqiang Qin},\nyear={2024},\nurl={https://openreview.net/forum?id=9yKzVMxlkw}\n}", "github": "", "project": "", "reviewers": "CVGt;oss3;kyMY;CeGw;v25e", "site": "https://openreview.net/forum?id=9yKzVMxlkw", "pdf_size": 11753936, "rating": "3;5;6;6;8", "confidence": "4;4;4;3;4", "soundness": "3;3;2;3;3", "contribution": "2;2;2;2;4", "presentation": "3;3;2;3;3", "wc_summary": "78;44;108;83;85", "wc_strengths": "83;13;65;47;132", "wc_weaknesses": "454;248;132;189;52", "wc_questions": "109;2;75;32;47", "wc_review": "724;307;380;351;316", "wc_reply_reviewers": "0;301;167;0;0", "wc_reply_authors": "1270;1388;1193;538;430", "reply_reviewers": "0;1;1;0;0", "reply_authors": "3;3;2;2;2", "rating_avg": [ 5.6, 1.624807680927192 ], "confidence_avg": [ 3.8, 0.39999999999999997 ], "soundness_avg": [ 2.8, 0.39999999999999997 ], "contribution_avg": [ 2.4, 0.8 ], "presentation_avg": [ 2.8, 0.39999999999999997 ], "wc_summary_avg": [ 79.6, 20.57765778702717 ], "wc_strengths_avg": [ 68.0, 39.486706623875335 ], "wc_weaknesses_avg": [ 215.0, 135.89996320823636 ], "wc_questions_avg": [ 53.0, 36.60054644400818 ], "wc_review_avg": [ 415.6, 156.3746782570631 ], "wc_reply_reviewers_avg": [ 93.6, 122.21718373453055 ], "wc_reply_authors_avg": [ 963.8, 398.11676679084997 ], "reply_reviewers_avg": [ 0.4, 0.48989794855663565 ], "reply_authors_avg": [ 2.4, 0.4898979485566356 ], "replies_avg": [ 23, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": -0.1230914909793327, "gs_citation": 40, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6302894399736069090&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 3, "aff_unique_index": "0;1;2;0;0;3;4;0", "aff_unique_norm": "Peking University;Xiaomi Corporation;Chinese University of Hong Kong;Hong Kong 
University of Science and Technology;NIO", "aff_unique_dep": ";;MMLab;;", "aff_unique_url": "http://www.pku.edu.cn;https://www.xiaomi.com;https://www.cuhk.edu.hk;https://www.ust.hk;", "aff_unique_abbr": "Peking U;Xiaomi;CUHK;HKUST;", "aff_campus_unique_index": "1;1", "aff_campus_unique": ";Hong Kong SAR", "aff_country_unique_index": "0;0;0;0;0;0;0", "aff_country_unique": "China;" }, { "id": "9ydLP7como", "title": "ReLU for Inference Acceleration", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Over the past decade, advancements in neural networks have outpaced human-level performance in a wide range of domains, including but not limited to natural language understanding and image generation. This progress has led to significantly larger networks with hundreds of billions of parameters, creating substantial computational demands. We propose the re-introduction of ReLU activation function to replace gradient-smooth alternatives during inference. We show that this can reduce computational costs while achieving minimal accuracy degradation with the help of specialized knowledge distillation training. The effectiveness of the proposed method is demonstrated by a wide variety of network architectures, covering popular applications such as image classification, object detection, and language modeling. We observed FPS improvement of 2-10% for Convolution based neural networks while observing only 1.8-2.6% accuracy degradation. The different Transformer networks demonstrated accuracy difference of < 1% between proposed ReLU and original GeLU networks with comparable QPS. The improvement in performance is significantly noticeable on AI accelerators like ours, with ReLU based convolution networks showcasing theoretical improvement of 41-74% compared to their SiLU based counterpart.", "keywords": "Deep learning;knowledge distillation;quantization;object detection;tranformer;nlp", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Kinjal Pravinbhai Patel;Ben Goel;Ofer Shai", "authorids": "~Kinjal_Pravinbhai_Patel1;~Ben_Goel1;~Ofer_Shai1", "gender": ";;M", "homepage": ";;", "dblp": ";;12/4686", "google_scholar": ";;", "orcid": ";;", "linkedin": ";benjamin-goel?trk=contact-info;", "or_profile": "~Kinjal_Pravinbhai_Patel1;~Ben_Goel1;~Ofer_Shai1", "aff": ";University of Toronto, University of Toronto;", "aff_domain": ";ece.utoronto.ca;", "position": ";Undergrad student;", "bibtex": "@misc{\npatel2024relu,\ntitle={Re{LU} for Inference Acceleration},\nauthor={Kinjal Pravinbhai Patel and Ben Goel and Ofer Shai},\nyear={2024},\nurl={https://openreview.net/forum?id=9ydLP7como}\n}", "github": "", "project": "", "reviewers": "jbaK;9ug7;RjcT;SAkP", "site": "https://openreview.net/forum?id=9ydLP7como", "pdf_size": 206409, "rating": "3;3;5;5", "confidence": "5;4;4;4", "soundness": "3;2;2;3", "contribution": "2;2;2;2", "presentation": "2;3;2;3", "wc_summary": "42;41;54;66", "wc_strengths": "23;16;23;90", "wc_weaknesses": "89;232;12;106", "wc_questions": "9;14;93;2", "wc_review": "163;303;182;264", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 50.75, 10.18270592720815 ], "wc_strengths_avg": [ 38.0, 30.157917700000443 ], "wc_weaknesses_avg": [ 109.75, 78.96953526518945 ], 
"wc_questions_avg": [ 29.5, 36.908671067921155 ], "wc_review_avg": [ 228.0, 57.58037860243713 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:SD-VPUuxp7kJ:scholar.google.com/&scioq=ReLU+for+Inference+Acceleration&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0", "aff_unique_norm": "University of Toronto", "aff_unique_dep": "", "aff_unique_url": "https://www.utoronto.ca", "aff_unique_abbr": "U of T", "aff_country_unique_index": "0", "aff_country_unique": "Canada" }, { "id": "9zEBK3E9bX", "title": "SPOT: Scalable 3D Pre-training via Occupancy Prediction for Autonomous Driving", "track": "main", "status": "Reject", "tldr": "", "abstract": "Annotating 3D LiDAR point clouds for perception tasks including 3D object detection and LiDAR semantic segmentation is notoriously time-and-energy-consuming. To alleviate the burden from labeling, it is promising to perform large-scale pre-training and fine-tune the pre-trained backbone on different downstream datasets as well as tasks. In this paper, we propose SPOT, namely Scalable Pre-training via Occupancy prediction for learning Transferable 3D representations, and demonstrate its effectiveness on various public datasets with different downstream tasks under the label-efficiency setting. Our contributions are threefold: (1) Occupancy prediction is shown to be promising for learning general representations, which is demonstrated by extensive experiments on plenty of datasets and tasks. (2) SPOT uses beam re-sampling technique for point cloud augmentation and applies class-balancing strategies to overcome the domain gap brought by various LiDAR sensors and annotation strategies in different datasets. (3) Scalable pre-training is observed, that is, the downstream performance across all the experiments gets better with more pre-training data. We believe that our findings can facilitate understanding of LiDAR point clouds and pave the way for future exploration in LiDAR pre-training. 
Codes and models will be released.", "keywords": "3D LiDAR point clouds;3D Pre-training;Object Detection;Semantic Segmentation", "primary_area": "applications to robotics, autonomy, planning", "supplementary_material": "/attachment/322395f5f11bbdb54b6f57a5e463b75b50a8f9b3.zip", "author": "Xiangchao Yan;Runjian Chen;Bo Zhang;Jiakang Yuan;Xinyu Cai;Botian Shi;Wenqi Shao;Junchi Yan;Ping Luo;Yu Qiao", "authorids": "~Xiangchao_Yan1;~Runjian_Chen1;~Bo_Zhang17;~Jiakang_Yuan1;~Xinyu_Cai2;~Botian_Shi1;~Wenqi_Shao2;~Junchi_Yan2;~Ping_Luo2;~Yu_Qiao1", "gender": ";M;M;M;;M;M;;;", "homepage": "https://github.com/sky-fly97;https://runjian-chen.github.io;https://bobrown.github.io/boZhang.github.io/;https://jiakangyuan.github.io/;;;https://wqshao126.github.io/;;;", "dblp": "314/2496.html;257/4647;36/2259-69;323/7363;;245/8742;227/3122;;;", "google_scholar": "0mMk6PMAAAAJ;_USUMdAAAAAJ;https://scholar.google.com/citations?hl=en;https://scholar.google.com/citations?hl=zh-CN;;K0PpvLkAAAAJ;Bs9mrwwAAAAJ;;;", "orcid": ";0000-0003-0519-496X;0000-0001-8052-782X;;0000-0001-8500-9300;0000-0003-3677-7252;;;;", "linkedin": ";;;;;friskit/;;;;", "or_profile": "~Xiangchao_Yan1;~Runjian_Chen1;~Bo_Zhang17;~Jiakang_Yuan1;~Xinyu_Cai2;~Botian_Shi1;~Wenqi_Shao2;~Junchi_Yan2;~Ping_Luo2;~Yu_Qiao1", "aff": "Shanghai AI Laboratory;University of Hong Kong;Shanghai Artificial Intelligence Laboratory;Shanghai AI Laboratory;Shanghai Artificial Intelligence Laboratory;Shanghai AI Lab;Shanghai AI Laboratory;;;", "aff_domain": "pjlab.org.cn;hku.hk;pjlab.org.cn;pjlab.org.cn;pjlab.org.cn;pjlab.org.cn;pjlab.org.cn;;;", "position": "Researcher;PhD student;Researcher;Intern;Researcher;Researcher;Researcher;;;", "bibtex": "@misc{\nyan2024spot,\ntitle={{SPOT}: Scalable 3D Pre-training via Occupancy Prediction for Autonomous Driving},\nauthor={Xiangchao Yan and Runjian Chen and Bo Zhang and Jiakang Yuan and Xinyu Cai and Botian Shi and Wenqi Shao and Junchi Yan and Ping Luo and Yu Qiao},\nyear={2024},\nurl={https://openreview.net/forum?id=9zEBK3E9bX}\n}", "github": "", "project": "", "reviewers": "y7L9;FWLb;4p2k", "site": "https://openreview.net/forum?id=9zEBK3E9bX", "pdf_size": 4762439, "rating": "3;5;5", "confidence": "4;4;4", "soundness": "2;3;2", "contribution": "2;3;2", "presentation": "3;4;3", "wc_summary": "77;147;85", "wc_strengths": "31;93;59", "wc_weaknesses": "56;368;297", "wc_questions": "39;3;48", "wc_review": "203;611;489", "wc_reply_reviewers": "48;0;0", "wc_reply_authors": "1513;734;4101", "reply_reviewers": "1;0;0", "reply_authors": "6;2;9", "rating_avg": [ 4.333333333333333, 0.9428090415820634 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 3.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 103.0, 31.283648551066843 ], "wc_strengths_avg": [ 61.0, 25.350871122442058 ], "wc_weaknesses_avg": [ 240.33333333333334, 133.52735882790296 ], "wc_questions_avg": [ 30.0, 19.44222209522358 ], "wc_review_avg": [ 434.3333333333333, 170.99187764985277 ], "wc_reply_reviewers_avg": [ 16.0, 22.627416997969522 ], "wc_reply_authors_avg": [ 2116.0, 1439.1847229131731 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 5.666666666666667, 2.8674417556808756 ], "replies_avg": [ 29, 0 ], "authors#_avg": [ 10, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 12, "gs_cited_by_link": 
"https://scholar.google.com/scholar?cites=13020716792976066220&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 0, "aff_unique_index": "0;1;2;0;2;3;0", "aff_unique_norm": "Shanghai AI Laboratory;University of Hong Kong;Shanghai Artificial Intelligence Laboratory;Shanghai AI Lab", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.shanghai-ai-lab.com;https://www.hku.hk;http://www.shailab.org/;https://www.shanghaiailab.com", "aff_unique_abbr": "SAIL;HKU;Shanghai AI Lab;SAIL", "aff_campus_unique_index": "1", "aff_campus_unique": ";Hong Kong SAR", "aff_country_unique_index": "0;0;0;0;0;0;0", "aff_country_unique": "China" }, { "id": "9zHxXaYEgw", "title": "LEO: Generative Latent Image Animator for Human Video Synthesis", "track": "main", "status": "Reject", "tldr": "", "abstract": "Spatio-temporal coherency is a major challenge in synthesizing high quality videos, particularly in synthesizing human videos that contain rich global and local deformations. To resolve this challenge, previous approaches have resorted to different features in the generation process aimed at representing appearance and motion. However, in the absence of strict mechanisms to guarantee such disentanglement, a separation of motion from appearance has remained challenging, resulting in spatial distortions and temporal jittering that break the spatio-temporal coherency. Motivated by this, we here propose LEO, a novel framework for human video synthesis, placing emphasis on spatio-temporal coherency. Our key idea is to represent motion as a sequence of flow maps in the generation process, which inherently isolate motion from appearance. We implement this idea via a flow-based image animator and a Latent Motion Diffusion Model (LMDM). The former bridges a space of motion codes with the space of flow maps, and synthesizes video frames in a warp-and-inpaint manner. LMDM learns to capture motion prior in the training data by synthesizing sequences of motion codes. Extensive quantitative and qualitative analysis suggests that LEO significantly improves coherent synthesis of human videos over previous methods on the datasets TaichiHD, FaceForensics and CelebV-HQ. 
In addition, the effective disentanglement of appearance and motion in LEO allows for two additional tasks, namely infinite-length human video synthesis, as well as content-preserving video editing.", "keywords": "video generation;diffusion models;talking head generation", "primary_area": "generative models", "supplementary_material": "/attachment/d6ecd717dc451a90b2a518048e38a28d685c543a.zip", "author": "Yaohui Wang;Xin Ma;Xinyuan Chen;Cunjian Chen;Antitza Dantcheva;Bo Dai;Yu Qiao", "authorids": "~Yaohui_Wang1;~Xin_Ma3;~Xinyuan_Chen1;~Cunjian_Chen2;~Antitza_Dantcheva1;~Bo_Dai2;~Yu_Qiao1", "gender": "M;;F;M;F;M;", "homepage": "https://wyhsirius.github.io/;https://maxin-cn.github.io/;;https://cunjian.github.io/;https://www-sop.inria.fr/members/Antitza.Dantcheva/;http://daibo.info/;", "dblp": "168/6263-1.html;;;73/2740.html;13/2986;64/2903-2;", "google_scholar": "R7LyAb4AAAAJ;https://scholar.google.com.hk/citations?user=dN8QWCQAAAAJ;3fWSC8YAAAAJ;f26cvh8AAAAJ;https://scholar.google.fr/citations?user=ZMggPHMAAAAJ;https://scholar.google.com.hk/citations?user=KNWTvgEAAAAJ;", "orcid": ";0000-0001-9389-9032;0000-0002-5517-7255;;0000-0003-0107-7029;0000-0003-0777-9232;", "linkedin": ";;;;antitza-dantcheva-ph-d-4b65b24/;;", "or_profile": "~Yaohui_Wang1;~Xin_Ma3;~Xinyuan_Chen1;~Cunjian_Chen2;~Antitza_Dantcheva1;~Bo_Dai2;~Yu_Qiao1", "aff": "Shanghai AI Laboratory;Monash University;Shanghai Artificial Intelligence Laboratory;Monash University;INRIA;Shanghai AI Laboratory;", "aff_domain": "pjlab.org.cn;monash.edu;pjlab.org.cn;monash.edu;inria.fr;pjlab.org.cn;", "position": "Research Scientist;PhD student;Research Scientist;Lecturer;Researcher;Scientist;", "bibtex": "@misc{\nwang2024leo,\ntitle={{LEO}: Generative Latent Image Animator for Human Video Synthesis},\nauthor={Yaohui Wang and Xin Ma and Xinyuan Chen and Cunjian Chen and Antitza Dantcheva and Bo Dai and Yu Qiao},\nyear={2024},\nurl={https://openreview.net/forum?id=9zHxXaYEgw}\n}", "github": "", "project": "", "reviewers": "NikU;8SWB;H4YQ", "site": "https://openreview.net/forum?id=9zHxXaYEgw", "pdf_size": 33226883, "rating": "3;6;6", "confidence": "4;3;4", "soundness": "3;3;3", "contribution": "2;3;3", "presentation": "3;3;3", "wc_summary": "45;74;77", "wc_strengths": "65;80;45", "wc_weaknesses": "46;123;62", "wc_questions": "2;55;30", "wc_review": "158;332;214", "wc_reply_reviewers": "151;165;0", "wc_reply_authors": "1234;746;432", "reply_reviewers": "1;2;0", "reply_authors": "3;2;1", "rating_avg": [ 5.0, 1.4142135623730951 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 65.33333333333333, 14.429907214608907 ], "wc_strengths_avg": [ 63.333333333333336, 14.337208778404378 ], "wc_weaknesses_avg": [ 77.0, 33.1762967593833 ], "wc_questions_avg": [ 29.0, 21.64871050817269 ], "wc_review_avg": [ 234.66666666666666, 72.52279335185287 ], "wc_reply_reviewers_avg": [ 105.33333333333333, 74.70088501632509 ], "wc_reply_authors_avg": [ 804.0, 329.97373632861553 ], "reply_reviewers_avg": [ 1.0, 0.816496580927726 ], "reply_authors_avg": [ 2.0, 0.816496580927726 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.5, "gs_citation": 27, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12488673244627239660&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 8, "aff_unique_index": "0;1;2;1;3;0", "aff_unique_norm": "Shanghai AI Laboratory;Monash 
University;Shanghai Artificial Intelligence Laboratory;INRIA", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.shanghai-ai-lab.com;https://www.monash.edu;http://www.shailab.org/;https://www.inria.fr", "aff_unique_abbr": "SAIL;Monash;Shanghai AI Lab;INRIA", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;0;1;2;0", "aff_country_unique": "China;Australia;France" }, { "title": "Leveraging Generative Models for Unsupervised Alignment of Neural Time Series Data", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19278", "id": "9zhHVyLY4K", "author_site": "Ayesha Vermani, Il Memming Park, Josue Nassar", "tldr": "", "abstract": "Large scale inference models are widely used in neuroscience to extract latent representations from high-dimensional neural recordings. Due to the statistical heterogeneities between sessions and animals, a new model is trained from scratch to infer the underlying dynamics for each new dataset. This is computationally expensive and does not fully leverage all the available data. Moreover, as these models get more complex, they can be challenging to train. In parallel, it is becoming common to use pre-trained models in the machine learning community for few shot and transfer learning. One major hurdle that prevents the re-use of generative models in neuroscience is the complex spatio-temporal structure of neural dynamics within and across animals. Interestingly, the underlying dynamics identified from different datasets on the same task are qualitatively similar. In this work, we exploit this observation and propose a source-free and unsupervised alignment approach that utilizes the learnt dynamics and enables the re-use of trained generative models. We validate our approach on simulations and show the efficacy of the alignment on neural recordings from the motor cortex obtained during a reaching task.", "keywords": "neural dynamics;transfer learning;distribution alignment;neuroscience;few-shot learning", "primary_area": "applications to neuroscience & cognitive science", "supplementary_material": "", "author": "Ayesha Vermani;Il Memming Park;Josue Nassar", "authorids": "~Ayesha_Vermani1;~Il_Memming_Park1;~Josue_Nassar1", "gender": ";M;M", "homepage": ";http://catniplab.github.io/;", "dblp": ";00/4652-2;230/8314", "google_scholar": "https://scholar.google.com/citations?hl=en;CsmltusAAAAJ;a5RNqTYAAAAJ", "orcid": ";0000-0002-4255-7750;", "linkedin": "ayesha-vermani-3825151a2/;memming/;", "or_profile": "~Ayesha_Vermani1;~Il_Memming_Park1;~Josue_Nassar1", "aff": "State University of New York, Stony Brook;Champalimaud Centre for the Unknown;Optum Labs", "aff_domain": "stonybrook.edu;fchampalimaud.org;optum.com", "position": "PhD student;Associate Professor;Researcher", "bibtex": "@inproceedings{\nvermani2024leveraging,\ntitle={Leveraging Generative Models for Unsupervised Alignment of Neural Time Series Data},\nauthor={Ayesha Vermani and Il Memming Park and Josue Nassar},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=9zhHVyLY4K}\n}", "github": "", "project": "", "reviewers": "nsT1;Jh7W;MYCT;H5ee", "pdf_size": 5965413, "rating": "6;6;6;8", "confidence": "3;3;4;4", "soundness": "2;3;3;4", "contribution": "2;3;3;4", "presentation": "2;3;2;3", "wc_summary": "46;87;100;134", "wc_strengths": "36;62;50;84", "wc_weaknesses": "30;132;109;101", "wc_questions": "231;26;19;71", "wc_review": "343;307;278;390", 
"wc_reply_reviewers": "12;12;15;11", "wc_reply_authors": "574;443;360;374", "reply_reviewers": "1;1;1;1", "reply_authors": "2;2;2;2", "rating_avg": [ 6.5, 0.8660254037844386 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 3.0, 0.7071067811865476 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 91.75, 31.499007920885383 ], "wc_strengths_avg": [ 58.0, 17.60681686165901 ], "wc_weaknesses_avg": [ 93.0, 38.11167800031901 ], "wc_questions_avg": [ 86.75, 85.63987097141144 ], "wc_review_avg": [ 329.5, 41.8359892915179 ], "wc_reply_reviewers_avg": [ 12.5, 1.5 ], "wc_reply_authors_avg": [ 437.75, 84.70647850076168 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 2.0, 0.0 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.5773502691896257, "gs_citation": 4, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=140027540675777815&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 2, "openreview": "https://openreview.net/forum?id=9zhHVyLY4K", "pdf": "https://openreview.net/pdf?id=9zhHVyLY4K", "email": "stonybrook.edu;fchampalimaud.org;optum.com", "author_num": 3, "aff_unique_index": "0;1;2", "aff_unique_norm": "State University of New York;Champalimaud Centre for the Unknown;Optum Labs", "aff_unique_dep": ";;", "aff_unique_url": "https://www.stonybrook.edu;https://www.champalimaud.org;https://www.optumlabs.com", "aff_unique_abbr": "SUNY Stony Brook;CCU;", "aff_campus_unique_index": "0", "aff_campus_unique": "Stony Brook;", "aff_country_unique_index": "0;1;0", "aff_country_unique": "United States;Portugal" }, { "id": "9zpOUsOvLM", "title": "Aligning Persistent Homology with Graph Pooling", "track": "main", "status": "Reject", "tldr": "", "abstract": "Recently, there has been an emerging trend to integrate persistent homology (PH) into graph neural networks (GNNs) to enrich expressive power. However, naively plugging PH features into GNN layers always results in marginal improvement with low interpretability. In this paper, we investigate a novel mechanism for injecting global topological invariance into pooling layers using PH, motivated by the observation that filtration operation in PH naturally aligns graph pooling in a cut-off manner. In this fashion, message passing in the coarsened graph is performed along persistent sub-topology, leading to improved performance. Experimentally, we apply our mechanism to a collection of graph pooling methods and observe consistent and substantial performance gain over several popular datasets, demonstrating its wide applicability and flexibility. 
Code is open-sourced at https://anonymous.4open.science/r/TIP.", "keywords": "graph pooling;persistent homology;graph neural networks", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Chaolong Ying;Xinjian Zhao;Tianshu Yu", "authorids": "~Chaolong_Ying1;~Xinjian_Zhao2;~Tianshu_Yu2", "gender": "M;M;M", "homepage": "https://sds.cuhk.edu.cn/node/708;https://sduzxj.github.io//;https://mypage.cuhk.edu.cn/academics/yutianshu/", "dblp": "295/3323;02/8613;152/6675", "google_scholar": "1-O3158AAAAJ;iKuIMsgAAAAJ;MTHO7DsAAAAJ", "orcid": "0000-0002-8555-8817;0009-0003-1553-8209;0000-0002-6537-1924", "linkedin": ";;", "or_profile": "~Chaolong_Ying1;~Xinjian_Zhao2;~Tianshu_Yu2", "aff": "The Chinese University of Hong Kong, Shenzhen;Chinese University of Hong Kong (Shenzhen);Chinese University of Hong Kong (Shenzhen)", "aff_domain": "cuhk.edu.cn;cuhk.edu.cn;cuhk.edu.cn", "position": "PhD student;PhD student;Assistant Professor", "bibtex": "@misc{\nying2024aligning,\ntitle={Aligning Persistent Homology with Graph Pooling},\nauthor={Chaolong Ying and Xinjian Zhao and Tianshu Yu},\nyear={2024},\nurl={https://openreview.net/forum?id=9zpOUsOvLM}\n}", "github": "", "project": "", "reviewers": "r2G4;XtaZ;adEb;S9nw", "site": "https://openreview.net/forum?id=9zpOUsOvLM", "pdf_size": 1443618, "rating": "3;3;5;6", "confidence": "4;4;4;3", "soundness": "2;1;2;4", "contribution": "2;1;2;3", "presentation": "3;2;3;3", "wc_summary": "47;76;49;100", "wc_strengths": "35;32;31;47", "wc_weaknesses": "297;241;242;44", "wc_questions": "134;445;2;332", "wc_review": "513;794;324;523", "wc_reply_reviewers": "47;354;84;11", "wc_reply_authors": "1051;1622;671;479", "reply_reviewers": "1;1;1;1", "reply_authors": "3;4;2;1", "rating_avg": [ 4.25, 1.299038105676658 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.25, 1.0897247358851685 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 68.0, 21.737065119284157 ], "wc_strengths_avg": [ 36.25, 6.378675411086537 ], "wc_weaknesses_avg": [ 206.0, 96.23668739103607 ], "wc_questions_avg": [ 228.25, 171.62222321133123 ], "wc_review_avg": [ 538.5, 167.46716095999238 ], "wc_reply_reviewers_avg": [ 124.0, 135.27564451888597 ], "wc_reply_authors_avg": [ 955.75, 436.2724922568463 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 2.5, 1.118033988749895 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.7777777777777777, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:ZGLE4NwJYyMJ:scholar.google.com/&scioq=Aligning+Persistent+Homology+with+Graph+Pooling&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;0;0", "aff_unique_norm": "Chinese University of Hong Kong", "aff_unique_dep": "", "aff_unique_url": "https://www.cuhk.edu.cn", "aff_unique_abbr": "CUHK", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Shenzhen", "aff_country_unique_index": "0;0;0", "aff_country_unique": "China" }, { "id": "9ztL7Trdnx", "title": "TAFS: Task-aware Activation Function Search for Graph Neural Networks", "track": "main", "status": "Reject", "tldr": "", "abstract": "Since the inception of Graph Neural Networks (GNNs), extensive research efforts have concentrated on enhancing graph convolution, refining pooling operations, devising robust training strategies, and advancing theoretical foundations. 
Notably, one critical facet of current GNN research remains conspicuously underexplored\u2014the design of activation functions. Activation functions serve as pivotal components, imbuing GNNs with the essential capacity for non-linearity. Yet, the ubiquitous adoption of Rectified Linear Units (ReLU) persists.\nIn our study, we embark on a mission to craft task-aware activation functions tailored for diverse GNN applications. We introduce TAFS (Task-aware Activation Function Search), an adept and efficient framework for activation function design. TAFS leverages a streamlined parameterization and frames the problem as a bi-level stochastic optimization challenge. To enhance the search for smooth activation functions, we incorporate additional Lipschitz regularization. Our approach automates the discovery of the optimal activation patterns, customizing them to suit any downstream task seamlessly. Crucially, this entire process unfolds end-to-end without imposing significant computational or memory overhead. Comprehensive experimentation underscores the efficacy of our method. We consistently achieve substantial improvements across a spectrum of tasks, including node classification over diverse graph data. Moreover, our approach surpasses state-of-the-art results in the realm of link-level tasks, particularly in biomedical applications.", "keywords": "Activation Function;Graph Neural Networks;AutoML;Neural Architecture Search", "primary_area": "learning on graphs and other geometries & topologies", "supplementary_material": "/attachment/0aea1b17e69a8e92bb8279c8f63dc4c2b2a7f169.zip", "author": "Zhen Xu;quanming yao;Xiaojin Zhang;Qiang Yang", "authorids": "~Zhen_Xu4;~quanming_yao1;~Xiaojin_Zhang2;~Qiang_Yang1", "gender": "Not Specified;M;F;", "homepage": "https://NehzUx.github.io;https://lars-group.github.io/;https://xiaojin319.github.io/;", "dblp": ";158/1014;69/8512-2;", "google_scholar": "MhE__x0AAAAJ;https://scholar.google.com/schhp?hl=en;https://scholar.google.com/citations?hl=zh-TW;", "orcid": ";;;", "linkedin": ";;;", "or_profile": "~Zhen_Xu4;~quanming_yao1;~Xiaojin_Zhang2;~Qiang_Yang1", "aff": "University of Chicago;Department of Electronic Engineering;Huazhong University of Science and Technology;", "aff_domain": "uchicago.edu;tsinghua.edu.cn;hust.edu.cn;", "position": "PhD student;Assistant Professor;Assistant Professor;", "bibtex": "@misc{\nxu2024tafs,\ntitle={{TAFS}: Task-aware Activation Function Search for Graph Neural Networks},\nauthor={Zhen Xu and quanming yao and Xiaojin Zhang and Qiang Yang},\nyear={2024},\nurl={https://openreview.net/forum?id=9ztL7Trdnx}\n}", "github": "", "project": "", "reviewers": "SDpu;vEQt;kgxw;JLTs", "site": "https://openreview.net/forum?id=9ztL7Trdnx", "pdf_size": 1320361, "rating": "5;5;5;5", "confidence": "5;4;3;3", "soundness": "2;3;3;2", "contribution": "3;2;2;1", "presentation": "4;3;3;3", "wc_summary": "70;128;72;69", "wc_strengths": "37;73;84;27", "wc_weaknesses": "89;136;171;97", "wc_questions": "2;199;4;31", "wc_review": "198;536;331;224", "wc_reply_reviewers": "0;0;0;10", "wc_reply_authors": "1486;1301;1398;1080", "reply_reviewers": "0;0;0;1", "reply_authors": "2;2;2;2", "rating_avg": [ 5.0, 0.0 ], "confidence_avg": [ 3.75, 0.82915619758885 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 84.75, 24.993749218554626 ], "wc_strengths_avg": [ 55.25, 23.836683913665507 ], "wc_weaknesses_avg": [ 123.25, 32.80529682840867 ], "wc_questions_avg": [ 
59.0, 81.63638894512667 ], "wc_review_avg": [ 322.25, 133.09465616620375 ], "wc_reply_reviewers_avg": [ 2.5, 4.330127018922194 ], "wc_reply_authors_avg": [ 1316.25, 151.2818148357561 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 2.0, 0.0 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:TeHRN0G1cAEJ:scholar.google.com/&scioq=TAFS:+Task-aware+Activation+Function+Search+for+Graph+Neural+Networks&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1;2", "aff_unique_norm": "University of Chicago;Institution Name Not Provided;Huazhong University of Science and Technology", "aff_unique_dep": ";Department of Electronic Engineering;", "aff_unique_url": "https://www.uchicago.edu;;http://www.hust.edu.cn", "aff_unique_abbr": "UChicago;;HUST", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;2", "aff_country_unique": "United States;;China" }, { "id": "A0DI5v6m8O", "title": "Black-Box Gradient Matching for Reliable Offline Black-Box Optimization", "track": "main", "status": "Reject", "tldr": "", "abstract": "Offline design optimization problem arises in numerous science and engineering applications including materials engineering, where expensive online experimentation necessitates the use of in silico surrogate functions to predict and maximize the target objective over candidate designs. Although these surrogates can be learned from offline data, their predictions can be potentially inaccurate outside the offline data regime. This challenge raises a fundamental question about the impact of imperfect surrogate model on the performance gap between its optima and the true oracle optima, and to what extent the performance loss can be mitigated. Although prior work developed methods to improve the robustness of surrogate models and their associated optimization processes, a provably quantifiable relationship between an imperfect surrogate and the corresponding performance gap, and whether prior methods directly address it, remain elusive. To shed more light on this important question, we present a novel theoretical formulation to understand offline black-box optimization, by explicitly bounding the optimization quality based on how well the surrogate matches the latent gradient field that underlines the offline data. Inspired by our theoretical analysis, we propose a principled black-box gradient matching algorithm to create effective surrogate models for offline optimization. 
Experiments on diverse real-world benchmarks demonstrate improved optimization quality using our approach to create surrogates.", "keywords": "Offline Optimization;Black-Box Optimization", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/59d372ecc04948c0197dd9e33c167396517be0c5.zip", "author": "Minh Hoang;Azza Fadhel;Aryan Deshwal;Jana Doppa;Trong Nghia Hoang", "authorids": "~Minh_Hoang1;~Azza_Fadhel1;~Aryan_Deshwal1;~Jana_Doppa1;~Trong_Nghia_Hoang1", "gender": "M;F;M;;", "homepage": ";;https://aryandeshwal.github.io/;;", "dblp": ";;246/3012.html;;", "google_scholar": "56Mb6DY0_NUC;;wNEYBrAAAAAJ;;", "orcid": ";;;;", "linkedin": ";azza-fadhel-594a21246/;aryan-deshwal-a27835120/;;", "or_profile": "~Minh_Hoang1;~Azza_Fadhel1;~Aryan_Deshwal1;~Jana_Doppa1;~Trong_Nghia_Hoang1", "aff": "Princeton University;Washington State University at Pullman;University of Minnesota - Twin Cities;;", "aff_domain": "princeton.edu;wsu.edu;umn.edu;;", "position": "Postdoc;PhD student;Assistant Professor;;", "bibtex": "@misc{\nhoang2024blackbox,\ntitle={Black-Box Gradient Matching for Reliable Offline Black-Box Optimization},\nauthor={Minh Hoang and Azza Fadhel and Aryan Deshwal and Jana Doppa and Trong Nghia Hoang},\nyear={2024},\nurl={https://openreview.net/forum?id=A0DI5v6m8O}\n}", "github": "", "project": "", "reviewers": "1MFJ;eLsu;7Vbx;ehny", "site": "https://openreview.net/forum?id=A0DI5v6m8O", "pdf_size": 669087, "rating": "3;5;6;8", "confidence": "4;5;2;4", "soundness": "2;1;3;3", "contribution": "2;1;3;4", "presentation": "3;2;3;4", "wc_summary": "43;139;140;24", "wc_strengths": "19;31;83;11", "wc_weaknesses": "373;159;139;6", "wc_questions": "65;2;94;32", "wc_review": "500;331;456;73", "wc_reply_reviewers": "537;406;0;0", "wc_reply_authors": "1756;1751;995;122", "reply_reviewers": "2;3;0;0", "reply_authors": "4;5;3;1", "rating_avg": [ 5.5, 1.8027756377319946 ], "confidence_avg": [ 3.75, 1.0897247358851685 ], "soundness_avg": [ 2.25, 0.82915619758885 ], "contribution_avg": [ 2.5, 1.118033988749895 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 86.5, 53.42518132865812 ], "wc_strengths_avg": [ 36.0, 28.053520278211074 ], "wc_weaknesses_avg": [ 169.25, 131.51497063072324 ], "wc_questions_avg": [ 48.25, 34.55701810052482 ], "wc_review_avg": [ 340.0, 166.15203880783406 ], "wc_reply_reviewers_avg": [ 235.75, 240.25650355401413 ], "wc_reply_authors_avg": [ 1156.0, 672.514312115363 ], "reply_reviewers_avg": [ 1.25, 1.299038105676658 ], "reply_authors_avg": [ 3.25, 1.479019945774904 ], "replies_avg": [ 25, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.19088542889273336, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:bBQRVXHIg6kJ:scholar.google.com/&scioq=Black-Box+Gradient+Matching+for+Reliable+Offline+Black-Box+Optimization&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;1;2", "aff_unique_norm": "Princeton University;Washington State University;University of Minnesota", "aff_unique_dep": ";;", "aff_unique_url": "https://www.princeton.edu;https://wsu.edu;https://www.minnesota.edu", "aff_unique_abbr": "Princeton;WSU;UMN", "aff_campus_unique_index": "1;2", "aff_campus_unique": ";Pullman;Twin Cities", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "title": "Mechanistically analyzing the effects of fine-tuning on procedurally defined tasks", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19277", 
"id": "A0HKeKl4Nl", "author_site": "Samyak Jain, Robert Kirk, Ekdeep Singh Lubana, Robert Dick, Hidenori Tanaka, Tim Rocktaeschel, Edward Grefenstette, David Krueger", "tldr": "", "abstract": "Fine-tuning large pre-trained models has become the de facto strategy for developing both task-specific and general-purpose machine learning systems, including developing models that are safe to deploy. Despite its clear importance, there has been minimal work that explains how fine-tuning alters the underlying capabilities learned by a model during pretraining: does fine-tuning yield entirely novel capabilities or does it just modulate existing ones? We address this question empirically in synthetic, controlled settings where we can use mechanistic interpretability tools (e.g., network pruning and probing) to understand how the model's underlying capabilities are changing. We perform an extensive analysis of the effects of fine-tuning in these settings, and show that: (i) fine-tuning rarely alters the underlying model capabilities; (ii) a minimal transformation, which we call a `wrapper', is typically learned on top of the underlying model capabilities, creating the illusion that they have been modified; and (iii) further fine-tuning on a task where such ``wrapped capabilities'' are relevant leads to sample-efficient revival of the capability, i.e., the model begins reusing these capabilities after only a few gradient steps. This indicates that practitioners can unintentionally remove a model's safety wrapper merely by fine-tuning it on a, e.g., superficially unrelated, downstream task. We additionally perform analysis on language models trained on the TinyStories dataset to support our claims in a more realistic setup.", "keywords": "Fine-Tuning;Interpretability;Mechanisms", "primary_area": "visualization or interpretation of learned representations", "supplementary_material": "", "author": "Samyak Jain;Robert Kirk;Ekdeep Singh Lubana;Robert P. 
Dick;Hidenori Tanaka;Tim Rockt\u00e4schel;Edward Grefenstette;David Krueger", "authorids": "~Samyak_Jain1;~Robert_Kirk1;~Ekdeep_Singh_Lubana1;~Robert_P._Dick1;~Hidenori_Tanaka1;~Tim_Rockt\u00e4schel1;~Edward_Grefenstette1;~David_Krueger1", "gender": "M;M;M;M;;M;M;M", "homepage": "https://samyakjain0112.github.io/;https://robertkirk.github.io;https://ekdeepslubana.github.io/;http://robertdick.org/;https://sites.google.com/view/htanaka/home;http://egrefen.com/;https://mila.umontreal.ca/en/person/david-scott-krueger/;http://rockt.ai", "dblp": "249/4464.html;01/9684;228/2683;84/523.html;;http://dblp.uni-trier.de/pers/hd/g/Grefenstette:Edward;142/2741.html;43/11537", "google_scholar": "https://scholar.google.co.in/citations?hl=en;https://scholar.google.co.uk/citations?user=PL5KWdYAAAAJ;https://scholar.google.co.in/citations?user=OP7S3vsAAAAJ;;f_pWOGIAAAAJ;https://scholar.google.co.uk/citations?user=ezllEwMAAAAJ;https://scholar.google.ca/citations?user=5Uz70IoAAAAJ;https://scholar.google.co.uk/citations?user=mWBY8aIAAAAJ", "orcid": "0000-0003-3785-4782;;;;;;;", "linkedin": "samyak-jain-276738178/;;;;;;;rockt/", "or_profile": "~Samyak_Jain1;~Robert_Kirk1;~Ekdeep_Singh_Lubana1;~Robert_P._Dick1;~Hidenori_Tanaka1;~Edward_Grefenstette1;~David_Krueger1;~Tim_Rocktaeschel1", "aff": "Five AI;University College London;University of Michigan;University of Michigan;Physics & Informatics Lab, NTT Research, Inc.;Google DeepMind;University of Cambridge;Google DeepMind", "aff_domain": "five.ai;ucl.ac.uk;umich.edu;umich.edu;ntt-research.com;deepmind.com;cam.ac.uk;google.com", "position": "Intern;PhD student;PhD student;Full Professor;Senior Research Scientist;Principal Researcher;Assistant Professor;Senior Staff Research Scientist", "bibtex": "@inproceedings{\njain2024mechanistically,\ntitle={Mechanistically analyzing the effects of fine-tuning on procedurally defined tasks},\nauthor={Samyak Jain and Robert Kirk and Ekdeep Singh Lubana and Robert P. 
Dick and Hidenori Tanaka and Tim Rockt{\\\"a}schel and Edward Grefenstette and David Krueger},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=A0HKeKl4Nl}\n}", "github": "", "project": "", "reviewers": "GZdd;wEP2;eQAm", "pdf_size": 5401464, "rating": "6;6;8", "confidence": "4;4;4", "soundness": "3;2;4", "contribution": "3;3;3", "presentation": "2;2;3", "wc_summary": "21;78;51", "wc_strengths": "60;126;90", "wc_weaknesses": "402;630;253", "wc_questions": "7;6;19", "wc_review": "490;840;413", "wc_reply_reviewers": "0;28;63", "wc_reply_authors": "938;1616;2040", "reply_reviewers": "0;1;1", "reply_authors": "2;3;3", "rating_avg": [ 6.666666666666667, 0.9428090415820634 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 3.0, 0.816496580927726 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 2.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 50.0, 23.280893453645632 ], "wc_strengths_avg": [ 92.0, 26.981475126464083 ], "wc_weaknesses_avg": [ 428.3333333333333, 155.0318963597133 ], "wc_questions_avg": [ 10.666666666666666, 5.90668171555645 ], "wc_review_avg": [ 581.0, 185.8189082592691 ], "wc_reply_reviewers_avg": [ 30.333333333333332, 25.77250904010361 ], "wc_reply_authors_avg": [ 1531.3333333333333, 453.8555815332548 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 2.6666666666666665, 0.4714045207910317 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 62, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=3773752858357865751&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 10, "openreview": "https://openreview.net/forum?id=A0HKeKl4Nl", "pdf": "https://openreview.net/pdf?id=A0HKeKl4Nl", "email": "five.ai;ucl.ac.uk;umich.edu;umich.edu;ntt-research.com;deepmind.com;cam.ac.uk;google.com", "author_num": 8, "aff_unique_index": "0;1;2;2;3;4;5;4", "aff_unique_norm": "Five AI;University College London;University of Michigan;NTT Research, Inc.;Google;University of Cambridge", "aff_unique_dep": ";;;Physics & Informatics Lab;Google DeepMind;", "aff_unique_url": "https://www.five.ai;https://www.ucl.ac.uk;https://www.umich.edu;https://www.ntt-research.com;https://deepmind.com;https://www.cam.ac.uk", "aff_unique_abbr": "Five AI;UCL;UM;NTT Research;DeepMind;Cambridge", "aff_campus_unique_index": "1", "aff_campus_unique": ";Cambridge", "aff_country_unique_index": "0;0;1;1;1;0;0;0", "aff_country_unique": "United Kingdom;United States" }, { "title": "Course Correcting Koopman Representations", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19276", "id": "A18gWgc5mi", "author_site": "Mahan Fathi, Clement Gehring, Jonathan Pilault, David Kanaa, Pierre-Luc Bacon, Ross Goroshin", "tldr": "", "abstract": "Koopman representations aim to learn features of nonlinear dynamical systems (NLDS) which lead to linear dynamics in the latent space. Theoretically, such features can be used to simplify many problems in modeling and control of NLDS. In this work we study autoencoder formulations of this problem, and different ways they can be used to model dynamics, specifically for future state prediction over long horizons. We discover several limitations of predicting future states in the latent space and propose an inference-time mechanism, which we refer to as Periodic Reencoding, for faithfully capturing long term dynamics. 
We justify this method both analytically and empirically via experiments in low and high dimensional NLDS.", "keywords": "Koopman;Autoencoders;Dynamical Systems;Sequence Modeling;Inference-time Methods;Planning;Unsupervised Learning;Representation Learning;Robotics", "primary_area": "applications to robotics, autonomy, planning", "supplementary_material": "/attachment/8bf353eea7668c39a57b740083ffac9e690d322e.pdf", "author": "Mahan Fathi;Clement Gehring;Jonathan Pilault;David Kanaa;Pierre-Luc Bacon;Ross Goroshin", "authorids": "~Mahan_Fathi1;~Clement_Gehring1;~Jonathan_Pilault1;~David_Kanaa1;~Pierre-Luc_Bacon1;~Ross_Goroshin1", "gender": "M;M;;;;", "homepage": "https://mahanfathi.github.io/;http://people.csail.mit.edu/gehring/;;;;", "dblp": ";131/5247;248/8053.html;;;", "google_scholar": ";KvX7mJUAAAAJ;https://scholar.google.com/citations?hl=en;;;EC4o-1oAAAAJ", "orcid": ";;;;;", "linkedin": "mahanfathi/;;jonathanpilault/;;;", "or_profile": "~Mahan_Fathi1;~Clement_Gehring1;~Jonathan_Pilault1;~David_Kanaa1;~Pierre-Luc_Bacon1;~Ross_Goroshin1", "aff": "Mila;Massachusetts Institute of Technology;Polytechnique Montreal;;;Google", "aff_domain": "mila.quebec;mit.edu;polymtl.ca;;;google.com", "position": "MS student;PhD student;PhD student;;;Research Scientist", "bibtex": "@inproceedings{\nfathi2024course,\ntitle={Course Correcting Koopman Representations},\nauthor={Mahan Fathi and Clement Gehring and Jonathan Pilault and David Kanaa and Pierre-Luc Bacon and Ross Goroshin},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=A18gWgc5mi}\n}", "github": "", "project": "", "reviewers": "f4vn;Fg8g;FYpR;Woag;QVMC", "pdf_size": 30922143, "rating": "6;6;6;8;8", "confidence": "2;3;2;3;4", "soundness": "3;3;3;4;4", "contribution": "2;2;3;4;3", "presentation": "3;3;3;4;3", "wc_summary": "422;57;70;54;119", "wc_strengths": "89;18;14;24;57", "wc_weaknesses": "510;138;156;33;368", "wc_questions": "141;26;100;24;3", "wc_review": "1162;239;340;135;547", "wc_reply_reviewers": "0;81;0;11;112", "wc_reply_authors": "1450;656;895;291;1591", "reply_reviewers": "0;1;0;1;3", "reply_authors": "3;2;3;1;4", "rating_avg": [ 6.8, 0.9797958971132712 ], "confidence_avg": [ 2.8, 0.7483314773547882 ], "soundness_avg": [ 3.4, 0.4898979485566356 ], "contribution_avg": [ 2.8, 0.7483314773547882 ], "presentation_avg": [ 3.2, 0.39999999999999997 ], "wc_summary_avg": [ 144.4, 140.75027531056557 ], "wc_strengths_avg": [ 40.4, 28.653795560099887 ], "wc_weaknesses_avg": [ 241.0, 172.96704888504053 ], "wc_questions_avg": [ 58.8, 52.63990881451069 ], "wc_review_avg": [ 484.6, 365.02416358372767 ], "wc_reply_reviewers_avg": [ 40.8, 46.6964666757561 ], "wc_reply_authors_avg": [ 976.6, 486.0216456085058 ], "reply_reviewers_avg": [ 1.0, 1.0954451150103321 ], "reply_authors_avg": [ 2.6, 1.019803902718557 ], "replies_avg": [ 27, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.7637626158259733, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=16303568290070259858&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=A18gWgc5mi", "pdf": "https://openreview.net/pdf?id=A18gWgc5mi", "email": "mila.quebec;mit.edu;polymtl.ca;;;google.com", "author_num": 6, "aff_unique_index": "0;1;2;3", "aff_unique_norm": "Mila;Massachusetts Institute of Technology;Polytechnique Montreal;Google", "aff_unique_dep": "Quebec Artificial Intelligence Institute;;;Google", "aff_unique_url": 
"https://mila.quebec;https://web.mit.edu;https://www.polymtl.ca;https://www.google.com", "aff_unique_abbr": "Mila;MIT;PolyMTL;Google", "aff_campus_unique_index": "1;2", "aff_campus_unique": ";Montreal;Mountain View", "aff_country_unique_index": "0;1;0;1", "aff_country_unique": "Canada;United States" }, { "id": "A1z0JnxnGp", "title": "Power Characterization of Noisy Quantum Kernels", "track": "main", "status": "Reject", "tldr": "", "abstract": "Quantum kernel methods have been widely recognized as one of promising quantum machine learning algorithms that have potential to achieve quantum advantages. In this paper, we theoretically characterize the power of noisy quantum kernels and demonstrate that under global depolarization noise, for different input data the predictions of the optimal hypothesis inferred by the noisy quantum kernel approximately concentrate towards some fixed value. In particular, we depict the convergence rate in terms of the strength of quantum noise, the size of training samples, the number of qubits, the number of layers affected by quantum noises, as well as the number of measurement shots. Our results show that noises may make quantum kernel methods to only have poor prediction capability, even when the generalization error is small. Thus, we provide a crucial warning to employ noisy quantum kernel methods for quantum computation and the theoretical results can also serve as guidelines when developing practical quantum kernel algorithms for achieving quantum advantages.", "keywords": "quantum kernel;quantum machine learning;prediction capability;noisy quantum circuit", "primary_area": "metric learning, kernel learning, and sparse coding", "supplementary_material": "", "author": "Yabo Wang;Bo Qi;Xin Wang;Tongliang Liu;Daoyi Dong", "authorids": "~Yabo_Wang1;~Bo_Qi1;~Xin_Wang75;~Tongliang_Liu1;~Daoyi_Dong1", "gender": ";M;M;M;M", "homepage": "https://github.com/yabowang23;;https://sheffieldwang.github.io/;https://tongliang-liu.github.io/;https://profiles.uts.edu.au/Daoyi.Dong", "dblp": ";;;150/6667;27/3317", "google_scholar": ";;;https://scholar.google.com.au/citations?user=EiLdZ_YAAAAJ;https://scholar.google.com.au/citations?hl=en", "orcid": ";0000-0002-4504-0124;;;0000-0002-7425-3559", "linkedin": ";;;;", "or_profile": "~Yabo_Wang1;~Bo_Qi1;~Xin_Wang75;~Tongliang_Liu1;~Daoyi_Dong1", "aff": "Academy of Mathematics and Systems Science, Chinese Academy of Sciences, Chinese Academy of Sciences;Academy of Mathematics and Systems Science, Chinese Academy of Sciences;Academy of Mathematics and Systems Science, Chinese Academy of Sciences, Chinese Academy of Sciences;Mohamed bin Zayed University of Artificial Intelligence;Australian National University", "aff_domain": "amss.ac.cn;amss.ac.cn;amss.ac.cn;mbzuai.ac.ae;anu.edu.au", "position": "PhD student;Associate Professor;MS student;Affiliated Associate Professor;Full Professor", "bibtex": "@misc{\nwang2024power,\ntitle={Power Characterization of Noisy Quantum Kernels},\nauthor={Yabo Wang and Bo Qi and Xin Wang and Tongliang Liu and Daoyi Dong},\nyear={2024},\nurl={https://openreview.net/forum?id=A1z0JnxnGp}\n}", "github": "", "project": "", "reviewers": "8JA5;XjgB;5XBn;VA13;M7Gm", "site": "https://openreview.net/forum?id=A1z0JnxnGp", "pdf_size": 508969, "rating": "3;5;5;5;6", "confidence": "3;4;4;4;3", "soundness": "2;3;3;2;4", "contribution": "2;2;2;2;2", "presentation": "3;2;3;4;3", "wc_summary": "60;138;82;43;104", "wc_strengths": "41;79;74;56;88", "wc_weaknesses": "127;129;131;108;124", "wc_questions": "38;162;33;45;38", 
"wc_review": "266;508;320;252;354", "wc_reply_reviewers": "57;40;68;172;151", "wc_reply_authors": "943;1662;1231;1259;598", "reply_reviewers": "1;1;1;1;1", "reply_authors": "4;4;4;2;3", "rating_avg": [ 4.8, 0.9797958971132712 ], "confidence_avg": [ 3.6, 0.4898979485566356 ], "soundness_avg": [ 2.8, 0.7483314773547882 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 3.0, 0.6324555320336759 ], "wc_summary_avg": [ 85.4, 33.368248380758615 ], "wc_strengths_avg": [ 67.6, 16.906803364326446 ], "wc_weaknesses_avg": [ 123.8, 8.23164625090267 ], "wc_questions_avg": [ 63.2, 49.547552916365106 ], "wc_review_avg": [ 340.0, 91.6951470907812 ], "wc_reply_reviewers_avg": [ 97.6, 53.34641506230761 ], "wc_reply_authors_avg": [ 1138.6, 354.25674305508994 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 3.4, 0.8 ], "replies_avg": [ 31, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.25000000000000006, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=13191641656876513006&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "aff_unique_index": "0;0;0;1;2", "aff_unique_norm": "Chinese Academy of Sciences;Mohamed bin Zayed University of Artificial Intelligence;Australian National University", "aff_unique_dep": "Academy of Mathematics and Systems Science;;", "aff_unique_url": "http://www.cas.cn;https://mbzuai.ac.ae;https://www.anu.edu.au", "aff_unique_abbr": "CAS;MBZUAI;ANU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;1;2", "aff_country_unique": "China;United Arab Emirates;Australia" }, { "id": "A2KKgcYYDB", "title": "Global Convergence Rate of Deep Equilibrium Models with General Activations", "track": "main", "status": "Reject", "tldr": "", "abstract": "In a recent paper, Ling et al. investigated the over-parametrized Deep Equilibrium Model (DEQ) with ReLU activation. They proved that the gradient descent converges to a globally optimal solution at a linear convergence rate for the quadratic loss function. This paper shows that this fact still holds for DEQs with any general activation that has bounded first and second derivatives. Since the new activation function is generally non-linear, bounding the least eigenvalue of the Gram matrix of the equilibrium point is particularly challenging. To accomplish this task, we need to create a novel population Gram matrix and develop a new form of dual activation with Hermite polynomial expansion.", "keywords": "Deep Learning;Deep Equilibrium Model;Gradient Descent Convergence;Hermite Polynomial Expansion", "primary_area": "learning theory", "supplementary_material": "", "author": "Lan V. Truong", "authorids": "~Lan_V._Truong1", "gender": "M", "homepage": "https://sites.google.com/site/truongvinhlan/", "dblp": "91/11265.html", "google_scholar": "BCoSKrQAAAAJ", "orcid": "", "linkedin": "", "or_profile": "~Lan_Vinh_Truong1", "aff": "University of Essex", "aff_domain": "essex.ac.uk", "position": "Lecturer", "bibtex": "@misc{\ntruong2024global,\ntitle={Global Convergence Rate of Deep Equilibrium Models with General Activations},\nauthor={Lan V. 
Truong},\nyear={2024},\nurl={https://openreview.net/forum?id=A2KKgcYYDB}\n}", "github": "", "project": "", "reviewers": "pmW6;fu3L;ubP5;SDT1", "site": "https://openreview.net/forum?id=A2KKgcYYDB", "pdf_size": 430501, "rating": "1;3;5;6", "confidence": "2;5;4;3", "soundness": "2;3;3;3", "contribution": "1;2;2;2", "presentation": "1;2;2;2", "wc_summary": "27;47;142;76", "wc_strengths": "11;92;123;51", "wc_weaknesses": "178;149;444;98", "wc_questions": "39;2;50;16", "wc_review": "255;290;759;241", "wc_reply_reviewers": "588;0;380;9", "wc_reply_authors": "669;490;1261;170", "reply_reviewers": "1;0;3;1", "reply_authors": "1;1;4;1", "rating_avg": [ 3.75, 1.920286436967152 ], "confidence_avg": [ 3.5, 1.118033988749895 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 1.75, 0.4330127018922193 ], "wc_summary_avg": [ 73.0, 43.47988040461933 ], "wc_strengths_avg": [ 69.25, 42.22780482099442 ], "wc_weaknesses_avg": [ 217.25, 134.01002760987703 ], "wc_questions_avg": [ 26.75, 18.833148966649205 ], "wc_review_avg": [ 386.25, 215.9460291369119 ], "wc_reply_reviewers_avg": [ 244.25, 250.79511059827303 ], "wc_reply_authors_avg": [ 647.5, 396.75464710573965 ], "reply_reviewers_avg": [ 1.25, 1.0897247358851685 ], "reply_authors_avg": [ 1.75, 1.299038105676658 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 1, 0 ], "corr_rating_confidence": 0.29111125486979095, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5049746081414068337&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "aff_unique_index": "0", "aff_unique_norm": "University of Essex", "aff_unique_dep": "", "aff_unique_url": "https://www.essex.ac.uk", "aff_unique_abbr": "Essex", "aff_country_unique_index": "0", "aff_country_unique": "United Kingdom" }, { "title": "Semantic Flow: Learning Semantic Fields of Dynamic Scenes from Monocular Videos", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19275", "id": "A2mRcRyGdl", "author_site": "Fengrui Tian, Yueqi Duan, Angtian Wang, Jianfei Guo, Shaoyi Du", "tldr": "", "abstract": "In this work, we pioneer Semantic Flow, a neural semantic representation of dynamic scenes from monocular videos. In contrast to previous NeRF methods that reconstruct dynamic scenes from the colors and volume densities of individual points, Semantic Flow learns semantics from continuous flows that contain rich 3D motion information. As there is 2D-to-3D ambiguity problem in the viewing direction when extracting 3D flow features from 2D video frames, we consider the volume densities as opacity priors that describe the contributions of flow features to the semantics on the frames. More specifically, we first learn a flow network to predict flows in the dynamic scene, and propose a flow feature aggregation module to extract flow features from video frames. Then, we propose a flow attention module to extract motion information from flow features, which is followed by a semantic network to output semantic logits of flows. We integrate the logits with\nvolume densities in the viewing direction to supervise the flow features with semantic labels on video frames. 
Experimental results show that our model is able to learn from multiple dynamic scenes and supports a series of new tasks such as instance-level scene editing, semantic completions, dynamic scene tracking and semantic adaption on novel scenes.", "keywords": "3D vision;NeRF;semantic understanding", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/a151f48e53dbd76f25d3817e0b2f656802151425.zip", "author": "Fengrui Tian;Yueqi Duan;Angtian Wang;Jianfei Guo;Shaoyi Du", "authorids": "~Fengrui_Tian1;~Yueqi_Duan1;~Angtian_Wang2;~Jianfei_Guo1;~Shaoyi_Du1", "gender": "M;M;M;M;", "homepage": "https://tianfr.github.io/;https://duanyueqi.github.io/;https://angtianwang.github.io/;https://ventusff.github.io;", "dblp": "336/7668;168/8373;;305/7388.html;", "google_scholar": "https://scholar.google.com/citations?hl=en;qDseo3cAAAAJ;YR7re-cAAAAJ;MJb2_wYAAAAJ;", "orcid": "0000-0002-9577-5276;;;0000-0002-5838-679X;", "linkedin": ";;;;", "or_profile": "~Fengrui_Tian1;~Yueqi_Duan1;~Angtian_Wang2;~Jianfei_Guo1;~Shaoyi_Du1", "aff": "Xi'an Jiaotong University;Tsinghua University;Johns Hopkins University;Shanghai Artificial Intelligence Laboratory;", "aff_domain": "xjtu.edu.cn;tsinghua.edu.cn;jhu.edu;pjlab.org.cn;", "position": "MS student;Assistant Professor;PhD student;Researcher;", "bibtex": "@inproceedings{\ntian2024semantic,\ntitle={Semantic Flow: Learning Semantic Fields of Dynamic Scenes from Monocular Videos},\nauthor={Fengrui Tian and Yueqi Duan and Angtian Wang and Jianfei Guo and Shaoyi Du},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=A2mRcRyGdl}\n}", "github": "", "project": "", "reviewers": "QtRh;xtsS;5VQj", "pdf_size": 16230649, "rating": "5;6;8", "confidence": "4;4;3", "soundness": "3;3;3", "contribution": "2;2;3", "presentation": "3;3;3", "wc_summary": "126;69;54", "wc_strengths": "136;65;66", "wc_weaknesses": "283;180;81", "wc_questions": "80;20;62", "wc_review": "625;334;263", "wc_reply_reviewers": "91;149;0", "wc_reply_authors": "1370;1129;348", "reply_reviewers": "1;3;0", "reply_authors": "4;5;1", "rating_avg": [ 6.333333333333333, 1.247219128924647 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 83.0, 31.016124838541646 ], "wc_strengths_avg": [ 89.0, 33.23652609203716 ], "wc_weaknesses_avg": [ 181.33333333333334, 82.47154391398014 ], "wc_questions_avg": [ 54.0, 25.13961017995307 ], "wc_review_avg": [ 407.3333333333333, 156.6191417278091 ], "wc_reply_reviewers_avg": [ 80.0, 61.32427469335994 ], "wc_reply_authors_avg": [ 949.0, 436.2117222939643 ], "reply_reviewers_avg": [ 1.3333333333333333, 1.247219128924647 ], "reply_authors_avg": [ 3.3333333333333335, 1.699673171197595 ], "replies_avg": [ 21, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.944911182523068, "gs_citation": 5, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=18433628933461041863&as_sdt=40005&sciodt=0,10&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=A2mRcRyGdl", "pdf": "https://openreview.net/pdf?id=A2mRcRyGdl", "email": "xjtu.edu.cn;tsinghua.edu.cn;jhu.edu;pjlab.org.cn;", "author_num": 5, "aff_unique_index": "0;1;2;3", "aff_unique_norm": "Xi'an Jiao Tong University;Tsinghua University;Johns Hopkins University;Shanghai Artificial 
Intelligence Laboratory", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.xjtu.edu.cn;https://www.tsinghua.edu.cn;https://www.jhu.edu;http://www.shailab.org/", "aff_unique_abbr": "XJTU;THU;JHU;Shanghai AI Lab", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;1;0", "aff_country_unique": "China;United States" }, { "id": "A4YlfnbaSD", "title": "Overcoming the Stability Gap in Continual Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "In many real-world applications, deep neural networks are retrained from scratch as a dataset grows in size. Given the computational expense for retraining networks, it has been argued that continual learning could make updating networks more efficient. An obstacle to achieving this goal is the stability gap, which refers to an observation that when updating on new data, performance on previously learned data degrades before recovering. Addressing this problem would enable learning new data with fewer network updates, resulting in increased computational efficiency. We study how to mitigate the stability gap. We test a variety of hypotheses to understand why the stability gap occurs. This leads us to discover a method that vastly reduces this gap. In large-scale class incremental learning experiments, we are able to significantly reduce the number of network updates needed for continual learning. Our work has the potential to advance the state-of-the-art in continual learning for real-world applications along with reducing the carbon footprint required to maintain updated neural networks.", "keywords": "Continual Learning;Catastrophic Forgetting;Stability Gap;Stability-Plasticity Dilemma", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "/attachment/15ba233b64c3c5ce3183ed3d71147ce77a34f3fd.pdf", "author": "Md Yousuf Harun;Christopher Kanan", "authorids": "~Md_Yousuf_Harun1;~Christopher_Kanan1", "gender": "M;M", "homepage": "https://yousuf907.github.io;https://chriskanan.com/", "dblp": ";14/8653", "google_scholar": "https://scholar.google.com/citations?hl=en;jMxZjBoAAAAJ", "orcid": "0000-0001-6544-6159;0000-0002-6412-995X", "linkedin": "md-yousuf-harun-71748572;chriskanan/", "or_profile": "~Md_Yousuf_Harun1;~Christopher_Kanan1", "aff": "Rochester Institute of Technology;University of Rochester", "aff_domain": "rit.edu;rochester.edu", "position": "PhD student;Associate Professor", "bibtex": "@misc{\nharun2024overcoming,\ntitle={Overcoming the Stability Gap in Continual Learning},\nauthor={Md Yousuf Harun and Christopher Kanan},\nyear={2024},\nurl={https://openreview.net/forum?id=A4YlfnbaSD}\n}", "github": "", "project": "", "reviewers": "EKNY;9Qg6;wwBV;2UBD", "site": "https://openreview.net/forum?id=A4YlfnbaSD", "pdf_size": 5703220, "rating": "3;5;5;5", "confidence": "4;4;5;4", "soundness": "3;3;3;3", "contribution": "2;2;2;2", "presentation": "3;3;2;3", "wc_summary": "185;143;101;83", "wc_strengths": "26;87;41;64", "wc_weaknesses": "205;351;276;105", "wc_questions": "115;47;194;138", "wc_review": "531;628;612;390", "wc_reply_reviewers": "0;221;0;0", "wc_reply_authors": "764;874;1137;1073", "reply_reviewers": "0;1;0;0", "reply_authors": "1;3;2;2", "rating_avg": [ 4.5, 0.8660254037844386 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 128.0, 39.45883931389772 ], "wc_strengths_avg": [ 54.5, 23.13547060251855 
], "wc_weaknesses_avg": [ 234.25, 90.73966883342698 ], "wc_questions_avg": [ 123.5, 52.690131903421914 ], "wc_review_avg": [ 540.25, 94.21882773628634 ], "wc_reply_reviewers_avg": [ 55.25, 95.69580711818047 ], "wc_reply_authors_avg": [ 962.0, 149.91164064207956 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 2.0, 0.7071067811865476 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.3333333333333333, "gs_citation": 14, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5029589355732838682&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "aff_unique_index": "0;1", "aff_unique_norm": "Rochester Institute of Technology;University of Rochester", "aff_unique_dep": ";", "aff_unique_url": "https://www.rit.edu;https://www.rochester.edu", "aff_unique_abbr": "RIT;U of R", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "title": "Dirichlet-based Per-Sample Weighting by Transition Matrix for Noisy Label Learning", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19274", "id": "A4mJuFRMN8", "author_site": "HeeSun Bae, Seungjae Shin, Byeonghu Na, Il-chul Moon", "tldr": "", "abstract": "For learning with noisy labels, the transition matrix, which explicitly models the relation between noisy label distribution and clean label distribution, has been utilized to achieve the statistical consistency of either the classifier or the risk. Previous researches have focused more on how to estimate this transition matrix well, rather than how to utilize it. We propose good utilization of the transition matrix is crucial and suggest a new utilization method based on resampling, coined RENT. Specifically, we first demonstrate current utilizations can have potential limitations for implementation. As an extension to Reweighting, we suggest the Dirichlet distribution-based per-sample Weight Sampling (DWS) framework, and compare reweighting and resampling under DWS framework. With the analyses from DWS, we propose RENT, a REsampling method with Noise Transition matrix. Empirically, RENT consistently outperforms existing transition matrix utilization methods, which includes reweighting, on various benchmark datasets. 
Our code is available at https://github.com/BaeHeeSun/RENT.", "keywords": "learning with noisy label;noisy label classification;Transition matrix;Dirichlet distribution;Importance sampling", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "HeeSun Bae;Seungjae Shin;Byeonghu Na;Il-chul Moon", "authorids": "~HeeSun_Bae1;~Seungjae_Shin1;~Byeonghu_Na1;~Il-chul_Moon1", "gender": "F;M;M;", "homepage": ";https://sites.google.com/view/seungjae-shin;https://sites.google.com/view/byeonghu-na;", "dblp": ";29/551;276/5100;", "google_scholar": "https://scholar.google.co.kr/citations?user=D9U_ohsAAAAJ;https://scholar.google.com/citations?hl=en;https://scholar.google.co.kr/citations?user=mJoqpmEAAAAJ;", "orcid": "0000-0002-9986-0945;;0000-0003-3463-2674;", "linkedin": "heesun-bae-8a4b8523a/;seungjae-shin-hoodie/;byeonghu-na-17942120b/;", "or_profile": "~HeeSun_Bae1;~Seungjae_Shin1;~Byeonghu_Na1;~Il-chul_Moon1", "aff": "Korea Advanced Institute of Science & Technology;Korea Advanced Institute of Science & Technology;Korea Advanced Institute of Science & Technology;", "aff_domain": "kaist.ac.kr;kaist.ac.kr;kaist.ac.kr;", "position": "PhD student;PhD student;PhD student;", "bibtex": "@inproceedings{\nbae2024dirichletbased,\ntitle={Dirichlet-based Per-Sample Weighting by Transition Matrix for Noisy Label Learning},\nauthor={HeeSun Bae and Seungjae Shin and Byeonghu Na and Il-chul Moon},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=A4mJuFRMN8}\n}", "github": "", "project": "", "reviewers": "z7WX;4M7K;KTbE;HW3A;Epey;hEe7", "pdf_size": 8461139, "rating": "5;6;6;6;6;6", "confidence": "3;4;4;3;3;3", "soundness": "3;3;3;2;3;2", "contribution": "2;3;2;2;3;3", "presentation": "2;2;3;3;3;2", "wc_summary": "64;41;94;62;77;97", "wc_strengths": "61;47;54;55;31;136", "wc_weaknesses": "172;127;100;105;186;50", "wc_questions": "54;22;9;140;28;64", "wc_review": "351;237;257;362;322;347", "wc_reply_reviewers": "0;30;45;84;38;0", "wc_reply_authors": "1757;587;613;2669;327;1119", "reply_reviewers": "0;1;1;1;1;0", "reply_authors": "4;3;2;6;2;4", "rating_avg": [ 5.833333333333333, 0.372677996249965 ], "confidence_avg": [ 3.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 72.5, 19.397164741270824 ], "wc_strengths_avg": [ 64.0, 33.54598833442433 ], "wc_weaknesses_avg": [ 123.33333333333333, 45.766314638121735 ], "wc_questions_avg": [ 52.833333333333336, 43.229683731847445 ], "wc_review_avg": [ 312.6666666666667, 48.29308669180531 ], "wc_reply_reviewers_avg": [ 32.833333333333336, 28.742631906088363 ], "wc_reply_authors_avg": [ 1178.6666666666667, 811.8402278500096 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 3.5, 1.3844373104863459 ], "replies_avg": [ 35, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.31622776601683783, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:hAGhZb9SFH4J:scholar.google.com/&scioq=Dirichlet-based+Per-Sample+Weighting+by+Transition+Matrix+for+Noisy+Label+Learning&hl=en&as_sdt=0,5", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=A4mJuFRMN8", "pdf": "https://openreview.net/pdf?id=A4mJuFRMN8", "email": "kaist.ac.kr;kaist.ac.kr;kaist.ac.kr;", "author_num": 4, 
"aff_unique_index": "0;0;0", "aff_unique_norm": "Korea Advanced Institute of Science and Technology", "aff_unique_dep": "", "aff_unique_url": "https://www.kaist.ac.kr", "aff_unique_abbr": "KAIST", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "South Korea" }, { "id": "A5nLEfjhJW", "title": "SHARCS: SHARed Concept Space for\\\\Explainable Multimodal Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "Multimodal learning is an essential paradigm for addressing complex real-world problems, where individual data modalities are typically insufficient for accurately solving a given modelling task. While various deep learning approaches have successfully addressed these challenges, their reasoning process is often opaque; limiting the capabilities for a principled explainable cross-modal analysis and any domain-expert intervention. In this paper, we introduce SHARCS (SHARed Concept Space) -- a novel concept-based approach for explainable multimodal learning. SHARCS learns and maps interpretable concepts from different heterogeneous modalities into a single unified concept-manifold, which leads to an intuitive projection of semantically similar cross-modal concepts. We demonstrate that such an approach can lead to inherently explainable task predictions while also improving downstream predictive performance. Moreover, we show that SHARCS can operate and significantly outperform other approaches in practically significant scenarios, such as retrieval of missing modalities and cross-modal explanations. Our approach is model agnostic and easily applicable to different types (and number) of modalities, thus advancing the development of effective, interpretable, and trustworthy multimodal approaches.", "keywords": "Explainable AI;Multimodal Learning;Concept Based Models", "primary_area": "visualization or interpretation of learned representations", "supplementary_material": "/attachment/77fa16b490d1cb28d040a45c5a5db8e4a85479d8.zip", "author": "Gabriele Dominici;Pietro Barbiero;Lucie Charlotte Magister;Pietro Lio;Nikola Simidjievski", "authorids": "~Gabriele_Dominici1;~Pietro_Barbiero1;~Lucie_Charlotte_Magister1;~Pietro_Lio1;~Nikola_Simidjievski1", "gender": "M;M;F;M;Unspecified", "homepage": ";http://www.pietrobarbiero.eu/;;https://www.cst.cam.ac.uk/people/pl219;https://simidjievskin.github.io/", "dblp": "351/0657;238/7860;298/1032;l/PietroLio.html;", "google_scholar": "https://scholar.google.com/citations?view_op=list_works;https://scholar.google.it/citations?user=4gbToQoAAAAJ;do6o-rYAAAAJ;https://scholar.google.co.uk/citations?user=3YrWf7EAAAAJ;", "orcid": "0009-0009-1955-0778;0000-0003-3155-2564;0000-0003-3499-5475;0000-0002-0540-5053;", "linkedin": "gabriele-dominici-677bb6161/;;;;", "or_profile": "~Gabriele_Dominici1;~Pietro_Barbiero1;~Lucie_Charlotte_Magister1;~Pietro_Lio1;~Nikola_Simidjievski1", "aff": "Universita della Svizzera Italiana;Universita della Svizzera Italiana;Apple;University of Cambridge;University of Cambridge", "aff_domain": "usi.ch;usi.ch;apple.com;cam.ac.uk;cam.ac.uk", "position": "PhD student;Postdoc;ML Research Intern;Full Professor;Principal Researcher", "bibtex": "@misc{\ndominici2024sharcs,\ntitle={{SHARCS}: {SHAR}ed Concept Space for{\\textbackslash}{\\textbackslash}Explainable Multimodal Learning},\nauthor={Gabriele Dominici and Pietro Barbiero and Lucie Charlotte Magister and Pietro Lio and Nikola Simidjievski},\nyear={2024},\nurl={https://openreview.net/forum?id=A5nLEfjhJW}\n}", 
"github": "", "project": "", "reviewers": "w4Zt;yLh6;D8iH", "site": "https://openreview.net/forum?id=A5nLEfjhJW", "pdf_size": 11778429, "rating": "3;5;6", "confidence": "4;4;3", "soundness": "2;3;2", "contribution": "2;2;3", "presentation": "3;2;3", "wc_summary": "61;51;62", "wc_strengths": "38;53;73", "wc_weaknesses": "305;136;123", "wc_questions": "3;38;28", "wc_review": "407;278;286", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 4.666666666666667, 1.247219128924647 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 58.0, 4.96655480858378 ], "wc_strengths_avg": [ 54.666666666666664, 14.337208778404378 ], "wc_weaknesses_avg": [ 188.0, 82.90154803540563 ], "wc_questions_avg": [ 23.0, 14.719601443879744 ], "wc_review_avg": [ 323.6666666666667, 59.01600536201081 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.7559289460184545, "gs_citation": 6, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=15506685760797823300&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "aff_unique_index": "0;0;1;2;2", "aff_unique_norm": "Universita della Svizzera Italiana;Apple;University of Cambridge", "aff_unique_dep": ";Apple Inc.;", "aff_unique_url": "https://www.usi.ch;https://www.apple.com;https://www.cam.ac.uk", "aff_unique_abbr": "USI;Apple;Cambridge", "aff_campus_unique_index": "1;1", "aff_campus_unique": ";Cambridge", "aff_country_unique_index": "0;0;1;2;2", "aff_country_unique": "Switzerland;United States;United Kingdom" }, { "id": "A6juYCULJO", "title": "Abstractive Summarization through the PRISM of Decoding Strategies", "track": "main", "status": "Reject", "tldr": "", "abstract": "In the realm of natural language generation, abstractive summarization (AS) is at the center of an unparalleled evolution driven by transformer-based language models (LMs). However, the significance of decoding strategies is often neglected despite their influence on the generated summaries. Given the abundance of token selection heuristics and their accompanying hyperparameters, the community needs directions to steer well-founded decisions based on the task and the target metrics at hand. To fill this gap, we comparatively assess the effectiveness and efficiency of decoding-time techniques for short, long, and multi-document AS. We explore more than 2500 combinations of 3 widely used million-scale autoregressive encoder-decoder models, 6 datasets, and 9 decoding settings. Our findings shed light on the field, demonstrating that optimized decoding choices can yield substantial performance enhancements. In addition to human evaluation, we quantitatively measure effects using 10 automatic metrics, including dimensions such as semantic similarity, factuality, compression, redundancy, and carbon footprint. 
We introduce PRISM, a first-of-its-kind dataset that pairs AS gold input-output examples with LM predictions under a wide array of decoding options.", "keywords": "Decoding Strategies;Abstractive Summarization;Short Document Summarization;Long Document Summarization;Multi-Document Summarization;Natural Language Generation;Autoregressive Language Models;Datasets and Benchmarks", "primary_area": "datasets and benchmarks", "supplementary_material": "", "author": "Giacomo Frisoni;Luca Ragazzi;David Cohen;Gianluca Moro;Antonella Carbonaro;Claudio Sartori", "authorids": "~Giacomo_Frisoni1;~Luca_Ragazzi1;~David_Cohen4;~Gianluca_Moro1;~Antonella_Carbonaro1;~Claudio_Sartori1", "gender": "M;M;M;M;F;M", "homepage": ";https://www.unibo.it/sitoweb/l.ragazzi;;https://www.unibo.it/sitoweb/gianluca.moro/en;https://www.unibo.it/sitoweb/antonella.carbonaro;https://www.unibo.it/sitoweb/claudio.sartori/en", "dblp": "271/1231;https://dblp.uni-trier.de/pid/320/5349;;m/GianlucaMoro;90/6831;s/ClaudioSartori.html", "google_scholar": "BEZlFiAAAAAJ;BmaBHcAAAAAJ;;QOfSGKkAAAAJ;TsJoqIUAAAAJ;yGZuBaAAAAAJ", "orcid": "0000-0002-9845-0231;0000-0003-3574-9962;;;0000-0002-3890-4852;0000-0003-4535-1026", "linkedin": "giacomo-frisoni-3b97a8129/;luca-ragazzi-38557316b/;david-cohen96;;;claudiosartori/?originalSubdomain=it", "or_profile": "~Giacomo_Frisoni1;~Luca_Ragazzi1;~David_Cohen4;~Gianluca_Moro1;~Antonella_Carbonaro1;~Claudio_Sartori1", "aff": "University of Bologna;University of Bologna;University of Bologna;DISI - University of Bologna;University of Bologna;University of Bologna", "aff_domain": "unibo.it;unibo.it;unibo.it;unibo.it;unibo.it;unibo.it", "position": "PhD student;Postdoc;MS student;Associate Professor;Associate Professor;Full Professor", "bibtex": "@misc{\nfrisoni2024abstractive,\ntitle={Abstractive Summarization through the {PRISM} of Decoding Strategies},\nauthor={Giacomo Frisoni and Luca Ragazzi and David Cohen and Gianluca Moro and Antonella Carbonaro and Claudio Sartori},\nyear={2024},\nurl={https://openreview.net/forum?id=A6juYCULJO}\n}", "github": "", "project": "", "reviewers": "BSXa;8Gmg;rLZb;Eedp", "site": "https://openreview.net/forum?id=A6juYCULJO", "pdf_size": 6564224, "rating": "5;5;6;8", "confidence": "4;4;3;3", "soundness": "3;2;2;3", "contribution": "2;3;3;3", "presentation": "3;2;3;4", "wc_summary": "31;130;94;49", "wc_strengths": "19;271;35;50", "wc_weaknesses": "75;498;26;147", "wc_questions": "1;308;35;25", "wc_review": "126;1207;190;271", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "530;1826;445;595", "reply_reviewers": "0;0;0;0", "reply_authors": "1;3;1;1", "rating_avg": [ 6.0, 1.224744871391589 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 76.0, 38.71046370169182 ], "wc_strengths_avg": [ 93.75, 102.92078264374013 ], "wc_weaknesses_avg": [ 186.5, 184.9222809723047 ], "wc_questions_avg": [ 92.25, 125.17462802021822 ], "wc_review_avg": [ 448.5, 440.92431323300826 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 849.0, 566.5734727288244 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.5, 0.8660254037844386 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.8164965809277259, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=9682898466353828177&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 0, "aff_unique_index": "0;0;0;0;0;0", "aff_unique_norm": 
"University of Bologna", "aff_unique_dep": "", "aff_unique_url": "https://www.unibo.it", "aff_unique_abbr": "Unibo", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "Italy" }, { "id": "A6kK5e3DhR", "title": "Controllable Data Generation via Iterative Data-Property Mutual Mappings", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Deep generative models have been widely used for their ability to generate realistic data samples in various areas, such as images, molecules, text, and speech. One major goal of data generation is controllability, namely to generate new data with desired properties. Despite growing interest in the area of controllable generation, significant challenges still remain, including 1) Disentangling desired properties with unrelated latent variables, 2) out-of-distribution property control, and 3) objective optimization for out-of-distribution property control. To address these challenges, in this paper, we propose a general framework to enhance VAE-based data generators with property controllability and disentanglement ensure. Our proposed objective can be optimized on both data seen and unseen in the training set. We propose a training procedure to train the objective in a semi-supervised manner by iteratively conducting mutual mappings between the data and properties. The proposed framework is implemented on four VAE-based controllable generators to evaluate its performance on property error, disentanglement performance, generation quality, and training time. The results indicate that our proposed framework enables more precise control over the properties of generated samples in a short training time, ensuring the disentanglement stated above and keeping the validity of the generated samples.", "keywords": "Controllable data generation;generative models", "primary_area": "generative models", "supplementary_material": "/attachment/ff639ecc52639976ac8a50ef6ff465d365352768.pdf", "author": "Bo Pan;Muran Qin;Shiyu Wang;Yifei Zhang;Liang Zhao", "authorids": "~Bo_Pan2;~Muran_Qin1;~Shiyu_Wang2;~Yifei_Zhang10;~Liang_Zhao6", "gender": ";M;M;M;M", "homepage": "https://pb0316.github.io/;;https://sites.google.com/view/about-shiyuwang;https://yifeizhangcs.github.io/;https://cs.emory.edu/~lzhao41/", "dblp": ";;;55/5266-6;63/5422-2", "google_scholar": ";https://scholar.google.com/citations?hl=en;https://scholar.google.com/citations?hl=en;y5FkC7cAAAAJ;qnvyqtwAAAAJ", "orcid": "0009-0005-7501-7581;;;0009-0004-6136-733X;0000-0002-2648-9989", "linkedin": "bo-pan;;shiyu-wang-647a7b91/;yifei-jimmy-zhang/;", "or_profile": "~Bo_Pan2;~Muran_Qin1;~Shiyu_Wang2;~Yifei_Zhang10;~Liang_Zhao6", "aff": "Emory University;University of California, San Diego;Emory University;Emory University;Emory University", "aff_domain": "emory.edu;ucsd.edu;emory.edu;emory.edu;emory.edu", "position": "PhD student;MS student;PhD student;PhD student;Associate Professor", "bibtex": "@misc{\npan2024controllable,\ntitle={Controllable Data Generation via Iterative Data-Property Mutual Mappings},\nauthor={Bo Pan and Muran Qin and Shiyu Wang and Yifei Zhang and Liang Zhao},\nyear={2024},\nurl={https://openreview.net/forum?id=A6kK5e3DhR}\n}", "github": "", "project": "", "reviewers": "rFTY;Umbq;YxqT;UtY6", "site": "https://openreview.net/forum?id=A6kK5e3DhR", "pdf_size": 3883, "rating": "1;3;5;5", "confidence": "4;4;4;4", "soundness": "1;1;3;3", "contribution": "1;2;2;2", "presentation": "1;3;3;2", "wc_summary": "95;131;81;120", 
"wc_strengths": "93;44;80;74", "wc_weaknesses": "167;101;263;566", "wc_questions": "53;42;73;5", "wc_review": "408;318;497;765", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 3.5, 1.6583123951777 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.0, 1.0 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 2.25, 0.82915619758885 ], "wc_summary_avg": [ 106.75, 19.778460506318485 ], "wc_strengths_avg": [ 72.75, 17.963504669189696 ], "wc_weaknesses_avg": [ 274.25, 178.01878412122693 ], "wc_questions_avg": [ 43.25, 24.722206616724165 ], "wc_review_avg": [ 497.0, 167.17206704470695 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:AB6W9j4pEXkJ:scholar.google.com/&scioq=Controllable+Data+Generation+via+Iterative+Data-Property+Mutual+Mappings&hl=en&as_sdt=0,5", "gs_version_total": 4, "aff_unique_index": "0;1;0;0;0", "aff_unique_norm": "Emory University;University of California, San Diego", "aff_unique_dep": ";", "aff_unique_url": "https://www.emory.edu;https://www.ucsd.edu", "aff_unique_abbr": "Emory;UCSD", "aff_campus_unique_index": "1", "aff_campus_unique": ";San Diego", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "United States" }, { "title": "Hyper Evidential Deep Learning to Quantify Composite Classification Uncertainty", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19273", "id": "A7t7z6g6tM", "author_site": "Changbin Li, Kangshuo Li, Yuzhe Ou, Lance Kaplan, Audun J\u00f8sang, Jin-Hee Cho, DONG HYUN JEONG, Feng Chen", "tldr": "", "abstract": "Deep neural networks (DNNs) have been shown to perform well on exclusive, multi-class classification tasks. However, when different classes have similar visual features, it becomes challenging for human annotators to differentiate them. When an image is ambiguous, such as a blurry one where an annotator can't distinguish between a husky and a wolf, it may be labeled with both classes: {husky, wolf}. This scenario necessitates the use of composite set labels. \nIn this paper, we propose a novel framework called Hyper-Evidential Neural Network (HENN) that explicitly models predictive uncertainty caused by composite set labels in training data in the context of the belief theory called Subjective Logic (SL).\nBy placing a Grouped Dirichlet distribution on the class probabilities, we treat predictions of a neural network as parameters of hyper-subjective opinions and learn the network that collects both single and composite evidence leading to these hyper-opinions by a deterministic DNN from data.\nWe introduce a new uncertainty type called vagueness originally designed for hyper-opinions in SL to quantify composite classification uncertainty for DNNs.\nOur experiments prove that HENN outperforms its state-of-the-art counterparts based on four image datasets.\nThe code and datasets are available at: https://shorturl.at/dhoqx.", "keywords": "Evidential Neural Network;hyperdomain;vagueness", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/6ef067847995e4802cedd24f94bbb3467d122878.pdf", "author": "Changbin Li;Kangshuo Li;Yuzhe Ou;Lance M. 
Kaplan;Audun J\u00f8sang;Jin-Hee Cho;DONG HYUN JEONG;Feng Chen", "authorids": "~Changbin_Li1;~Kangshuo_Li1;~Yuzhe_Ou1;~Lance_M._Kaplan1;~Audun_J\u00f8sang1;~Jin-Hee_Cho1;~DONG_HYUN_JEONG1;~Feng_Chen7", "gender": "M;M;M;M;M;F;;M", "homepage": ";https://www.linkedin.com/in/kangshuo-li-10359a218/;;;https://www.mn.uio.no/ifi/english/people/aca/josang/;https://people.cs.vt.edu/~jicho/;;https://personal.utdallas.edu/~fxc190007/", "dblp": "125/9302;;250/9325.html;47/4107;;;;21/3047-1", "google_scholar": "https://scholar.google.com/citations?view_op=list_works;;https://scholar.google.com/citations?hl=en;obew8e0AAAAJ;https://scholar.google.no/citations?user=wduTe90AAAAJ;wToVkEUAAAAJ;;KOQ-SSYAAAAJ", "orcid": ";;0000-0001-8740-4531;0000-0002-3627-4471;0000-0001-6337-2264;;0000-0001-5271-293X;", "linkedin": "changbin-li/;;;;audunjosang/;;;", "or_profile": "~Changbin_Li1;~Kangshuo_Li1;~Yuzhe_Ou1;~Lance_M._Kaplan1;~Audun_J\u00f8sang1;~Jin-Hee_Cho1;~DONG_HYUN_JEONG1;~Feng_Chen7", "aff": "University of Texas, Dallas;UT-Dallas;The University of Texas at Dallas;US DEVCOM Army Research Laboratory ;University of Oslo;Virginia Polytechnic Institute and State University;University of the District of Columbia;University of Texas, Dallas", "aff_domain": "utdallas.edu;cs.utdallas.edu;utdallas.edu;army.mil;uio.no;vt.edu;udc.edu;utdallas.edu", "position": "PhD student;PhD student;PhD student;Principal Researcher;Full Professor;Associate Professor;Full Professor;Associate Professor", "bibtex": "@inproceedings{\nli2024hyper,\ntitle={Hyper Evidential Deep Learning to Quantify Composite Classification Uncertainty},\nauthor={Changbin Li and Kangshuo Li and Yuzhe Ou and Lance M. Kaplan and Audun J{\\o}sang and Jin-Hee Cho and DONG HYUN JEONG and Feng Chen},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=A7t7z6g6tM}\n}", "github": "", "project": "", "reviewers": "3vp1;AQu8;Gzpb;RL9p", "pdf_size": 7365416, "rating": "6;6;6;6", "confidence": "3;3;4;2", "soundness": "3;3;3;2", "contribution": "3;2;3;2", "presentation": "3;3;3;2", "wc_summary": "79;218;57;61", "wc_strengths": "34;186;95;102", "wc_weaknesses": "69;704;124;206", "wc_questions": "7;52;44;71", "wc_review": "189;1160;320;440", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "336;2573;678;1969", "reply_reviewers": "0;0;0;0", "reply_authors": "1;4;2;4", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 3.0, 0.7071067811865476 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 103.75, 66.48073029081435 ], "wc_strengths_avg": [ 104.25, 54.10348879693434 ], "wc_weaknesses_avg": [ 275.75, 252.01029244854266 ], "wc_questions_avg": [ 43.5, 23.243278598338918 ], "wc_review_avg": [ 527.25, 375.9490490744723 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 1389.0, 915.5034134289178 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 2.75, 1.299038105676658 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 6, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=9018239966282149804&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=A7t7z6g6tM", "pdf": "https://openreview.net/pdf?id=A7t7z6g6tM", "email": "utdallas.edu;cs.utdallas.edu;utdallas.edu;army.mil;uio.no;vt.edu;udc.edu;utdallas.edu", "author_num": 8, "aff_unique_index": "0;0;0;1;2;3;4;0", 
"aff_unique_norm": "University of Texas at Dallas;US Army Research Laboratory;University of Oslo;Virginia Tech;University of the District of Columbia", "aff_unique_dep": ";DEVCOM;;;", "aff_unique_url": "https://www.utdallas.edu;https://www.arl.army.mil;https://www.uio.no;https://www.vt.edu;https://www.udc.edu", "aff_unique_abbr": "UT Dallas;ARL;UiO;VT;UDC", "aff_campus_unique_index": "0;0;0;0", "aff_campus_unique": "Dallas;", "aff_country_unique_index": "0;0;0;0;1;0;0;0", "aff_country_unique": "United States;Norway" }, { "id": "A81iom2Y41", "title": "Be Your Own Neighborhood: Detecting Adversarial Example by the Neighborhood Relations Built on Self-Supervised Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "Deep Neural Networks (DNNs) have achieved excellent performance in various fields. However, DNNs\u2019 vulnerability to Adversarial Examples (AE) hinders their deployments to safety-critical applications. This paper presents a novel AE detection framework, named BEYOND, for trustworthy predictions. BEYOND performs the detection by distinguishing the AE\u2019s abnormal relation with its augmented versions, i.e. neighbors, from two prospects: representation similarity and label consistency. An off-the-shelf Self-Supervised Learning (SSL) model is used to extract the representation and predict the label for its highly informative representation capacity compared to supervised learning models. For clean samples, their representations and predictions are closely consistent with their neighbors, whereas those of AEs differ greatly. Furthermore, we explain this observation and show that by leveraging this discrepancy BEYOND can effectively detect AEs. We develop a rigorous justification for the effectiveness of BEYOND. Furthermore, as a plug-and-play model, BEYOND can easily cooperate with the Adversarial Trained Classifier (ATC), achieving the state-of-the-art (SOTA) robustness accuracy. Experimental results show that BEYOND outperforms baselines by a large margin, especially under adaptive attacks. Empowered by the robust relation net built on SSL, we found that BEYOND outperforms baselines in terms of both detection ability and speed. 
Our code will be publicly available.", "keywords": "Adversarial Examples;Self-supervised Learning;Adversarial Examples Detection", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/da24b4d9fe6bee964e5657232a67c1f42368c564.zip", "author": "Zhiyuan He;Yijun YANG;Pin-Yu Chen;Qiang Xu;Tsung-Yi Ho", "authorids": "~Zhiyuan_He2;~Yijun_YANG2;~Pin-Yu_Chen1;~Qiang_Xu1;~Tsung-Yi_Ho2", "gender": ";F;M;M;M", "homepage": ";https://yangyijune.github.io/;http://www.pinyuchen.com;https://github.com/cure-lab;https://www.cse.cuhk.edu.hk/people/faculty/tsung-yi-ho/", "dblp": ";;39/8969;43/1230-1;63/4181.html", "google_scholar": ";GZDKIUMAAAAJ;jxwlCUUAAAAJ;https://scholar.google.com.tw/citations?user=eSiKPqUAAAAJ;TRDUYkAAAAAJ", "orcid": ";0000-0002-4496-3154;0000-0003-1039-8369;;0000-0001-7348-5625", "linkedin": ";%E4%B8%80%E5%90%9B-%E6%9D%A8-82aa60133/;pin-yu-chen-940062a2;;", "or_profile": "~Zhiyuan_He2;~Yijun_YANG2;~Pin-Yu_Chen1;~Qiang_Xu1;~Tsung-Yi_Ho2", "aff": ";The Chinese University of Hong Kong;International Business Machines;The Chinese University of Hong Kong;Department of Computer Science and Engineering, The Chinese University of Hong Kong", "aff_domain": ";cuhk.edu.hk;ibm.com;cuhk.edu.hk;cse.cuhk.edu.hk", "position": ";PhD student;Principal Researcher;Full Professor;Full Professor", "bibtex": "@misc{\nhe2024be,\ntitle={Be Your Own Neighborhood: Detecting Adversarial Example by the Neighborhood Relations Built on Self-Supervised Learning},\nauthor={Zhiyuan He and Yijun YANG and Pin-Yu Chen and Qiang Xu and Tsung-Yi Ho},\nyear={2024},\nurl={https://openreview.net/forum?id=A81iom2Y41}\n}", "github": "", "project": "", "reviewers": "qcuA;cka9;SDmS;J3f8", "site": "https://openreview.net/forum?id=A81iom2Y41", "pdf_size": 1357156, "rating": "5;6;6;8", "confidence": "4;3;3;4", "soundness": "3;3;3;3", "contribution": "2;2;3;3", "presentation": "3;2;2;3", "wc_summary": "78;22;228;137", "wc_strengths": "117;28;30;171", "wc_weaknesses": "92;166;42;366", "wc_questions": "16;28;72;44", "wc_review": "303;244;372;718", "wc_reply_reviewers": "546;28;0;130", "wc_reply_authors": "1251;505;153;600", "reply_reviewers": "2;1;0;2", "reply_authors": "3;2;1;4", "rating_avg": [ 6.25, 1.0897247358851685 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 116.25, 76.26393315322781 ], "wc_strengths_avg": [ 86.5, 60.59084089200281 ], "wc_weaknesses_avg": [ 166.5, 123.33997729852231 ], "wc_questions_avg": [ 40.0, 20.97617696340303 ], "wc_review_avg": [ 409.25, 183.92304776726598 ], "wc_reply_reviewers_avg": [ 176.0, 219.02967835432713 ], "wc_reply_authors_avg": [ 627.25, 396.7570887835528 ], "reply_reviewers_avg": [ 1.25, 0.82915619758885 ], "reply_authors_avg": [ 2.5, 1.118033988749895 ], "replies_avg": [ 22, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.2294157338705618, "gs_citation": 7, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14773029716196574449&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 10, "aff_unique_index": "0;1;0;0", "aff_unique_norm": "Chinese University of Hong Kong;International Business Machines Corporation", "aff_unique_dep": ";", "aff_unique_url": "https://www.cuhk.edu.hk;https://www.ibm.com", "aff_unique_abbr": "CUHK;IBM", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Hong Kong SAR;", "aff_country_unique_index": "0;1;0;0", "aff_country_unique": "China;United States" }, { "id": "A8Sqe4RZqF", 
"title": "RoBERT: Low-Cost Bi-Directional Sequence Model for Flexible Robot Behavior Control", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Requirement of human involvement for data collection or system design has always been a major challenge for building robot control policy. In this paper, we present $\\textbf{Ro}$bot-$\\textbf{BERT}$ (RoBERT), a method to build\n general robot control policy for complex behaviors with $\\textit{least}$ human effort. Starting from unsupervisedly-collected dataset, RoBERT has no requirements of human labels, high-quality\n behavior dataset or accurate information of system model, in contrast to most\n other methods for building general robot agent. RoBERT is further pre-trained via $\\textit{Masked Action-Inverse-Inference}$ (MAII), a method inspired by\n $\\textit{Masked Language Modeling}$ (MLM) in BERT-like language models and has potential to enable $\\textit{zero-shot}$, $\\textit{multi-task}$, $\\textit{keyframe-based}$ robot control with little\n architectural change and user-friendly interface. In our empirical study, RoBERT\n is successfully applied on various types of robots in simulated environment and could generate stable and flexible behaviors to fulfill complex commands.", "keywords": "Imitation Learning;Sequence Model;Transformer;Robotics", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/9ccc8ef515966dbe2fbe240ee2517223a0eb29f5.zip", "author": "Diyuan Shi;Shangke Lyu;Donglin Wang", "authorids": "~Diyuan_Shi1;~Shangke_Lyu1;~Donglin_Wang1", "gender": ";M;M", "homepage": ";;https://milab.westlake.edu.cn/", "dblp": ";;", "google_scholar": ";;https://scholar.google.ca/citations?user=-fo6wdwAAAAJ", "orcid": ";0000-0002-8302-6630;0000-0002-8188-3735", "linkedin": ";;", "or_profile": "~Diyuan_Shi1;~Shangke_Lyu1;~Donglin_Wang1", "aff": ";Westlake University;Westlake University", "aff_domain": ";westlake.edu;westlake.edu.cn", "position": ";Researcher;Associate Professor", "bibtex": "@misc{\nshi2024robert,\ntitle={Ro{BERT}: Low-Cost Bi-Directional Sequence Model for Flexible Robot Behavior Control},\nauthor={Diyuan Shi and Shangke Lyu and Donglin Wang},\nyear={2024},\nurl={https://openreview.net/forum?id=A8Sqe4RZqF}\n}", "github": "", "project": "", "reviewers": "piq4;xJAs;oyMc", "site": "https://openreview.net/forum?id=A8Sqe4RZqF", "pdf_size": 14323779, "rating": "3;3;3", "confidence": "4;4;4", "soundness": "2;2;2", "contribution": "2;1;2", "presentation": "1;2;1", "wc_summary": "86;61;65", "wc_strengths": "21;28;47", "wc_weaknesses": "215;96;269", "wc_questions": "98;46;302", "wc_review": "420;231;683", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 3.0, 0.0 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 1.6666666666666667, 0.4714045207910317 ], "presentation_avg": [ 1.3333333333333333, 0.4714045207910317 ], "wc_summary_avg": [ 70.66666666666667, 10.96458946893235 ], "wc_strengths_avg": [ 32.0, 10.98483803552272 ], "wc_weaknesses_avg": [ 193.33333333333334, 72.26955713776644 ], "wc_questions_avg": [ 148.66666666666666, 110.48177325795518 ], "wc_review_avg": [ 444.6666666666667, 185.35071860904367 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 3, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": 
"https://scholar.google.com/scholar?q=related:8A3muF_3-14J:scholar.google.com/&scioq=RoBERT:+Low-Cost+Bi-Directional+Sequence+Model+for+Flexible+Robot+Behavior+Control&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "Westlake University", "aff_unique_dep": "", "aff_unique_url": "https://www.westlake.edu.cn", "aff_unique_abbr": "WU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "China" }, { "id": "A8et2yjbly", "title": "Cross-Modality Masked Pre-training for Visible-Infrared Person Re-identification", "track": "main", "status": "Reject", "tldr": "", "abstract": "Visible-Infrared person re-identification is a challenging yet important task in the field of intelligent surveillance. Most existing approaches focus on designing powerful deep networks to learn modality-shared representations, while little attention has been paid to using pre-training methods, although they can improve the performance of cross-modality tasks stably. This paper proposes a cross-modality masked pre-training (CMMP) method for visible-infrared person re-identification. Specifically, we generate color-irrelevant images using random channel exchangeable augmentation to minimize the difference between modalities at first. In the pre-training process, the visible together with the generated image, and the infrared image are masked by sharing the same random mask. Considering the misalignment of visible and infrared images in the datasets, we then reconstruct the masked areas only of the visible and the generated images using a lightweight decoder, which makes the pre-training process more efficient. Extensive experiments on two visible-infrared person re-identification datasets verify the effectiveness of the proposed method. 
CMMP outperforms the baseline method by +1.87\\% and +1.24\\% mAP on SYSU-MM01 and RegDB, respectively.", "keywords": "Person Re-identification;Cross-modality;Pre-training;Self-supervised Learning", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Haoyan Ma;Xiang Li;Xia Yuan;Jie Li;Chunxia Zhao", "authorids": "~Haoyan_Ma1;~Xiang_Li20;~Xia_Yuan1;~Jie_Li8;~Chunxia_Zhao1", "gender": "M;M;M;;", "homepage": ";http://implus.github.io/;;;", "dblp": ";40/1491-41;69/2223;;78/5979", "google_scholar": "mcx4JCsAAAAJ;oamjJdYAAAAJ;;;", "orcid": ";;0000-0002-7271-0058;;", "linkedin": ";;;;", "or_profile": "~Haoyan_Ma1;~Xiang_Li20;~Xia_Yuan1;~Jie_Li8;~Chunxia_Zhao1", "aff": ";Nankai University;Nanjing University of Science and Technology;;Nanjing University of Science and Technology", "aff_domain": ";nankai.edu.cn;njust.edu.cn;;njust.edu.cn", "position": ";Associate Professor;Associate Professor;;Full Professor", "bibtex": "@misc{\nma2024crossmodality,\ntitle={Cross-Modality Masked Pre-training for Visible-Infrared Person Re-identification},\nauthor={Haoyan Ma and Xiang Li and Xia Yuan and Jie Li and Chunxia Zhao},\nyear={2024},\nurl={https://openreview.net/forum?id=A8et2yjbly}\n}", "github": "", "project": "", "reviewers": "JDzU;HM7x;t1sC", "site": "https://openreview.net/forum?id=A8et2yjbly", "pdf_size": 570733, "rating": "1;3;5", "confidence": "4;5;5", "soundness": "1;2;2", "contribution": "1;1;3", "presentation": "1;3;2", "wc_summary": "20;48;52", "wc_strengths": "1;20;35", "wc_weaknesses": "1;301;17", "wc_questions": "1;237;93", "wc_review": "23;606;197", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 3.0, 1.632993161855452 ], "confidence_avg": [ 4.666666666666667, 0.4714045207910317 ], "soundness_avg": [ 1.6666666666666667, 0.4714045207910317 ], "contribution_avg": [ 1.6666666666666667, 0.9428090415820634 ], "presentation_avg": [ 2.0, 0.816496580927726 ], "wc_summary_avg": [ 40.0, 14.236104336041748 ], "wc_strengths_avg": [ 18.666666666666668, 13.912424503139471 ], "wc_weaknesses_avg": [ 106.33333333333333, 137.80501522884506 ], "wc_questions_avg": [ 110.33333333333333, 97.12306054119634 ], "wc_review_avg": [ 275.3333333333333, 244.36902877046882 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.8660254037844385, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:kTMjHNgnHi0J:scholar.google.com/&scioq=Cross-Modality+Masked+Pre-training+for+Visible-Infrared+Person+Re-identification&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1;1", "aff_unique_norm": "Nankai University;Nanjing University of Science and Technology", "aff_unique_dep": ";", "aff_unique_url": "http://www.nankai.edu.cn;http://www.nust.edu.cn/", "aff_unique_abbr": "NKU;NUST", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "China" }, { "id": "A8xmyDIZhn", "title": "FedDRO: Federated Compositional Optimization for Distributionally Robust Learning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Recently, compositional optimization (CO) has gained popularity because of its applications in distributionally robust optimization (DRO) and many other machine learning 
problems. Large-scale and distributed availability of data demands the development of efficient federated learning (FL) algorithms for solving CO problems. Developing FL algorithms for CO is particularly challenging because of the compositional nature of the objective. Moreover, current state-of-the-art methods to solve such problems rely on large batch gradients (depending on the solution accuracy) not feasible for most practical settings. To address these challenges, in this work, we propose efficient FedAvg-type algorithms for solving non-convex CO in the FL setting. We first establish that vanilla FedAvg is not suitable to solve distributed CO problems because of the data heterogeneity in the compositional objective at each client which leads to the amplification of bias in the local compositional gradient estimates. To this end, we propose a novel Distributed-DRO (D-DRO)~framework that utilizes the DRO problem structure to design a communication strategy that allows FedAvg to control the bias in the estimation of the compositional gradient. A key novelty of our work is to develop solution accuracy-independent algorithms that do not require large batch gradients (and function evaluations) for solving federated CO problems. We establish $\\mathcal{O}(\\epsilon^{-2})$ and \n sample and $\\mathcal{O}(\\epsilon^{-3/2})$ communication complexity in the FL setting while achieving linear speedup with the number of clients. We corroborate our theoretical findings with empirical studies on large-scale DRO problems with multiple real datasets.", "keywords": "Compositional Optimization;Federated Learning;Distributionally robust Learning", "primary_area": "optimization", "supplementary_material": "/attachment/41c2707ac0a77343414ce38b49a363ef560d0584.pdf", "author": "Prashant Khanduri;Chengyin Li;RAFI IBN SULTAN;Yao Qiang;Joerg Kliewer;Dongxiao Zhu", "authorids": "~Prashant_Khanduri1;~Chengyin_Li1;~RAFI_IBN_SULTAN1;~Yao_Qiang1;~Joerg_Kliewer1;~Dongxiao_Zhu1", "gender": "M;M;M;M;;M", "homepage": "https://sites.google.com/view/khanduri-prashant/home?authuser=0;https://chengyinlee.github.io/;https://rafiibnsultan.github.io/;https://qiangyao1988.github.io/;https://web.njit.edu/~jkliewer/wp/;https://dongxiaozhu.github.io", "dblp": "158/4888;262/6036;245/7089;261/3623;39/4721;15/6233", "google_scholar": ";GeL7DtsAAAAJ;https://scholar.google.com/citations?hl=en;8ADcg38AAAAJ;;https://scholar.google.com/citations?hl=en", "orcid": ";0000-0003-2450-9760;0009-0002-5814-0404;0000-0003-2995-3385;;", "linkedin": "prashant-khanduri-0497894b/;chengyin-li-a4262862/;rafi-ibn-sultan;yaoqiang/;;dongxiao-zhu-5796754/", "or_profile": "~Prashant_Khanduri1;~Chengyin_Li1;~RAFI_IBN_SULTAN1;~Yao_Qiang1;~Joerg_Kliewer1;~Dongxiao_Zhu1", "aff": "Wayne State University;Wayne State University;Wayne State University;Wayne State University;New Jersey Institute of Technology;Wayne State University", "aff_domain": "wayne.edu;wayne.edu;wayne.edu;wayne.edu;njit.edu;wayne.edu", "position": "Assistant Professor;PhD student;PhD student;PhD student;Full Professor;Full Professor", "bibtex": "@misc{\nkhanduri2024feddro,\ntitle={Fed{DRO}: Federated Compositional Optimization for Distributionally Robust Learning},\nauthor={Prashant Khanduri and Chengyin Li and RAFI IBN SULTAN and Yao Qiang and Joerg Kliewer and Dongxiao Zhu},\nyear={2024},\nurl={https://openreview.net/forum?id=A8xmyDIZhn}\n}", "github": "", "project": "", "reviewers": "StaW;J3Ha;EdtR;Sjhd", "site": "https://openreview.net/forum?id=A8xmyDIZhn", "pdf_size": 2042583, "rating": 
"3;5;5;6", "confidence": "5;4;4;3", "soundness": "2;3;2;3", "contribution": "2;2;2;2", "presentation": "1;3;3;3", "wc_summary": "62;41;41;46", "wc_strengths": "11;36;49;41", "wc_weaknesses": "28;143;3;22", "wc_questions": "228;5;353;1", "wc_review": "329;225;446;110", "wc_reply_reviewers": "28;0;399;14", "wc_reply_authors": "1789;528;2380;90", "reply_reviewers": "1;0;1;1", "reply_authors": "3;1;3;1", "rating_avg": [ 4.75, 1.0897247358851685 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.5, 0.8660254037844386 ], "wc_summary_avg": [ 47.5, 8.616843969807043 ], "wc_strengths_avg": [ 34.25, 14.201672436723781 ], "wc_weaknesses_avg": [ 49.0, 55.04997729336498 ], "wc_questions_avg": [ 146.75, 150.3967669200372 ], "wc_review_avg": [ 277.5, 124.35533764177555 ], "wc_reply_reviewers_avg": [ 110.25, 167.00355535137567 ], "wc_reply_authors_avg": [ 1196.75, 925.0625316701569 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 2.0, 1.0 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.9733285267845754, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:N6j1u_SC_o4J:scholar.google.com/&scioq=FedDRO:+Federated+Compositional+Optimization+for+Distributionally+Robust+Learning&hl=en&as_sdt=0,33", "gs_version_total": 4, "aff_unique_index": "0;0;0;0;1;0", "aff_unique_norm": "Wayne State University;New Jersey Institute of Technology", "aff_unique_dep": ";", "aff_unique_url": "https://wayne.edu;https://www.njit.edu", "aff_unique_abbr": "WSU;NJIT", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "AAxIs3D2ZZ", "title": "RLAIF: Scaling Reinforcement Learning from Human Feedback with AI Feedback", "track": "main", "status": "Reject", "tldr": "", "abstract": "Reinforcement learning from human feedback (RLHF) is an effective technique for aligning large language models (LLMs) to human preferences, but gathering high-quality human preference labels is a critical bottleneck. RL from AI Feedback (RLAIF) is an alternative solution that generates preferences labels using an off-the-shelf LLM in lieu of human annotators. We compare RLAIF and RLHF, and we find that RLAIF achieves improvements on par with RLHF, with both RL policies outperforming the baseline supervised fine-tuning policy by approximately 70\\% for summarization and 60\\% for helpful dialogue generation, as rated by human evaluators. Furthermore, when asked to rate RLAIF against RLHF in a head-to-head comparison, both are equally preferred. 
These results suggest that RLAIF can achieve human-level performance, offering a potential solution to the scalability limitations of RLHF.", "keywords": "reinforcement learning;rlhf;rlaif;nlp;large language models;llm;nlp;machine learning", "primary_area": "generative models", "supplementary_material": "", "author": "Harrison Lee;Samrat Phatale;Hassan Mansoor;Kellie Ren Lu;Thomas Mesnard;Johan Ferret;Colton Bishop;Ethan Hall;Victor Carbune;Abhinav Rastogi", "authorids": "~Harrison_Lee1;~Samrat_Phatale1;~Hassan_Mansoor1;~Kellie_Ren_Lu1;~Thomas_Mesnard2;~Johan_Ferret1;~Colton_Bishop1;~Ethan_Hall1;~Victor_Carbune1;~Abhinav_Rastogi2", "gender": "M;M;M;;;M;M;M;M;M", "homepage": ";;https://www.linkedin.com/in/hassan-mansoor-6938364/;;https://thomasmesnard.github.io/;https://ferretj.github.io;https://bishopcolton.com;;https://ai.google/research/people/104909;", "dblp": "249/6387-1;192/7541.html;;;;;;;199/7020;", "google_scholar": ";gTK5jNYAAAAJ;;qZ3I8gQAAAAJ;;uyUnqjMAAAAJ;;;https://scholar.google.ch/citations?user=35djUQYAAAAJ;uDrgdtwAAAAJ", "orcid": ";;;;;;;;;", "linkedin": "harrisonl;;;;;;;ethan-hall-397391b0/;vcarbune/;abhinav-rastogi-0a466934/", "or_profile": "~Harrison_Lee1;~Samrat_Phatale1;~Hassan_Mansoor1;~Kellie_Ren_Lu1;~Thomas_Mesnard2;~Johan_Ferret1;~Colton_Bishop1;~Ethan_Hall1;~Victor_Carbune1;~Abhinav_Rastogi2", "aff": "Google;Google DeepMind;Google;;Google DeepMind;Google;;Google;Google;Google", "aff_domain": "google.com;deepmind.com;google.com;;google.com;google.com;;google.com;google.com;google.com", "position": "Researcher;Researcher;Researcher;;PhD student;Researcher;;Software Engineer;Researcher;Research Scientist", "bibtex": "@misc{\nlee2024rlaif,\ntitle={{RLAIF}: Scaling Reinforcement Learning from Human Feedback with {AI} Feedback},\nauthor={Harrison Lee and Samrat Phatale and Hassan Mansoor and Kellie Ren Lu and Thomas Mesnard and Johan Ferret and Colton Bishop and Ethan Hall and Victor Carbune and Abhinav Rastogi},\nyear={2024},\nurl={https://openreview.net/forum?id=AAxIs3D2ZZ}\n}", "github": "", "project": "", "reviewers": "RhkW;BDUS;4rk2;LzbJ", "site": "https://openreview.net/forum?id=AAxIs3D2ZZ", "pdf_size": 759682, "rating": "3;6;6;8", "confidence": "4;4;4;4", "soundness": "2;3;2;4", "contribution": "2;4;3;4", "presentation": "3;3;3;4", "wc_summary": "90;236;62;27", "wc_strengths": "83;133;40;41", "wc_weaknesses": "318;280;300;49", "wc_questions": "1;97;224;17", "wc_review": "492;746;626;134", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "1064;1010;1052;490", "reply_reviewers": "0;0;0;0", "reply_authors": "2;2;2;2", "rating_avg": [ 5.75, 1.7853571071357126 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.75, 0.82915619758885 ], "contribution_avg": [ 3.25, 0.82915619758885 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 103.75, 79.54990571961729 ], "wc_strengths_avg": [ 74.25, 38.10101704679286 ], "wc_weaknesses_avg": [ 236.75, 109.22768650850388 ], "wc_questions_avg": [ 84.75, 88.23937613106747 ], "wc_review_avg": [ 499.5, 229.35289403013863 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 904.0, 239.86246058939693 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 2.0, 0.0 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 10, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 540, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=7995210232742152683&as_sdt=40005&sciodt=0,10&hl=en", "gs_version_total": 4, "aff_unique_index": "0;0;0;0;0;0;0;0", "aff_unique_norm": "Google", "aff_unique_dep": 
"Google", "aff_unique_url": "https://www.google.com", "aff_unique_abbr": "Google", "aff_campus_unique_index": "0;0;0;0;0;0", "aff_campus_unique": "Mountain View;", "aff_country_unique_index": "0;1;0;1;0;0;0;0", "aff_country_unique": "United States;United Kingdom" }, { "id": "ABIcBDLBVG", "title": "Fill in the Blank: Exploring and Enhancing LLM Capabilities for Backward Reasoning in Math Word Problems", "track": "main", "status": "Reject", "tldr": "", "abstract": "While forward reasoning (i.e., find the answer given the question) has been explored extensively in the recent literature, backward reasoning is relatively unexplored. We examine the backward reasoning capabilities of LLMs on Math Word Problems (MWPs): given a mathematical question and its answer, with some details omitted from the question, can LLMs effectively retrieve the missing information? \n\nIn this paper, we formally define the backward reasoning task on math word problems and modify three datasets to evaluate this task: GSM8k, SVAMP and MultiArith. Our findings show a significant drop in the accuracy of models on backward reasoning compared to forward reasoning across four SOTA LLMs (GPT4, GPT3.5, PaLM-2, and LLaMa). Utilizing the specific format of this task, we propose three novel techniques that improve performance: Rephrase reformulates the given problem into a forward reasoning problem, PAL-Tools combines the idea of Program-Aided LLMs to produce a set of equations that can be solved by an external solver, and Check your Work exploits the availability of natural verifier of high accuracy in the forward direction, interleaving solving and verification steps. Finally, realizing that each of our base methods correctly solves a different set of problems, we propose a novel Bayesian formulation for creating an ensemble over these base methods aided by a verifier to further boost the accuracy by a significant margin. 
Extensive experimentation demonstrates that our techniques successively improve the performance of LLMs on the backward reasoning task, with the final ensemble-based method resulting in a substantial performance gain compared to the raw LLMs with standard prompting techniques such as chain-of-thought.", "keywords": "large language models;prompting;mathematical reasoning;natural language processing", "primary_area": "generative models", "supplementary_material": "", "author": "Aniruddha Deb;Neeva Hareshbhai Oza;Sarthak Singla;Dinesh Khandelwal;Dinesh Garg;Parag Singla", "authorids": "~Aniruddha_Deb1;~Neeva_Hareshbhai_Oza1;~Sarthak_Singla1;~Dinesh_Khandelwal2;~Dinesh_Garg1;~Parag_Singla1", "gender": "Not Specified;;M;M;M;M", "homepage": "https://www.aniruddhadeb.com;;;https://research.ibm.com/people/dinesh-khandelwal;https://researcher.watson.ibm.com/researcher/view.php?person=in-garg.dinesh;http://www.cse.iitd.ac.in/~parags", "dblp": ";358/6181;;177/0164;https://dblp.uni-trier.de/pers/g/Garg:Dinesh.html;14/167", "google_scholar": ";;;Pi-SqXwAAAAJ;https://scholar.google.com.tw/citations?user=YrU_ZDkAAAAJ;https://scholar.google.co.in/citations?user=V49BsgMAAAAJ", "orcid": ";;;;;", "linkedin": ";learner4ever/;sarthak-singla/;dinesh-khandelwal-68689420/;dingarg/;", "or_profile": "~Aniruddha_Deb1;~Neeva_Hareshbhai_Oza1;~Sarthak_Singla1;~Dinesh_Khandelwal2;~Dinesh_Garg1;~Parag_Singla1", "aff": "Indian Institute of Technology, Delhi;Indian Institute of Technology, Delhi;;International Business Machines;;Indian Institute of Technology, Delhi", "aff_domain": "iitd.ac.in;iitd.ac.in;;ibm.com;;iitd.ac.in", "position": "Undergrad student;MS student;;Researcher;;Full Professor", "bibtex": "@misc{\ndeb2024fill,\ntitle={Fill in the Blank: Exploring and Enhancing {LLM} Capabilities for Backward Reasoning in Math Word Problems},\nauthor={Aniruddha Deb and Neeva Hareshbhai Oza and Sarthak Singla and Dinesh Khandelwal and Dinesh Garg and Parag Singla},\nyear={2024},\nurl={https://openreview.net/forum?id=ABIcBDLBVG}\n}", "github": "", "project": "", "reviewers": "AYQE;9odL;4wdv;xzVN", "site": "https://openreview.net/forum?id=ABIcBDLBVG", "pdf_size": 421256, "rating": "3;5;6;8", "confidence": "5;3;4;3", "soundness": "2;2;2;3", "contribution": "2;2;2;3", "presentation": "2;3;2;3", "wc_summary": "125;79;63;41", "wc_strengths": "66;41;39;30", "wc_weaknesses": "519;210;116;49", "wc_questions": "187;13;47;49", "wc_review": "897;343;265;169", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "1136;740;606;306", "reply_reviewers": "0;0;0;0", "reply_authors": "2;1;1;1", "rating_avg": [ 5.5, 1.8027756377319946 ], "confidence_avg": [ 3.75, 0.82915619758885 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 77.0, 30.822070014844883 ], "wc_strengths_avg": [ 44.0, 13.360389215887388 ], "wc_weaknesses_avg": [ 223.5, 179.93679445849867 ], "wc_questions_avg": [ 74.0, 66.79071791798619 ], "wc_review_avg": [ 418.5, 283.0525569571842 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 697.0, 298.21636440678435 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.7526178090063818, "gs_citation": 9, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=15364179068116096669&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "aff_unique_index": "0;0;1;0", "aff_unique_norm": "Indian Institute 
of Technology Delhi;International Business Machines Corporation", "aff_unique_dep": ";", "aff_unique_url": "https://www.iitdelhi.ac.in;https://www.ibm.com", "aff_unique_abbr": "IIT Delhi;IBM", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Delhi;", "aff_country_unique_index": "0;0;1;0", "aff_country_unique": "India;United States" }, { "title": "Manipulating dropout reveals an optimal balance of efficiency and robustness in biological and machine visual systems", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19272", "id": "ADDCErFzev", "author_site": "Jacob Prince, Gabriel Fajardo, George Alvarez, Talia Konkle", "tldr": "", "abstract": "According to the efficient coding hypothesis, neural populations encode information optimally when representations are high-dimensional and uncorrelated. However, such codes may carry a cost in terms of generalization and robustness. Past empirical studies of early visual cortex (V1) in rodents have suggested that this tradeoff indeed constrains sensory representations. However, it remains unclear whether these insights generalize across the hierarchy of the human visual system, and particularly to object representations in high-level occipitotemporal cortex (OTC). To gain new empirical clarity, here we develop a family of object recognition models with parametrically varying dropout proportion $p$, which induces systematically varying dimensionality of internal responses (while controlling all other inductive biases). We find that increasing dropout produces an increasingly smooth, low-dimensional representational space. Optimal robustness to lesioning is observed at around 70% dropout, after which both accuracy and robustness decline. Representational comparison to large-scale 7T fMRI data from occipitotemporal cortex in the Natural Scenes Dataset reveals that this optimal degree of dropout is also associated with maximal emergent neural predictivity. Finally, using new techniques for achieving denoised estimates of the eigenspectrum of human fMRI responses, we compare the rate of eigenspectrum decay between model and brain feature spaces. We observe that the match between model and brain representations is associated with a common balance between efficiency and robustness in the representational space. These results suggest that varying dropout may reveal an optimal point of balance between the efficiency of high-dimensional codes and the robustness of low dimensional codes in hierarchical vision systems.", "keywords": "Efficient coding;object representation;dropout;robustness;human fMRI;occipitotemporal cortex;cognitive neuroscience;distributed coding", "primary_area": "applications to neuroscience & cognitive science", "supplementary_material": "", "author": "Jacob S. Prince;Gabriel Fajardo;George A. 
Alvarez;Talia Konkle", "authorids": "~Jacob_S._Prince1;fajardgb@bc.edu;~George_A._Alvarez2;~Talia_Konkle1", "gender": "M;;M;F", "homepage": "https://jacob-prince.github.io/;;https://visionlab.harvard.edu/george/;https://konklab.fas.harvard.edu/", "dblp": ";;;", "google_scholar": "pd6wUgIAAAAJ;;qU8dld4AAAAJ;QxV9vroAAAAJ", "orcid": "0000-0001-6169-9503;;;0000-0003-1738-4744", "linkedin": "jacobprince/;;;", "or_profile": "~Jacob_S._Prince1;fajardgb@bc.edu;~George_A._Alvarez2;~Talia_Konkle1", "aff": "Harvard University;;Harvard University;Harvard University", "aff_domain": "harvard.edu;;harvard.edu;harvard.edu", "position": "PhD student;;Full Professor;Full Professor", "bibtex": "@inproceedings{\nprince2024manipulating,\ntitle={Manipulating dropout reveals an optimal balance of efficiency and robustness in biological and machine visual systems},\nauthor={Jacob S. Prince and Gabriel Fajardo and George A. Alvarez and Talia Konkle},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=ADDCErFzev}\n}", "github": "", "project": "", "reviewers": "YU1u;h1kR;yavH;wjr3", "pdf_size": 6385398, "rating": "6;6;6;6", "confidence": "4;4;3;3", "soundness": "3;3;4;3", "contribution": "3;3;3;3", "presentation": "4;4;3;3", "wc_summary": "110;107;111;170", "wc_strengths": "39;117;70;83", "wc_weaknesses": "4;28;185;172", "wc_questions": "170;29;102;108", "wc_review": "323;281;468;533", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "673;182;546;496", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 3.5, 0.5 ], "wc_summary_avg": [ 124.5, 26.31064423384574 ], "wc_strengths_avg": [ 77.25, 27.9676152004421 ], "wc_weaknesses_avg": [ 97.25, 81.8210700247803 ], "wc_questions_avg": [ 102.25, 49.97186708539115 ], "wc_review_avg": [ 401.25, 102.95235548543802 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 474.25, 180.64658175564796 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=8966726572268208078&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=ADDCErFzev", "pdf": "https://openreview.net/pdf?id=ADDCErFzev", "email": "harvard.edu;;harvard.edu;harvard.edu", "author_num": 4, "aff_unique_index": "0;0;0", "aff_unique_norm": "Harvard University", "aff_unique_dep": "", "aff_unique_url": "https://www.harvard.edu", "aff_unique_abbr": "Harvard", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "title": "LoTa-Bench: Benchmarking Language-oriented Task Planners for Embodied Agents", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19271", "id": "ADSxCpCu9s", "author_site": "Jae-Woo Choi, Youngwoo Yoon, Hyobin Ong, Jaehong Kim, Minsu Jang", "tldr": "", "abstract": "Large language models (LLMs) have recently received considerable attention as alternative solutions for task planning. 
However, comparing the performance of language-oriented task planners becomes difficult, and there exists a dearth of detailed exploration regarding the effects of various factors such as pre-trained model selection and prompt construction. To address this, we propose a benchmark system for automatically quantifying performance of task planning for home-service embodied agents. Task planners are tested on two pairs of datasets and simulators: 1) ALFRED and AI2-THOR, 2) an extension of Watch-And-Help and VirtualHome. Using the proposed benchmark system, we perform extensive experiments with LLMs and prompts, and explore several enhancements of the baseline planner. We expect that the proposed benchmark tool would accelerate the development of language-oriented task planners.", "keywords": "task planning;language models;benchmarking;embodied agents;home robots", "primary_area": "datasets and benchmarks", "supplementary_material": "", "author": "Jae-Woo Choi;Youngwoo Yoon;Hyobin Ong;Jaehong Kim;Minsu Jang", "authorids": "~Jae-Woo_Choi1;~Youngwoo_Yoon1;~Hyobin_Ong1;~Jaehong_Kim3;~Minsu_Jang1", "gender": "M;M;F;M;M", "homepage": ";https://sites.google.com/view/youngwoo-yoon/;https://ohnghb99.github.io/hyobin.github.io/;;https://zebehn.github.io", "dblp": ";82/5691;;75/3644-1;64/4831", "google_scholar": "vE3PElsAAAAJ;XPL1OiAAAAAJ;_7yFVacAAAAJ;https://scholar.google.si/citations?user=PfnxK1kAAAAJ;ggkuHCcAAAAJ", "orcid": ";;0009-0000-8479-0510;0000-0002-6840-5026;0000-0002-7166-0300", "linkedin": ";;;;minsu-jang-066b1bb/", "or_profile": "~Jae-Woo_Choi1;~Youngwoo_Yoon1;~Hyobin_Ong1;~Jaehong_Kim3;~Minsu_Jang1", "aff": "Electronics and Telecommunications Research Institute;Electronics and Telecommunications Research Institute;University of Science and Technology;ETRI;Electronics and Telecommunications Research Institute", "aff_domain": "etri.re.kr;etri.re.kr;ust.ac.kr;etri.re.kr;etri.re.kr", "position": "Researcher;Principal Researcher;MS student;Principle Researcher/Director;Principal Researcher", "bibtex": "@inproceedings{\nchoi2024lotabench,\ntitle={LoTa-Bench: Benchmarking Language-oriented Task Planners for Embodied Agents},\nauthor={Jae-Woo Choi and Youngwoo Yoon and Hyobin Ong and Jaehong Kim and Minsu Jang},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=ADSxCpCu9s}\n}", "github": "", "project": "", "reviewers": "mB86;DjjY;JeGM;JjuX", "pdf_size": 12665485, "rating": "6;6;6;6", "confidence": "4;4;4;3", "soundness": "3;3;3;3", "contribution": "2;2;3;1", "presentation": "3;3;2;3", "wc_summary": "86;106;77;49", "wc_strengths": "76;79;137;45", "wc_weaknesses": "209;400;229;81", "wc_questions": "3;8;148;11", "wc_review": "374;593;591;186", "wc_reply_reviewers": "24;0;28;59", "wc_reply_authors": "845;1116;1748;889", "reply_reviewers": "1;0;1;1", "reply_authors": "2;3;4;3", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 79.5, 20.5 ], "wc_strengths_avg": [ 84.25, 33.23683950077083 ], "wc_weaknesses_avg": [ 229.75, 113.51514216173982 ], "wc_questions_avg": [ 42.5, 60.97745485013293 ], "wc_review_avg": [ 436.0, 169.57151883497417 ], "wc_reply_reviewers_avg": [ 27.75, 20.980645843252777 ], "wc_reply_authors_avg": [ 1149.5, 360.52219071785305 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 3.0, 0.7071067811865476 ], 
"replies_avg": [ 22, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 15, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5315466281824827335&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=ADSxCpCu9s", "pdf": "https://openreview.net/pdf?id=ADSxCpCu9s", "email": "etri.re.kr;etri.re.kr;ust.ac.kr;etri.re.kr;etri.re.kr", "author_num": 5, "aff_unique_index": "0;0;1;0;0", "aff_unique_norm": "Electronics and Telecommunications Research Institute;University of Science and Technology", "aff_unique_dep": ";", "aff_unique_url": "http://www.etri.re.kr;", "aff_unique_abbr": "ETRI;", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "South Korea;" }, { "id": "AEi2wyAMyb", "title": "Bi-Level Optimization for Pseudo-Labeling Based Semi-Supervised Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "Semi-supervised learning (SSL) is a fundamental task in machine learning, empowering models to extract valuable insights from datasets with limited labeled samples and a large amount of unlabeled data. \nAlthough pseudo-labeling is a widely used approach for SSL that generates pseudo-labels for unlabeled data and leverages them as ground truth labels for training, traditional pseudo-labeling techniques often suffer from the problem of error accumulation, leading to a significant decrease in the quality of pseudo-labels and hence\n\tthe overall model performance. \n\tIn this paper, we propose a novel Bi-level Optimization method for Pseudo-label Learning (BOPL) \n\tto boost semi-supervised training. \nIt treats pseudo-labels as latent variables, and optimizes the model parameters and pseudo-labels\njointly within a bi-level optimization framework. \nBy enabling direct optimization over the pseudo-labels towards maximizing the prediction model performance,\nthe method is expected to produce high-quality pseudo-labels that are much less susceptible to error accumulation. \nTo evaluate the effectiveness of the proposed approach, \nwe conduct extensive experiments on \nmultiple SSL benchmarks. 
\nThe experimental results show the proposed BOPL outperforms the state-of-the-art SSL techniques.", "keywords": "Semi-Supervised Learning;Bi-level Optimization", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Marzi Heidari;Yuhong Guo", "authorids": "~Marzi_Heidari1;~Yuhong_Guo1", "gender": "F;", "homepage": ";", "dblp": "270/0305;", "google_scholar": "https://scholar.google.ca/citations?user=OEWPekoAAAAJ;", "orcid": ";", "linkedin": ";", "or_profile": "~Marzi_Heidari1;~Yuhong_Guo1", "aff": "Carleton University;", "aff_domain": "carleton.ca;", "position": "PhD student;", "bibtex": "@misc{\nheidari2024bilevel,\ntitle={Bi-Level Optimization for Pseudo-Labeling Based Semi-Supervised Learning},\nauthor={Marzi Heidari and Yuhong Guo},\nyear={2024},\nurl={https://openreview.net/forum?id=AEi2wyAMyb}\n}", "github": "", "project": "", "reviewers": "Yzuc;hAat;akKq", "site": "https://openreview.net/forum?id=AEi2wyAMyb", "pdf_size": 579116, "rating": "5;5;6", "confidence": "4;3;3", "soundness": "2;3;3", "contribution": "2;2;3", "presentation": "3;2;3", "wc_summary": "76;113;46", "wc_strengths": "102;58;55", "wc_weaknesses": "484;152;183", "wc_questions": "7;56;26", "wc_review": "669;379;310", "wc_reply_reviewers": "29;110;137", "wc_reply_authors": "539;839;611", "reply_reviewers": "1;1;3", "reply_authors": "2;3;4", "rating_avg": [ 5.333333333333333, 0.4714045207910317 ], "confidence_avg": [ 3.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 78.33333333333333, 27.402351886086144 ], "wc_strengths_avg": [ 71.66666666666667, 21.483844059096022 ], "wc_weaknesses_avg": [ 273.0, 149.7353220408153 ], "wc_questions_avg": [ 29.666666666666668, 20.17148702720969 ], "wc_review_avg": [ 452.6666666666667, 155.5427772529331 ], "wc_reply_reviewers_avg": [ 92.0, 45.89117562233506 ], "wc_reply_authors_avg": [ 663.0, 127.87493890516625 ], "reply_reviewers_avg": [ 1.6666666666666667, 0.9428090415820634 ], "reply_authors_avg": [ 3.0, 0.816496580927726 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.4999999999999999, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:29BwJvPaTNEJ:scholar.google.com/&scioq=Bi-Level+Optimization+for+Pseudo-Labeling+Based+Semi-Supervised+Learning&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0", "aff_unique_norm": "Carleton University", "aff_unique_dep": "", "aff_unique_url": "https://carleton.ca", "aff_unique_abbr": "Carleton", "aff_country_unique_index": "0", "aff_country_unique": "Canada" }, { "title": "SpeechTokenizer: Unified Speech Tokenizer for Speech Language Models", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19270", "id": "AF9Q8Vip84", "author_site": "Xin Zhang, Dong Zhang, Shimin Li, Yaqian Zhou, Xipeng Qiu", "tldr": "", "abstract": "Current speech large language models build upon discrete speech representations,\nwhich can be categorized into semantic tokens and acoustic tokens. However,\nexisting speech tokens are not specifically designed for speech language modeling. To assess the suitability of speech tokens for building speech language\nmodels, we established the first benchmark, SLMTokBench. 
Our results indicate\nthat neither semantic nor acoustic tokens are ideal for this purpose. Therefore, we\npropose SpeechTokenizer, a unified speech tokenizer for speech large language\nmodels. SpeechTokenizer adopts the Encoder-Decoder architecture with residual\nvector quantization (RVQ). Unifying semantic and acoustic tokens, SpeechTokenizer disentangles different aspects of speech information hierarchically across\ndifferent RVQ layers. Furthermore, We construct a Unified Speech Language\nModel (USLM) leveraging SpeechTokenizer. Experiments show that SpeechTokenizer performs comparably to EnCodec in speech reconstruction and demonstrates\nstrong performance on the SLMTokBench benchmark. Also, USLM outperforms\nVALL-E in zero-shot Text-to-Speech tasks. Code and models are available at\nhttps://github.com/ZhangXInFD/SpeechTokenizer/.", "keywords": "speech;audio;multi-modal;large language model", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Xin Zhang;Dong Zhang;Shimin Li;Yaqian Zhou;Xipeng Qiu", "authorids": "~Xin_Zhang36;~Dong_Zhang9;~Shimin_Li1;~Yaqian_Zhou1;~Xipeng_Qiu1", "gender": "M;M;M;F;M", "homepage": "https://github.com/ZhangXInFD;;;;https://xpqiu.github.io/", "dblp": ";;;34/389-1.html;69/1395", "google_scholar": "https://scholar.google.com/citations?hl=en;ScVbeu0AAAAJ;0xxkGjMAAAAJ;;Pq4Yp_kAAAAJ", "orcid": ";;;;0000-0001-7163-5247", "linkedin": ";;;;", "or_profile": "~Xin_Zhang36;~Dong_Zhang9;~Shimin_Li1;~Yaqian_Zhou1;~Xipeng_Qiu1", "aff": "Fudan University;Fudan University;Fudan University;Fudan University;Fudan University", "aff_domain": "fudan.edu.cn;fudan.edu.cn;fudan.edu.cn;fudan.edu.cn;fudan.edu.cn", "position": "MS student;MS student;PhD student;Associate Professor;Full Professor", "bibtex": "@inproceedings{\nzhang2024speechtokenizer,\ntitle={SpeechTokenizer: Unified Speech Tokenizer for Speech Language Models},\nauthor={Xin Zhang and Dong Zhang and Shimin Li and Yaqian Zhou and Xipeng Qiu},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=AF9Q8Vip84}\n}", "github": "", "project": "", "reviewers": "pbGo;g1yJ;usJL;tD35", "pdf_size": 1257544, "rating": "3;6;6;8", "confidence": "4;4;3;4", "soundness": "3;2;2;3", "contribution": "2;3;2;3", "presentation": "3;3;2;3", "wc_summary": "149;72;47;69", "wc_strengths": "98;69;33;115", "wc_weaknesses": "210;257;100;61", "wc_questions": "29;31;5;44", "wc_review": "486;429;185;289", "wc_reply_reviewers": "0;107;0;0", "wc_reply_authors": "666;1474;513;234", "reply_reviewers": "0;2;0;0", "reply_authors": "1;4;1;1", "rating_avg": [ 5.75, 1.7853571071357126 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 84.25, 38.6094224251024 ], "wc_strengths_avg": [ 78.75, 31.115711465431737 ], "wc_weaknesses_avg": [ 157.0, 79.48899294870957 ], "wc_questions_avg": [ 27.25, 14.077908225301087 ], "wc_review_avg": [ 347.25, 117.95417542418751 ], "wc_reply_reviewers_avg": [ 26.75, 46.332359102467464 ], "wc_reply_authors_avg": [ 721.75, 461.1032286809538 ], "reply_reviewers_avg": [ 0.5, 0.8660254037844386 ], "reply_authors_avg": [ 1.75, 1.299038105676658 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.08084520834544431, "gs_citation": 136, "gs_cited_by_link": 
"https://scholar.google.com/scholar?cites=10604890170283513348&as_sdt=400005&sciodt=0,14&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=AF9Q8Vip84", "pdf": "https://openreview.net/pdf?id=AF9Q8Vip84", "email": "fudan.edu.cn;fudan.edu.cn;fudan.edu.cn;fudan.edu.cn;fudan.edu.cn", "author_num": 5, "aff_unique_index": "0;0;0;0;0", "aff_unique_norm": "Fudan University", "aff_unique_dep": "", "aff_unique_url": "https://www.fudan.edu.cn", "aff_unique_abbr": "Fudan", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "China" }, { "title": "MuSc: Zero-Shot Industrial Anomaly Classification and Segmentation with Mutual Scoring of the Unlabeled Images", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19269", "id": "AHgc5SMdtd", "author_site": "Xurui Li, Ziming Huang, Feng Xue, Yu Zhou", "tldr": "", "abstract": "This paper studies zero-shot anomaly classification (AC) and segmentation (AS) in industrial vision.\nWe reveal that the abundant normal and abnormal cues implicit in unlabeled test images can be exploited for anomaly determination, which is ignored by prior methods.\nOur key observation is that for the industrial product images, the normal image patches could find a relatively large number of similar patches in other unlabeled images,\nwhile the abnormal ones only have a few similar patches.\nWe leverage such a discriminative characteristic to design a novel zero-shot AC/AS method by Mutual Scoring (MuSc) of the unlabeled images, \nwhich does not need any training or prompts.\nSpecifically, we perform Local Neighborhood Aggregation with Multiple Degrees (LNAMD) to obtain the patch features that are capable of representing anomalies in varying sizes.\nThen we propose the Mutual Scoring Mechanism (MSM) to leverage the unlabeled test images to assign the anomaly score to each other. \nFurthermore, we present an optimization approach named Re-scoring with Constrained Image-level Neighborhood (RsCIN) for image-level anomaly classification to suppress the false positives caused by noises in normal images.\nThe superior performance on the challenging MVTec AD and VisA datasets demonstrates the effectiveness of our approach. 
\nCompared with the state-of-the-art zero-shot approaches, \nMuSc achieves a $\\textbf{21.1}$% PRO absolute gain (from 72.7\\% to 93.8\\%) on MVTec AD, a $\\textbf{19.4}$% pixel-AP gain and a $\\textbf{14.7}$% pixel-AUROC gain on VisA.\nIn addition, our zero-shot approach outperforms most of the few-shot approaches and is comparable to some one-class methods.\nCode is available at https://github.com/xrli-U/MuSc.", "keywords": "zero-shot anomaly detection; Industrial Informatics\uff1b", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Xurui Li;Ziming Huang;Feng Xue;Yu Zhou", "authorids": "~Xurui_Li4;~Ziming_Huang2;~Feng_Xue3;~Yu_Zhou1", "gender": "M;M;M;", "homepage": "https://github.com/xrli-U;https://github.com/ZimingHuang1;https://xuefeng-cvr.github.io/;https://github.com/zhouyu-hust", "dblp": ";;;36/2728-16.html", "google_scholar": ";;66SeiQsAAAAJ;", "orcid": "0009-0007-3590-9870;;0000-0002-4101-3401;", "linkedin": ";;;", "or_profile": "~Xurui_Li4;~Ziming_Huang2;~Feng_Xue3;~Yu_Zhou1", "aff": "Huazhong University of Science and Technology;Huazhong University of Science and Technology;University of Trento;Huazhong University of Science and Technology", "aff_domain": "hust.edu.cn;hust.edu.cn;unitn.it;hust.edu.cn", "position": "MS student;MS student;Postdoc;Associate Professor", "bibtex": "@inproceedings{\nli2024musc,\ntitle={MuSc: Zero-Shot Industrial Anomaly Classification and Segmentation with Mutual Scoring of the Unlabeled Images},\nauthor={Xurui Li and Ziming Huang and Feng Xue and Yu Zhou},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=AHgc5SMdtd}\n}", "github": "", "project": "", "reviewers": "52S5;dCfU;H5pV;idjR;NLA8", "pdf_size": 15540149, "rating": "3;5;6;6;6", "confidence": "3;4;5;3;5", "soundness": "1;3;4;3;2", "contribution": "1;2;3;3;3", "presentation": "1;3;4;3;2", "wc_summary": "170;39;26;45;70", "wc_strengths": "15;5;30;79;147", "wc_weaknesses": "165;157;144;103;67", "wc_questions": "1;92;3;3;2", "wc_review": "351;293;203;230;286", "wc_reply_reviewers": "0;0;0;0;0", "wc_reply_authors": "1083;2241;437;185;1416", "reply_reviewers": "0;0;0;0;0", "reply_authors": "2;4;1;1;3", "rating_avg": [ 5.2, 1.16619037896906 ], "confidence_avg": [ 4.0, 0.8944271909999159 ], "soundness_avg": [ 2.6, 1.019803902718557 ], "contribution_avg": [ 2.4, 0.8 ], "presentation_avg": [ 2.6, 1.019803902718557 ], "wc_summary_avg": [ 70.0, 52.003846011617256 ], "wc_strengths_avg": [ 55.2, 52.46865731081748 ], "wc_weaknesses_avg": [ 127.2, 36.90203246435079 ], "wc_questions_avg": [ 20.2, 35.907659350060676 ], "wc_review_avg": [ 272.6, 51.77103437251375 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 1072.4, 731.4384731472634 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 2.2, 1.16619037896906 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.5752237416355278, "gs_citation": 26, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=4485039909524484938&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=AHgc5SMdtd", "pdf": "https://openreview.net/pdf?id=AHgc5SMdtd", "email": "hust.edu.cn;hust.edu.cn;unitn.it;hust.edu.cn", "author_num": 4, "aff_unique_index": "0;0;1;0", "aff_unique_norm": "Huazhong University of Science and Technology;University of Trento", "aff_unique_dep": ";", "aff_unique_url": "http://www.hust.edu.cn;https://www.unitn.it", 
"aff_unique_abbr": "HUST;UniTN", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;1;0", "aff_country_unique": "China;Italy" }, { "id": "AIbQ3HDDHU", "title": "Training and inference of large language models using 8-bit floating point", "track": "main", "status": "Reject", "tldr": "", "abstract": "FP8 formats are gaining popularity to boost the computational efficiency for training and inference of large deep learning models. Their main challenge is that a careful choice of scaling is needed to prevent degradation due to the reduced dynamic range compared to higher-precision formats. Although there exists ample literature about selecting such scalings for INT formats, this critical aspect has yet to be addressed for FP8. This paper presents a methodology to select the scalings for FP8 linear layers, based on dynamically updating per-tensor scales for the weights, gradients and activations. We apply this methodology to train and validate large language models of the type of GPT and Llama 2 using FP8, for model sizes ranging from 111M to 70B. To facilitate the understanding of the FP8 dynamics, our results are accompanied by plots of the per-tensor scale distribution for weights, activations and gradients during both training and inference.", "keywords": "FP8;quantisation;low-precision training;low-precision inference;post-training quantisation;large language models;hardware", "primary_area": "infrastructure, software libraries, hardware, etc.", "supplementary_material": "", "author": "Sergio P. Perez;Yan Zhang;James Briggs;Charlie Blake;Josh Levy-Kramer;Paul Balanca;Carlo Luschi;Stephen Barlow;Andrew W Fitzgibbon", "authorids": "~Sergio_P._Perez1;~Yan_Zhang32;~James_Briggs1;~Charlie_Blake1;~Josh_Levy-Kramer1;~Paul_Balanca1;~Carlo_Luschi1;~Stephen_Barlow2;~Andrew_W_Fitzgibbon1", "gender": ";;M;M;M;M;M;M;M", "homepage": ";;https://jimypbr.github.io/;https://thecharlieblake.co.uk/;;https://github.com/balancap;;https://graphcore.ai;http://awf.fitzgibbon.ie", "dblp": ";;;243/6977;;;72/10621;;f/AndrewWFitzgibbon", "google_scholar": "izqE_ooAAAAJ;;TYNnuTYAAAAJ;kvibgXMAAAAJ;NJxqHNcAAAAJ;;;;73t3lIcAAAAJ", "orcid": ";;;;;;;;", "linkedin": "sergiopp;yan-zhang-54b79071;jimypbr/;;joshlevykramer/;;carlo-luschi-1908144/;stevebarlow;andrew-fitzgibbon-952b9370", "or_profile": "~Sergio_P._Perez1;~Yan_Zhang32;~James_Briggs1;~Charlie_Blake1;~Josh_Levy-Kramer1;~Paul_Balanca1;~Carlo_Luschi1;~Stephen_Barlow2;~Andrew_W_Fitzgibbon1", "aff": ";Graphcore;;;;Graphcore;Graphcore;Graphcore Ltd;Graphcore", "aff_domain": ";graphcore.ai;;;;graphcore.ai;graphcore.ai;graphcore.ai;graphcore.ai", "position": ";Researcher;;;;Researcher;VP & Head of Research;Member of Engineering Team;Researcher", "bibtex": "@misc{\nperez2024training,\ntitle={Training and inference of large language models using 8-bit floating point},\nauthor={Sergio P. 
Perez and Yan Zhang and James Briggs and Charlie Blake and Josh Levy-Kramer and Paul Balanca and Carlo Luschi and Stephen Barlow and Andrew W Fitzgibbon},\nyear={2024},\nurl={https://openreview.net/forum?id=AIbQ3HDDHU}\n}", "github": "", "project": "", "reviewers": "LXwv;PWj7;ViM8", "site": "https://openreview.net/forum?id=AIbQ3HDDHU", "pdf_size": 677378, "rating": "3;5;6", "confidence": "3;4;3", "soundness": "2;3;3", "contribution": "1;2;3", "presentation": "2;3;3", "wc_summary": "27;111;41", "wc_strengths": "32;27;28", "wc_weaknesses": "275;257;40", "wc_questions": "17;47;37", "wc_review": "351;442;146", "wc_reply_reviewers": "184;50;86", "wc_reply_authors": "419;343;207", "reply_reviewers": "1;1;1", "reply_authors": "1;1;1", "rating_avg": [ 4.666666666666667, 1.247219128924647 ], "confidence_avg": [ 3.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.816496580927726 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 59.666666666666664, 36.745370078721784 ], "wc_strengths_avg": [ 29.0, 2.160246899469287 ], "wc_weaknesses_avg": [ 190.66666666666666, 106.79055305701074 ], "wc_questions_avg": [ 33.666666666666664, 12.472191289246473 ], "wc_review_avg": [ 313.0, 123.79283770342558 ], "wc_reply_reviewers_avg": [ 106.66666666666667, 56.62351298022953 ], "wc_reply_authors_avg": [ 323.0, 87.69644614616186 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 9, 0 ], "corr_rating_confidence": 0.18898223650461363, "gs_citation": 14, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12127229904750398817&as_sdt=80000005&sciodt=0,23&hl=en", "gs_version_total": 5, "aff_unique_index": "0;0;0;0;0", "aff_unique_norm": "Graphcore", "aff_unique_dep": "", "aff_unique_url": "https://www.graphcore.ai", "aff_unique_abbr": "Graphcore", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "United Kingdom" }, { "id": "AJ7tnHhgWZ", "title": "Enhancing Vision-Language Prompt Learning through Image-Text Distribution Alignment", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Large vision-language models (VLMs) such as CLIP have demonstrated impressive performance in zero-shot image classification tasks. These models usually leverage prompts to align the text and image distributions. However, existing prompting techniques have limitations in terms of interpretability or dynamic alignment of distributions. Specifically, the discrete prompt learning methods cannot effectively perform dynamic alignment of distributions, while the soft prompt learning method have very limited interpretability, rendering them challenging to comprehend and enhance. To jointly solve these issues, we leverage the interpretable descriptions to facilitate the soft prompt learning. In this paper, we introduce a novel training-free strategy to mitigate the distribution gap between plain text and image-text corpus, leveraging the power of pretrained models like GPT-3 to enhance image classification performance. Furthermore, we propose a new few-shot learning pipeline that incorporates a prompt learning and reweighting strategy to dynamically mitigate the image and text distribution gap. This method overcomes the limitations of existing prompting techniques and offers a more effective and interpretable solution for image classification tasks. 
Extensive experiments show the effectiveness of our method and illustrate the interpretability of our descriptions.", "keywords": "Domain adaptaion;CLIP;Prompt learning", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Dongliang Guo;Handong Zhao;Sungchul Kim;Ryan A. Rossi;Tong Yu;Sheng Li", "authorids": "~Dongliang_Guo1;~Handong_Zhao3;~Sungchul_Kim1;~Ryan_A._Rossi2;~Tong_Yu3;~Sheng_Li3", "gender": "M;M;;M;;M", "homepage": "https://donglgcn.github.io/;https://sites.google.com/site/subright;https://www.linkedin.com/in/tong-yu-42790744;http://sheng-li.org;https://hdzhao.github.io/;http://ryanrossi.com", "dblp": "48/7696-2.html;61/1573;32/1593-1;23/3439-1;79/8522;17/5085", "google_scholar": ";v8ISLgIAAAAJ;https://scholar.google.com/citations?hl=en;DEncVcYAAAAJ;0f-YOFgAAAAJ;_Dc6lbQAAAAJ", "orcid": "0000-0003-2856-4011;0000-0003-3580-5290;0000-0002-5991-2050;0000-0003-1205-8632;;0000-0001-9758-0635", "linkedin": ";;tong-yu-42790744;sheng-li-15a70022/;;", "or_profile": "~Dongliang_Guo1;~Sungchul_Kim1;~Tong_Yu3;~Sheng_Li3;~Handong_Zhao1;~Ryan_Rossi1", "aff": "University of Virginia, Charlottesville;Adobe Systems;Adobe Research;University of Virginia, Charlottesville;Adobe Systems;Adobe Research", "aff_domain": "virginia.edu;adobe.com;adobe.com;virginia.edu;adobe.com;adobe.com", "position": "PhD student;Researcher;Senior Research Scientist;Associate Professor;Research Scientist;Senior Research Scientist", "bibtex": "@misc{\nguo2024enhancing,\ntitle={Enhancing Vision-Language Prompt Learning through Image-Text Distribution Alignment},\nauthor={Dongliang Guo and Handong Zhao and Sungchul Kim and Ryan A. Rossi and Tong Yu and Sheng Li},\nyear={2024},\nurl={https://openreview.net/forum?id=AJ7tnHhgWZ}\n}", "github": "", "project": "", "reviewers": "1JaY;W7r5;sZnc", "site": "https://openreview.net/forum?id=AJ7tnHhgWZ", "pdf_size": 1873941, "rating": "3;3;3", "confidence": "4;5;5", "soundness": "2;2;2", "contribution": "2;2;1", "presentation": "2;2;2", "wc_summary": "79;84;104", "wc_strengths": "102;25;89", "wc_weaknesses": "290;740;306", "wc_questions": "202;6;2", "wc_review": "673;855;501", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 3.0, 0.0 ], "confidence_avg": [ 4.666666666666667, 0.4714045207910317 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 1.6666666666666667, 0.4714045207910317 ], "presentation_avg": [ 2.0, 0.0 ], "wc_summary_avg": [ 89.0, 10.801234497346433 ], "wc_strengths_avg": [ 72.0, 33.65511352924941 ], "wc_weaknesses_avg": [ 445.3333333333333, 208.46315954836933 ], "wc_questions_avg": [ 70.0, 93.35237900914291 ], "wc_review_avg": [ 676.3333333333334, 144.5391142755329 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 3, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:Y40cEljJIjgJ:scholar.google.com/&scioq=Enhancing+Vision-Language+Prompt+Learning+through+Image-Text+Distribution+Alignment&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1;1;0;1;1", "aff_unique_norm": "University of Virginia;Adobe", "aff_unique_dep": ";Adobe Systems Incorporated", "aff_unique_url": "https://www.virginia.edu;https://www.adobe.com", "aff_unique_abbr": "UVA;Adobe", "aff_campus_unique_index": "0;0", 
"aff_campus_unique": "Charlottesville;", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "United States" }, { "title": "Backdoor Federated Learning by Poisoning Backdoor-Critical Layers", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19268", "id": "AJBGSVSTT2", "author_site": "Haomin Zhuang, Mingxian Yu, Hao Wang, Yang Hua, Jian Li, Xu Yuan", "tldr": "", "abstract": "Federated learning (FL) has been widely deployed to enable machine learning training on sensitive data across distributed devices. However, the decentralized learning paradigm and heterogeneity of FL further extend the attack surface for backdoor attacks. Existing FL attack and defense methodologies typically focus on the whole model. None of them recognizes the existence of backdoor-critical (BC) layers-a small subset of layers that dominate the model vulnerabilities. Attacking the BC layers achieves equivalent effects as attacking the whole model but at a far smaller chance of being detected by state-of-the-art (SOTA) defenses. This paper proposes a general in-situ approach that identifies and verifies BC layers from the perspective of attackers. Based on the identified BC layers, we carefully craft a new backdoor attack methodology that adaptively seeks a fundamental balance between attacking effects and stealthiness under various defense strategies. Extensive experiments show that our BC layer-aware backdoor attacks can successfully backdoor FL under seven SOTA defenses with only 10% malicious clients and outperform the latest backdoor attack methods.", "keywords": "Federated Learning;Backdoor Attack", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/60ac36473d69d31eaa56e5f7104eae3c979a5554.zip", "author": "Haomin Zhuang;Mingxian Yu;Hao Wang;Yang Hua;Jian Li;Xu Yuan", "authorids": "~Haomin_Zhuang1;~Mingxian_Yu1;~Hao_Wang29;~Yang_Hua2;~Jian_Li14;~Xu_Yuan1", "gender": ";;M;M;M;M", "homepage": "https://zhmzm.github.io/;;https://www.haow.us;https://pure.qub.ac.uk/en/persons/yang-hua;https://sites.google.com/stonybrook.edu/jianli;https://yuanxuyx.github.io/", "dblp": "344/1798;;w/HaoWang-22;;33/5448-8;24/6114-1", "google_scholar": "vXllNroAAAAJ;;r-Ik__gAAAAJ;N0tFi8MAAAAJ;h039Yq4AAAAJ;R3XkwA8AAAAJ", "orcid": ";0009-0008-8547-7831;0000-0002-1444-2657;0000-0001-5536-503X;;", "linkedin": ";;haowanguoft/;;;", "or_profile": "~Haomin_Zhuang1;~Mingxian_Yu1;~Hao_Wang29;~Yang_Hua2;~Jian_Li14;~Xu_Yuan1", "aff": "University of Notre Dame;SUN YAT-SEN UNIVERSITY;Louisiana State University;Queen's University Belfast;State University of New York at Stony Brook;University of Delaware", "aff_domain": "nd.edu;sysu.edu.cn;lsu.edu;qub.ac.uk;stonybrook.edu;udel.edu", "position": "PhD student;MS student;Assistant Professor;Assistant Professor;Assistant Professor;Associate Professor", "bibtex": "@inproceedings{\nzhuang2024backdoor,\ntitle={Backdoor Federated Learning by Poisoning Backdoor-Critical Layers},\nauthor={Haomin Zhuang and Mingxian Yu and Hao Wang and Yang Hua and Jian Li and Xu Yuan},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=AJBGSVSTT2}\n}", "github": "", "project": "", "reviewers": "EGpy;MrXZ;vQhS;tdce", "pdf_size": 1740676, "rating": "6;6;6;6", "confidence": "4;4;4;3", "soundness": "3;3;3;2", "contribution": "3;2;3;2", "presentation": "3;2;3;3", "wc_summary": "73;76;128;143", "wc_strengths": "11;49;94;27", "wc_weaknesses": "125;229;84;27", 
"wc_questions": "151;63;20;143", "wc_review": "360;417;326;340", "wc_reply_reviewers": "23;132;0;20", "wc_reply_authors": "559;1082;436;854", "reply_reviewers": "1;2;0;1", "reply_authors": "2;3;2;3", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 105.0, 30.97579700346708 ], "wc_strengths_avg": [ 45.25, 31.21197686786276 ], "wc_weaknesses_avg": [ 116.25, 73.81522539422338 ], "wc_questions_avg": [ 94.25, 54.96987811520051 ], "wc_review_avg": [ 360.75, 34.65093793824346 ], "wc_reply_reviewers_avg": [ 43.75, 51.71254683343299 ], "wc_reply_authors_avg": [ 732.75, 252.45135670065233 ], "reply_reviewers_avg": [ 1.0, 0.7071067811865476 ], "reply_authors_avg": [ 2.5, 0.5 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 16, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=13229252772080574765&as_sdt=8005&sciodt=0,7&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=AJBGSVSTT2", "pdf": "https://openreview.net/pdf?id=AJBGSVSTT2", "email": "nd.edu;sysu.edu.cn;lsu.edu;qub.ac.uk;stonybrook.edu;udel.edu", "author_num": 6, "aff_unique_index": "0;1;2;3;4;5", "aff_unique_norm": "University of Notre Dame;Sun Yat-sen University;Louisiana State University;Queen's University Belfast;State University of New York at Stony Brook;University of Delaware", "aff_unique_dep": ";;;;;", "aff_unique_url": "https://www.nd.edu;http://www.sysu.edu.cn;https://www.lsu.edu;https://www.qub.ac.uk;https://www.stonybrook.edu;https://www.udel.edu", "aff_unique_abbr": "Notre Dame;SYSU;LSU;QUB;SUNY Stony Brook;UD", "aff_campus_unique_index": "1", "aff_campus_unique": ";Stony Brook", "aff_country_unique_index": "0;1;0;2;0;0", "aff_country_unique": "United States;China;United Kingdom" }, { "title": "Causality-Inspired Spatial-Temporal Explanations for Dynamic Graph Neural Networks", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19267", "id": "AJBkfwXh3u", "author_site": "Kesen Zhao, Liang Zhang", "tldr": "", "abstract": "Dynamic Graph Neural Networks (DyGNNs) have gained significant popularity in the research of dynamic graphs, but are limited by the low transparency, such that human-understandable insights can hardly be drawn from their predictions. Although a number of existing research have been devoted to investigating the interpretability of graph neural networks (GNNs), achieving the interpretability of DyGNNs is pivotally challenging due to the complex spatial-temporal correlations in dynamic graphs. To this end, we propose an innovative causality-inspired generative model based on structural causal model (SCM), which explores the underlying philosophies of DyGNN predictions by identifying the trivial, static, and dynamic causal relationships. To reach this goal, two critical tasks need to be accomplished including (1) disentangling the complex causal relationships, and (2) fitting the spatial-temporal explanations of DyGNNs in the SCM architecture. To tackle these challenges, the proposed method incorporates a contrastive learning module to disentangle trivial and causal relationships, and a dynamic correlating module to disentangle dynamic and static causal relationships, respectively. 
A dynamic VGAE-based framework is further developed, which generates causal-and-dynamic masks for spatial interpretability, and recognizes dynamic relationships along the time horizon through causal invention for temporal interpretability. Comprehensive experiments have been conducted on both synthetic and real-world datasets, where our approach yields substantial improvements, thereby demonstrating significant superiority.", "keywords": "Dynamic Graph;Graph Explanation;Graph Neural Network;Causal Inference", "primary_area": "learning on graphs and other geometries & topologies", "supplementary_material": "/attachment/6961ddeb5ee2ee2596341db5f50262266b74bb58.zip", "author": "Kesen Zhao;Liang Zhang", "authorids": "~Kesen_Zhao1;~Liang_Zhang17", "gender": "M;M", "homepage": ";https://sites.google.com/view/liangzhang1111/liang-zhang-hk-polyu", "dblp": "331/3303;", "google_scholar": ";MKlx5KsAAAAJ", "orcid": ";0000-0002-5805-7099", "linkedin": ";", "or_profile": "~Kesen_Zhao1;~Liang_Zhang17", "aff": "Nanyang Technological University;Shenzhen Research Institute of Big Data", "aff_domain": "ntu.edu.sg;sribd.cn", "position": "PhD student;Researcher", "bibtex": "@inproceedings{\nzhao2024causalityinspired,\ntitle={Causality-Inspired Spatial-Temporal Explanations for Dynamic Graph Neural Networks},\nauthor={Kesen Zhao and Liang Zhang},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=AJBkfwXh3u}\n}", "github": "", "project": "", "reviewers": "JCbW;fzQP;8sLV;U7py", "pdf_size": 563165, "rating": "5;5;6;8", "confidence": "4;2;4;2", "soundness": "2;2;3;3", "contribution": "2;2;3;3", "presentation": "3;1;3;3", "wc_summary": "51;44;94;61", "wc_strengths": "77;71;49;59", "wc_weaknesses": "263;102;322;9", "wc_questions": "141;50;2;12", "wc_review": "532;267;467;141", "wc_reply_reviewers": "29;0;56;0", "wc_reply_authors": "650;833;680;108", "reply_reviewers": "1;0;1;0", "reply_authors": "1;2;1;1", "rating_avg": [ 6.0, 1.224744871391589 ], "confidence_avg": [ 3.0, 1.0 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.5, 0.8660254037844386 ], "wc_summary_avg": [ 62.5, 19.1637678967368 ], "wc_strengths_avg": [ 64.0, 10.816653826391969 ], "wc_weaknesses_avg": [ 174.0, 124.73371637211808 ], "wc_questions_avg": [ 51.25, 54.82415070021605 ], "wc_review_avg": [ 351.75, 156.02143282254525 ], "wc_reply_reviewers_avg": [ 21.25, 23.29565410114084 ], "wc_reply_authors_avg": [ 567.75, 274.3595952395323 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.40824829046386296, "gs_citation": 7, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14135559314020236466&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 2, "openreview": "https://openreview.net/forum?id=AJBkfwXh3u", "pdf": "https://openreview.net/pdf?id=AJBkfwXh3u", "email": "ntu.edu.sg;sribd.cn", "author_num": 2, "aff_unique_index": "0;1", "aff_unique_norm": "Nanyang Technological University;Shenzhen Research Institute of Big Data", "aff_unique_dep": ";", "aff_unique_url": "https://www.ntu.edu.sg;http://www.sribd.cn", "aff_unique_abbr": "NTU;", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1", "aff_country_unique": "Singapore;China" }, { "id": "AJgVY0zOB0", "title": "Weakly-supervised Camera Localization by Ground-to-satellite Image Registration", "track": "main", "status": 
"Reject", "tldr": "", "abstract": "The ground-to-satellite image matching/retrieval was initially proposed for city-scale ground camera localization. Recently, more and more attention has been paid to increasing the camera pose accuracy by ground-to-satellite image matching, once a coarse location and orientation has been obtained from the city-scale retrieval. This paper addresses the same scenario. \nHowever, existing learning-based methods for solving this task require accurate GPS labels of ground images for network training. \nUnfortunately, obtaining such accurate GPS labels is not always possible, often requiring an expensive RTK setup and suffering from signal occlusion, multi-path signal disruptions, \\etc. \nTo address this issue, this paper proposes a weakly-supervised learning strategy for ground-to-satellite image registration. It does not require highly accurate ground truth (GT)\npose labels for ground images in the training dataset. Instead, a coarse location and orientation label, either derived from the city-scale retrieval or noisy sensors (GPS, compass, \\etc), is sufficient. \nSpecifically, we present a pseudo image pair creation strategy for cross-view rotation estimation network training, and a novel method that leverages deep metric learning for translation estimation between ground-and-satellite image pairs.\nExperimental results show that our weakly-supervised learning strategy achieves the best performance on cross-area evaluation, compared to the recent state-of-the-art methods that require accurate pose labels for supervision, and shows comparable performance on same-area evaluation.", "keywords": "Cross-view localization;ground-to-satellite image matching;cross-view image matching", "primary_area": "applications to robotics, autonomy, planning", "supplementary_material": "", "author": "Yujiao Shi;Hongdong Li;Akhil Perincherry;Ankit Vora", "authorids": "~Yujiao_Shi1;~Hongdong_Li1;~Akhil_Perincherry1;~Ankit_Vora1", "gender": "F;M;;M", "homepage": "https://shiyujiao.github.io/;http://users.cecs.anu.edu.au/~hongdong/;;https://ankitvora19.wixsite.com/portfolio", "dblp": "159/2546;59/4859.html;;242/8412", "google_scholar": "rVsRpZEAAAAJ;https://scholar.google.com.tw/citations?hl=en;;EUS0qnEAAAAJ", "orcid": "0000-0001-6028-9051;;;0000-0001-7976-8730", "linkedin": "yujiao-shi-053a12198/;;;https://linkedin.com/in/ankitvora1", "or_profile": "~Yujiao_Shi1;~Hongdong_Li1;~Akhil_Perincherry1;~Ankit_Vora1", "aff": "Australian National University;Australian National University;;Ford Motor Company", "aff_domain": "anu.edu.au;anu.edu.au;;ford.com", "position": "Postdoc;Full Professor;;Researcher", "bibtex": "@misc{\nshi2024weaklysupervised,\ntitle={Weakly-supervised Camera Localization by Ground-to-satellite Image Registration},\nauthor={Yujiao Shi and Hongdong Li and Akhil Perincherry and Ankit Vora},\nyear={2024},\nurl={https://openreview.net/forum?id=AJgVY0zOB0}\n}", "github": "", "project": "", "reviewers": "9PqU;db9o;mQu3", "site": "https://openreview.net/forum?id=AJgVY0zOB0", "pdf_size": 21753895, "rating": "3;6;6", "confidence": "5;4;4", "soundness": "3;3;3", "contribution": "2;3;3", "presentation": "3;3;3", "wc_summary": "118;80;110", "wc_strengths": "36;76;167", "wc_weaknesses": "200;148;197", "wc_questions": "18;36;91", "wc_review": "372;340;565", "wc_reply_reviewers": "0;20;146", "wc_reply_authors": "685;694;395", "reply_reviewers": "0;1;1", "reply_authors": "1;1;1", "rating_avg": [ 5.0, 1.4142135623730951 ], "confidence_avg": [ 4.333333333333333, 0.4714045207910317 
], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 102.66666666666667, 16.35712552851373 ], "wc_strengths_avg": [ 93.0, 54.81483983983413 ], "wc_weaknesses_avg": [ 181.66666666666666, 23.837412238374835 ], "wc_questions_avg": [ 48.333333333333336, 31.05192783422991 ], "wc_review_avg": [ 425.6666666666667, 99.38589213543116 ], "wc_reply_reviewers_avg": [ 55.333333333333336, 64.62885492478486 ], "wc_reply_authors_avg": [ 591.3333333333334, 138.87724395626842 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -1.0, "gs_citation": 4, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14290918079063947141&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 8, "aff_unique_index": "0;0;1", "aff_unique_norm": "Australian National University;Ford Motor Company", "aff_unique_dep": ";", "aff_unique_url": "https://www.anu.edu.au;https://www.ford.com", "aff_unique_abbr": "ANU;Ford", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;1", "aff_country_unique": "Australia;United States" }, { "id": "AKAlVyunxA", "title": "SHINE: Shielding Backdoors in Deep Reinforcement Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "Recent studies have discovered that similar to supervised classifiers, a deep reinforcement learning (DRL) policy is also vulnerable to backdoor attacks. Existing defenses against backdoor attacks either do not consider RL's unique mechanism or make unrealistic assumptions, resulting in limited defense efficacy, practicability, and generalizability. In this work, we propose SHINE, a novel backdoor shielding method for DRL. SHINE first leverages policy explanation techniques to identify the backdoor triggers and then designs a policy retraining algorithm to eliminate the negative impact of the triggers on backdoored agents. We theoretically prove that SHINE guarantees to improve a backdoored agent's performance in a poisoned environment while ensuring its performance difference in the clean environment before and after shielding is bounded. We further conduct extensive experiments that evaluate SHINE against three mainstream DRL backdoor attacks in various benchmark RL environments. 
Our results show that SHINE significantly outperforms existing defenses in mitigating these backdoor attacks.", "keywords": "deep reinforcement learning;trojan backdoor;explanation", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/658689c17d6bf5701683a010a94f12063ad683d2.zip", "author": "Wenbo Guo;Zhuowen Yuan;Jinyuan Jia;Bo Li;Dawn Song", "authorids": "~Wenbo_Guo1;~Zhuowen_Yuan1;~Jinyuan_Jia2;~Bo_Li19;~Dawn_Song1", "gender": "M;M;;F;F", "homepage": "https://henrygwb.github.io/;;https://jinyuan-jia.github.io/;http://boli.cs.illinois.edu/;", "dblp": "144/1238-2.html;304/3576;24/5124-1.html;50/3402-26;s/DXSong", "google_scholar": "KyPheRMAAAAJ;F-r0bYQAAAAJ;iyg4ytkAAAAJ;K8vJkTcAAAAJ;", "orcid": ";;0000-0002-9785-7769;;", "linkedin": ";;;;", "or_profile": "~Wenbo_Guo1;~Zhuowen_Yuan1;~Jinyuan_Jia2;~Bo_Li19;~Dawn_Song1", "aff": "University of California, Santa Barbara;University of Illinois Urbana-Champaign;Pennsylvania State University;University of Illinois, Urbana Champaign;University of California, Berkeley", "aff_domain": "ucsb.edu;illinois.edu;psu.edu;illinois.edu;berkeley.edu", "position": "Assistant Professor;PhD student;Assistant Professor;Assistant Professor;Full Professor", "bibtex": "@misc{\nguo2024shine,\ntitle={{SHINE}: Shielding Backdoors in Deep Reinforcement Learning},\nauthor={Wenbo Guo and Zhuowen Yuan and Jinyuan Jia and Bo Li and Dawn Song},\nyear={2024},\nurl={https://openreview.net/forum?id=AKAlVyunxA}\n}", "github": "", "project": "", "reviewers": "F9HD;2tnZ;5eAS;r1tp", "site": "https://openreview.net/forum?id=AKAlVyunxA", "pdf_size": 1157602, "rating": "5;6;6;6", "confidence": "5;4;2;3", "soundness": "2;2;3;3", "contribution": "3;3;3;3", "presentation": "3;3;3;2", "wc_summary": "90;173;66;74", "wc_strengths": "32;75;53;77", "wc_weaknesses": "171;195;31;130", "wc_questions": "162;235;1;32", "wc_review": "455;678;151;313", "wc_reply_reviewers": "120;198;22;0", "wc_reply_authors": "1077;1714;397;745", "reply_reviewers": "2;3;1;0", "reply_authors": "4;4;3;2", "rating_avg": [ 5.75, 0.4330127018922193 ], "confidence_avg": [ 3.5, 1.118033988749895 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 100.75, 42.5991490525339 ], "wc_strengths_avg": [ 59.25, 18.335416548308903 ], "wc_weaknesses_avg": [ 131.75, 62.63934466451577 ], "wc_questions_avg": [ 107.5, 95.22210877732125 ], "wc_review_avg": [ 399.25, 193.5695934283068 ], "wc_reply_reviewers_avg": [ 85.0, 79.3536388579629 ], "wc_reply_authors_avg": [ 983.25, 485.6018816891055 ], "reply_reviewers_avg": [ 1.5, 1.118033988749895 ], "reply_authors_avg": [ 3.25, 0.82915619758885 ], "replies_avg": [ 25, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.7745966692414834, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6033307709105802344&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 7, "aff_unique_index": "0;1;2;1;3", "aff_unique_norm": "University of California, Santa Barbara;University of Illinois Urbana-Champaign;Pennsylvania State University;University of California, Berkeley", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.ucsb.edu;https://illinois.edu;https://www.psu.edu;https://www.berkeley.edu", "aff_unique_abbr": "UCSB;UIUC;PSU;UC Berkeley", "aff_campus_unique_index": "0;1;1;3", "aff_campus_unique": "Santa Barbara;Urbana-Champaign;;Berkeley", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "United 
States" }, { "id": "AKJLnDgzkm", "title": "Welfare Diplomacy: Benchmarking Language Model Cooperation", "track": "main", "status": "Reject", "tldr": "", "abstract": "The growing capabilities and increasingly widespread deployment of AI systems necessitate robust benchmarks for measuring their cooperative capabilities. Unfortunately, most multi-agent benchmarks are either zero-sum or purely cooperative, providing limited opportunities for such measurements. We introduce a general-sum variant of the zero-sum board game Diplomacy\u2014called Welfare Diplomacy\u2014in which players must balance investing in military conquest and domestic welfare. We argue that Welfare Diplomacy facilitates both a clearer assessment of and stronger training incentives for cooperative capabilities. Our contributions are: (1) proposing the Welfare Diplomacy rules and implementing them via an open- source Diplomacy engine; (2) constructing baseline agents using zero-shot prompted language models; and (3) conducting experiments where we find that baselines using state-of-the-art models attain high social welfare but are exploitable. Our work aims to promote societal safety by aiding researchers in developing and assessing multi-agent AI systems. Code to evaluate Welfare Diplomacy and reproduce our experiments is available at https://anonymous.4open.science/r/welfare-diplomacy-72AC.", "keywords": "multiagent systems;cooperative AI;AI agents;language models", "primary_area": "datasets and benchmarks", "supplementary_material": "/attachment/9076a3d46cd1dfd13e87f73ee5ff9636ce6368be.pdf", "author": "Gabriel Mukobi;Hannah Erlebach;Niklas Lauffer;Lewis Hammond;Alan Chan;Jesse Clifton", "authorids": "~Gabriel_Mukobi1;~Hannah_Erlebach1;~Niklas_Lauffer1;~Lewis_Hammond1;~Alan_Chan2;~Jesse_Clifton1", "gender": "M;F;M;;M;M", "homepage": "https://gabrielmukobi.com/;;https://niklaslauffer.github.io/;https://www.lewishammond.com/;https://achan.ca;https://statistics.sciences.ncsu.edu/people/jclifto/", "dblp": ";;;228/6647;;", "google_scholar": ";;;8fYnp7UAAAAJ;lmQmYPgAAAAJ;", "orcid": ";;;0000-0003-1695-0871;;", "linkedin": "gabrielmukobi/;hannah-erlebach-625159195/;;lrhammond/;alan-chan-51858378/;", "or_profile": "~Gabriel_Mukobi1;~Hannah_Erlebach1;~Niklas_Lauffer1;~Lewis_Hammond1;~Alan_Chan2;~Jesse_Clifton1", "aff": "Computer Science Department, Stanford University;University College London, University of London;University of California, Berkeley;University of Oxford;University of Montreal;", "aff_domain": "cs.stanford.edu;ucl.ac.uk;berkeley.edu;ox.ac.uk;umontreal.ca;", "position": "MS student;MS student;PhD student;PhD student;PhD student;", "bibtex": "@misc{\nmukobi2024welfare,\ntitle={Welfare Diplomacy: Benchmarking Language Model Cooperation},\nauthor={Gabriel Mukobi and Hannah Erlebach and Niklas Lauffer and Lewis Hammond and Alan Chan and Jesse Clifton},\nyear={2024},\nurl={https://openreview.net/forum?id=AKJLnDgzkm}\n}", "github": "", "project": "", "reviewers": "zuKK;A4aM;R7WR", "site": "https://openreview.net/forum?id=AKJLnDgzkm", "pdf_size": 17615370, "rating": "5;6;8", "confidence": "4;3;4", "soundness": "3;3;3", "contribution": "2;3;3", "presentation": "2;3;3", "wc_summary": "39;74;43", "wc_strengths": "71;55;73", "wc_weaknesses": "209;61;60", "wc_questions": "103;64;266", "wc_review": "422;254;442", "wc_reply_reviewers": "67;0;0", "wc_reply_authors": "709;435;734", "reply_reviewers": "1;0;0", "reply_authors": "2;1;1", "rating_avg": [ 6.333333333333333, 1.247219128924647 ], "confidence_avg": [ 3.6666666666666665, 
0.4714045207910317 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 52.0, 15.641824275533422 ], "wc_strengths_avg": [ 66.33333333333333, 8.055363982396383 ], "wc_weaknesses_avg": [ 110.0, 70.00476174280338 ], "wc_questions_avg": [ 144.33333333333334, 87.49222187651249 ], "wc_review_avg": [ 372.6666666666667, 84.30631978419859 ], "wc_reply_reviewers_avg": [ 22.333333333333332, 31.584102892999123 ], "wc_reply_authors_avg": [ 626.0, 135.44248471829903 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 1.3333333333333333, 0.4714045207910317 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.18898223650461363, "gs_citation": 33, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=7008315424132990650&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "aff_unique_index": "0;1;2;3;4", "aff_unique_norm": "Stanford University;University College London;University of California, Berkeley;University of Oxford;University of Montreal", "aff_unique_dep": "Computer Science Department;;;;", "aff_unique_url": "https://www.stanford.edu;https://www.ucl.ac.uk;https://www.berkeley.edu;https://www.ox.ac.uk;https://www.umontreal.ca", "aff_unique_abbr": "Stanford;UCL;UC Berkeley;Oxford;UM", "aff_campus_unique_index": "0;2", "aff_campus_unique": "Stanford;;Berkeley", "aff_country_unique_index": "0;1;0;1;2", "aff_country_unique": "United States;United Kingdom;Canada" }, { "id": "AKZtQO81GQ", "title": "Evaluating model bias requires characterizing model mistakes", "track": "main", "status": "Reject", "tldr": "", "abstract": "The ability to properly benchmark model performance in the face of spurious correlation is important to both build better predictors and increase confidence that models are operating as intended. We demonstrate that characterizing (as opposed to simply quantifying) model mistakes across subgroups is pivotal to properly reflect model biases, which are ignored by standard metrics such as worst-group accuracy or accuracy gap. Inspired by the hypothesis testing framework, we introduce SkewSize, a flexible metric that captures bias from mistakes in a model\u2019s predictions. It can be used in multi-class settings or generalised to the open vocabulary setting of generative models. SkewSize is an aggregation of the effect size of the interaction between two categorical variables: the independent variable, representing the bias attribute (i.e. subgroup), and the dependent variable, representing the model\u2019s prediction. We demonstrate the utility of SkewSize in multiple settings including: standard vision models trained on synthetic data, vision models trained on ImageNet as well as the DomainNet distribution shift benchmark, and large scale vision-language models from the BLIP-2 family. 
In each case, the proposed SkewSize is able to highlight biases not captured by other metrics, while also providing insights on the impact of recently proposed techniques, such as instruction tuning.", "keywords": "model bias;performance disparity across subgroups;neural networks evaluation", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/d200a4ccf3be2e7b00c79399a1bacc8c9977b297.zip", "author": "Isabela Albuquerque;Jessica Schrouff;David Warde-Farley;Ali Taylan Cemgil;Sven Gowal;Olivia Wiles", "authorids": "~Isabela_Albuquerque1;~Jessica_Schrouff1;~David_Warde-Farley1;~Ali_Taylan_Cemgil2;~Sven_Gowal2;~Olivia_Wiles1", "gender": "F;F;M;;M;M", "homepage": ";;;;https://www.cmpe.boun.edu.tr/~cemgil/;", "dblp": "210/2719;96/9449;71/9421;194/3191;41/6613;75/8368", "google_scholar": ";https://scholar.google.co.uk/citations?user=2YWm2nMAAAAJ;https://scholar.google.ca/citations?user=MOgfm8oAAAAJ;https://scholar.google.co.uk/citations?user=XQzHJSgAAAAJ;X3ZFZ7AAAAAJ;", "orcid": ";0000-0003-4992-3183;;;http://orcid.org/0000-0003-4463-8455;", "linkedin": ";jessica-schrouff/;;;;", "or_profile": "~Isabela_Albuquerque1;~Jessica_Schrouff1;~David_Warde-Farley1;~Olivia_Wiles1;~ali_taylan_cemgil1;~Sven_Gowal1", "aff": "Google DeepMind;Google DeepMind;Google DeepMind;Google;Bogazici University;Google DeepMind", "aff_domain": "deepmind.com;google.com;google.com;google.com;boun.edu.tr;google.com", "position": "Researcher;Senior Researcher;Research Scientist;Researcher;Full Professor;Research Engineer", "bibtex": "@misc{\nalbuquerque2024evaluating,\ntitle={Evaluating model bias requires characterizing model mistakes},\nauthor={Isabela Albuquerque and Jessica Schrouff and David Warde-Farley and Ali Taylan Cemgil and Sven Gowal and Olivia Wiles},\nyear={2024},\nurl={https://openreview.net/forum?id=AKZtQO81GQ}\n}", "github": "", "project": "", "reviewers": "1DWK;6Zhw;kSV6;bd8T", "site": "https://openreview.net/forum?id=AKZtQO81GQ", "pdf_size": 1076041, "rating": "5;5;6;8", "confidence": "4;4;4;2", "soundness": "3;4;3;3", "contribution": "2;2;2;3", "presentation": "4;3;4;2", "wc_summary": "64;46;71;81", "wc_strengths": "68;56;81;62", "wc_weaknesses": "205;140;116;8", "wc_questions": "119;4;2;100", "wc_review": "456;246;270;251", "wc_reply_reviewers": "113;117;208;0", "wc_reply_authors": "2975;1143;1555;38", "reply_reviewers": "1;1;2;0", "reply_authors": "7;4;3;1", "rating_avg": [ 6.0, 1.224744871391589 ], "confidence_avg": [ 3.5, 0.8660254037844386 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 3.25, 0.82915619758885 ], "wc_summary_avg": [ 65.5, 12.776932339180638 ], "wc_strengths_avg": [ 66.75, 9.256754290786809 ], "wc_weaknesses_avg": [ 117.25, 70.98371292064117 ], "wc_questions_avg": [ 56.25, 53.67669419776147 ], "wc_review_avg": [ 305.75, 87.20772614854718 ], "wc_reply_reviewers_avg": [ 109.5, 73.7580504080741 ], "wc_reply_authors_avg": [ 1427.75, 1051.5063896619934 ], "reply_reviewers_avg": [ 1.0, 0.7071067811865476 ], "reply_authors_avg": [ 3.75, 2.165063509461097 ], "replies_avg": [ 25, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.9428090415820632, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:sBOFi0Nj4nAJ:scholar.google.com/&scioq=Evaluating+model+bias+requires+characterizing+model+mistakes&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;0;0;0;1;0", "aff_unique_norm": "Google;Bogazici University", 
"aff_unique_dep": "Google DeepMind;", "aff_unique_url": "https://deepmind.com;https://www.boun.edu.tr", "aff_unique_abbr": "DeepMind;BU", "aff_campus_unique_index": "1", "aff_campus_unique": ";Mountain View", "aff_country_unique_index": "0;0;0;1;2;0", "aff_country_unique": "United Kingdom;United States;T\u00fcrkiye" }, { "id": "AL1fq05o7H", "title": "Mamba: Linear-Time Sequence Modeling with Selective State Spaces", "track": "main", "status": "Reject", "tldr": "", "abstract": "Foundation models, now powering most of the exciting applications in deep learning, are almost universally based on the Transformer architecture and its core attention module. Many subquadratic-time architectures such as linear attention, gated convolution and recurrent models, and structured state space models (SSMs) have been developed to address Transformers' computational inefficiency on long sequences, but they have not performed as well as attention on important modalities such as language. We identify that a key weakness of such models is their inability to perform content-based reasoning, and make several improvements. First, simply letting the SSM parameters be functions of the input addresses their weakness with discrete modalities, allowing the model to *selectively* propagate or forget information along the sequence length dimension depending on the current token. Second, even though this change prevents the use of efficient convolutions, we design a hardware-aware parallel algorithm in recurrent mode. We integrate these selective SSMs into a simplified end-to-end neural network architecture without attention or even MLP blocks (**Mamba**). Mamba enjoys fast inference (5$\\times$ higher throughput than Transformers) and linear scaling in sequence length, and its performance improves on real data up to million-length sequences. As a general sequence model backbone, Mamba achieves state-of-the-art performance across several modalities such as language, audio, and genomics. 
On language modeling, our Mamba-1.4B model outperforms Transformers of the same size and matches Transformers twice its size, both in pretraining and downstream evaluation.", "keywords": "Sequence model;language model;state space model;RNN;SSM;S4;Mamba", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Albert Gu;Tri Dao", "authorids": "~Albert_Gu1;~Tri_Dao1", "gender": "M;", "homepage": ";https://tridao.me/", "dblp": "130/0612;206/7018", "google_scholar": "DVCHv1kAAAAJ;NQRw0bQAAAAJ", "orcid": "0000-0002-4946-6042;", "linkedin": ";", "or_profile": "~Albert_Gu1;~Tri_Dao1", "aff": "Carnegie Mellon University;Princeton University", "aff_domain": "cmu.edu;princeton.edu", "position": "Assistant Professor;Assistant Professor", "bibtex": "@misc{\ngu2024mamba,\ntitle={Mamba: Linear-Time Sequence Modeling with Selective State Spaces},\nauthor={Albert Gu and Tri Dao},\nyear={2024},\nurl={https://openreview.net/forum?id=AL1fq05o7H}\n}", "github": "", "project": "", "reviewers": "du8a;iEaX;sf96;5ZBk", "site": "https://openreview.net/forum?id=AL1fq05o7H", "pdf_size": 639407, "rating": "3;6;8;8", "confidence": "5;2;4;5", "soundness": "2;3;4;4", "contribution": "2;3;3;4", "presentation": "3;3;4;4", "wc_summary": "60;186;83;52", "wc_strengths": "71;60;69;20", "wc_weaknesses": "385;13;10;210", "wc_questions": "2;38;46;120", "wc_review": "518;297;208;402", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "2115;335;229;473", "reply_reviewers": "0;0;0;0", "reply_authors": "4;1;1;1", "rating_avg": [ 6.25, 2.0463381929681126 ], "confidence_avg": [ 4.0, 1.224744871391589 ], "soundness_avg": [ 3.25, 0.82915619758885 ], "contribution_avg": [ 3.0, 0.7071067811865476 ], "presentation_avg": [ 3.5, 0.5 ], "wc_summary_avg": [ 95.25, 53.6161123171011 ], "wc_strengths_avg": [ 55.0, 20.627651344736268 ], "wc_weaknesses_avg": [ 154.5, 155.81479390609866 ], "wc_questions_avg": [ 51.5, 42.88064831599448 ], "wc_review_avg": [ 356.25, 115.91456983485726 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 788.0, 771.0129700595185 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.75, 1.299038105676658 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.09975093361076329, "gs_citation": 3100, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=3513516483726437226&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 11, "aff_unique_index": "0;1", "aff_unique_norm": "Carnegie Mellon University;Princeton University", "aff_unique_dep": ";", "aff_unique_url": "https://www.cmu.edu;https://www.princeton.edu", "aff_unique_abbr": "CMU;Princeton", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "id": "AL4tS0HhJT", "title": "Post-prediction confidence training complements supervised learning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Wrong prediction is bad. For users, having high confidence on a wrong prediction is even worse. Since even the best-trained class-label predictor will have some chance of making mistakes, users, especially in some AI application areas such as personalized medicine, may want to tell the high quality predictions from the low quality ones. In convolutional neural networks (CNN), confidence on a prediction is associated with the softmax output layer, which gives a probability distribution on the class-labels. 
But even a prediction with 95\\% probability concentrated on one class may still turn out wrong many times more often than the anticipated rate of 5\\%. There are at least three main sources of uncertainty that can cause a large anticipation gap. The first one is that some of the test samples may not belong to the same distribution as the training samples. The second one is the severe population heterogeneity within each class, causing the variation of prediction quality across some hidden subpopulations. The third one is the imperfectness of the prediction model. While most research is focused on the first source of prediction uncertainty, the other two receive much less attention. Here we take a different approach, termed post-prediction confidence training (PPCT), to guide users on how to discern the high-quality predictions from the low-quality ones. Distinctively different from other methods including conformal prediction, PPCT entertains all three sources of uncertainty by searching features to anchor the criticism of prediction quality. An enhancement to CNN configuration is required during network training. We propose a blueprint by coupling each logit node (T channel) in the layer feeding to softmax with an additional node (C channel) and using maxout to link the pair to the softmax layer. The C channel is introduced to counter the T channel as a contrastive feature against the feature of the target class. A high-quality prediction must follow a logically-lucid pattern between T and C for every class. Successful implementations of our methods on popular image datasets are reported.", "keywords": "supervised learning;prediction uncertainty;maxout;feature representation", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Yu-Cheng Li;Hao Ho;Ker-Chau Li", "authorids": "~Yu-Cheng_Li1;~Hao_Ho1;~Ker-Chau_Li1", "gender": "M;M;", "homepage": "https://www.stat.sinica.edu.tw/cht/index.php?act=researcher_manager&code=view&member=75;;http://statistics.ucla.edu/index.php/people1/all-faculty/7809-2/?smid=8818", "dblp": ";;", "google_scholar": ";;", "orcid": ";0000-0001-8911-7907;", "linkedin": ";;", "or_profile": "~Yu-Cheng_Li1;~Hao_Ho1;~Ker-Chau_Li1", "aff": "Academia Sinica;University of California, Los Angeles;UCLA, University of California, Los Angeles", "aff_domain": "sinica.edu.tw;ucla.edu;stat.ucla.edu", "position": "Postdoc;Assistant Professor;Full Professor", "bibtex": "@misc{\nli2024postprediction,\ntitle={Post-prediction confidence training complements supervised learning},\nauthor={Yu-Cheng Li and Hao Ho and Ker-Chau Li},\nyear={2024},\nurl={https://openreview.net/forum?id=AL4tS0HhJT}\n}", "github": "", "project": "", "reviewers": "2myu;c9j6;xsnZ;9DJD", "site": "https://openreview.net/forum?id=AL4tS0HhJT", "pdf_size": 4562090, "rating": "1;3;3;3", "confidence": "4;4;3;3", "soundness": "2;1;2;3", "contribution": "2;1;2;2", "presentation": "1;2;1;2", "wc_summary": "52;49;118;83", "wc_strengths": "20;13;81;54", "wc_weaknesses": "258;299;272;137", "wc_questions": "59;154;71;49", "wc_review": "389;515;542;323", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 2.5, 0.8660254037844386 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.0, 0.7071067811865476 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 1.5, 0.5 ], "wc_summary_avg": [ 75.5, 27.91504970441572 ], "wc_strengths_avg": [ 
42.0, 27.340446228984632 ], "wc_weaknesses_avg": [ 241.5, 62.10676291677099 ], "wc_questions_avg": [ 83.25, 41.583500333665995 ], "wc_review_avg": [ 442.25, 89.85926496472136 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:4zVtrlxgT0cJ:scholar.google.com/&scioq=Post-prediction+confidence+training+complements+supervised+learning&hl=en&as_sdt=0,14", "gs_version_total": 0, "aff_unique_index": "0;1;1", "aff_unique_norm": "Academia Sinica;University of California, Los Angeles", "aff_unique_dep": ";", "aff_unique_url": "https://www.sinica.edu.tw;https://www.ucla.edu", "aff_unique_abbr": "Academia Sinica;UCLA", "aff_campus_unique_index": "0;1;1", "aff_campus_unique": "Taiwan;Los Angeles", "aff_country_unique_index": "0;1;1", "aff_country_unique": "China;United States" }, { "title": "One Forward is Enough for Neural Network Training via Likelihood Ratio Method", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19266", "id": "ALGFFPXWSi", "author_site": "Jinyang Jiang, Zeliang Zhang, Chenliang Xu, Zhaofei Yu, Yijie Peng", "tldr": "", "abstract": "While backpropagation (BP) is the mainstream approach for gradient computation in neural network training, its heavy reliance on the chain rule of differentiation constrains the designing flexibility of network architecture and training pipelines. We avoid the recursive computation in BP and develop a unified likelihood ratio (ULR) method for gradient estimation with only one forward propagation. Not only can ULR be extended to train a wide variety of neural network architectures, but the computation flow in BP can also be rearranged by ULR for better device adaptation. Moreover, we propose several variance reduction techniques to further accelerate the training process. Our experiments offer numerical results across diverse aspects, including various neural network training scenarios, computation flow rearrangement, and fine-tuning of pre-trained models. 
All findings demonstrate that ULR effectively enhances the flexibility of neural network training by permitting localized module training without compromising the global objective and significantly boosts the network robustness.", "keywords": "stochastic optimization;gradient estimation", "primary_area": "optimization", "supplementary_material": "/attachment/31f1213f0c37cde70d7c20340d346e97cceb370d.zip", "author": "Jinyang Jiang;Zeliang Zhang;Chenliang Xu;Zhaofei Yu;Yijie Peng", "authorids": "~Jinyang_Jiang1;~Zeliang_Zhang1;~Chenliang_Xu1;~Zhaofei_Yu1;~Yijie_Peng1", "gender": "M;M;M;M;M", "homepage": ";https://github.com/ZhangAIPI;https://www.cs.rochester.edu/~cxu22/;https://yuzhaofei.github.io;https://www.gsm.pku.edu.cn/faculty/pengyijie/", "dblp": "209/2313-1;219/9383;117/4770;166/0573;", "google_scholar": ";7nLfsSgAAAAJ;https://scholar.google.com.tw/citations?user=54HfyDIAAAAJ;qaUgD50AAAAJ;", "orcid": "0009-0004-7145-6272;;;;", "linkedin": ";;;;", "or_profile": "~Jinyang_Jiang1;~Zeliang_Zhang1;~Chenliang_Xu1;~Zhaofei_Yu1;~Yijie_Peng1", "aff": "Peking University;Microsoft Research;University of Rochester;Peking University;", "aff_domain": "pku.edu.cn;research.microsoft.com;rochester.edu;pku.edu.cn;", "position": "PhD student;Intern;Associate Professor;Assistant Professor;", "bibtex": "@inproceedings{\njiang2024one,\ntitle={One Forward is Enough for Neural Network Training via Likelihood Ratio Method},\nauthor={Jinyang Jiang and Zeliang Zhang and Chenliang Xu and Zhaofei Yu and Yijie Peng},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=ALGFFPXWSi}\n}", "github": "", "project": "", "reviewers": "3HaG;s8CG;hjbZ;HFF5", "pdf_size": 971319, "rating": "6;6;8;8", "confidence": "2;4;3;3", "soundness": "2;3;4;4", "contribution": "2;3;3;3", "presentation": "2;3;4;3", "wc_summary": "141;179;87;123", "wc_strengths": "47;73;87;101", "wc_weaknesses": "97;129;69;188", "wc_questions": "159;285;21;137", "wc_review": "444;666;264;549", "wc_reply_reviewers": "392;73;0;394", "wc_reply_authors": "1506;1680;368;791", "reply_reviewers": "4;1;0;1", "reply_authors": "6;5;2;3", "rating_avg": [ 7.0, 1.0 ], "confidence_avg": [ 3.0, 0.7071067811865476 ], "soundness_avg": [ 3.25, 0.82915619758885 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 132.5, 33.14739808793444 ], "wc_strengths_avg": [ 77.0, 19.949937343260004 ], "wc_weaknesses_avg": [ 120.75, 44.25141240683737 ], "wc_questions_avg": [ 150.5, 93.69498385719483 ], "wc_review_avg": [ 480.75, 147.73857823872544 ], "wc_reply_reviewers_avg": [ 214.75, 180.11020931640715 ], "wc_reply_authors_avg": [ 1086.25, 531.9268629238422 ], "reply_reviewers_avg": [ 1.5, 1.5 ], "reply_authors_avg": [ 4.0, 1.5811388300841898 ], "replies_avg": [ 29, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 8, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6983145891460231622&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=ALGFFPXWSi", "pdf": "https://openreview.net/pdf?id=ALGFFPXWSi", "email": "pku.edu.cn;research.microsoft.com;rochester.edu;pku.edu.cn;", "author_num": 5, "aff_unique_index": "0;1;2;0", "aff_unique_norm": "Peking University;Microsoft;University of Rochester", "aff_unique_dep": ";Microsoft Research;", "aff_unique_url": "http://www.pku.edu.cn;https://www.microsoft.com/en-us/research;https://www.rochester.edu", 
"aff_unique_abbr": "Peking U;MSR;U of R", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;1;0", "aff_country_unique": "China;United States" }, { "title": "Coeditor: Leveraging Repo-level Diffs for Code Auto-editing", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19265", "id": "ALVwQjZRS8", "author_site": "Jiayi Wei, Greg Durrett, Isil Dillig", "tldr": "", "abstract": "Developers often dedicate significant time to maintaining and refactoring existing code. However, most prior work on generative models for code focuses solely on creating new code, overlooking the distinctive needs of editing existing code. In this work, we explore a multi-round code auto-editing setting, aiming to predict edits to a code region based on recent changes within the same codebase. Our model, Coeditor, is a fine-tuned language model specifically designed for code editing tasks. We represent code changes using a line diff format and employ static analysis to form large customized model contexts, ensuring the availability of appropriate information for prediction. We collect a code editing dataset from the commit histories of 1650 open-source Python projects for training and evaluation. In a simplified single-round, single-edit task, Coeditor significantly outperforms GPT-3.5 and SOTA open-source code completion models (bringing exact-match accuracy from 34.7 up to 60.4), demonstrating the benefits of incorporating editing history for code completion. In a multi-round, multi-edit setting, we observe substantial gains by iteratively conditioning on additional user edits. We have open-sourced our code, data, and model weights to encourage future research and have released a VSCode extension powered by our model for interactive IDE usage.", "keywords": "language model for code;editing;refactoring", "primary_area": "generative models", "supplementary_material": "/attachment/195f30db5399f6562d3051e183696313ace2ec05.zip", "author": "Jiayi Wei;Greg Durrett;Isil Dillig", "authorids": "~Jiayi_Wei2;~Greg_Durrett1;~Isil_Dillig1", "gender": "M;M;F", "homepage": "https://mrvplusone.github.io;http://www.cs.utexas.edu/~gdurrett/;https://www.cs.utexas.edu/~isil/", "dblp": ";69/7968;", "google_scholar": "fTJ8pY8AAAAJ;https://scholar.google.com.tw/citations?user=EpQ_sDEAAAAJ;", "orcid": ";;", "linkedin": ";;", "or_profile": "~Jiayi_Wei2;~Greg_Durrett1;~Isil_Dillig1", "aff": "Augment Computing;University of Texas at Austin;University of Texas, Austin", "aff_domain": "augmentcode.com;utexas.edu;utexas.edu", "position": "Researcher;Associate Professor;Associate Professor", "bibtex": "@inproceedings{\nwei2024coeditor,\ntitle={Coeditor: Leveraging Repo-level Diffs for Code Auto-editing},\nauthor={Jiayi Wei and Greg Durrett and Isil Dillig},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=ALVwQjZRS8}\n}", "github": "", "project": "", "reviewers": "vqdF;sVPE;ueao;Kf1h", "pdf_size": 6469199, "rating": "5;6;6;8", "confidence": "5;3;4;4", "soundness": "2;3;3;3", "contribution": "2;4;3;3", "presentation": "4;4;3;3", "wc_summary": "105;162;142;107", "wc_strengths": "102;40;65;44", "wc_weaknesses": "557;111;116;87", "wc_questions": "80;44;139;104", "wc_review": "844;357;462;342", "wc_reply_reviewers": "378;120;25;0", "wc_reply_authors": "1046;294;1017;250", "reply_reviewers": "1;1;1;0", "reply_authors": "2;1;2;1", "rating_avg": [ 6.25, 1.0897247358851685 ], "confidence_avg": [ 4.0, 
0.7071067811865476 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 3.0, 0.7071067811865476 ], "presentation_avg": [ 3.5, 0.5 ], "wc_summary_avg": [ 129.0, 24.072806234421446 ], "wc_strengths_avg": [ 62.75, 24.57005290999594 ], "wc_weaknesses_avg": [ 217.75, 196.17259620038678 ], "wc_questions_avg": [ 91.75, 34.64372237505664 ], "wc_review_avg": [ 501.25, 203.21586429213642 ], "wc_reply_reviewers_avg": [ 130.75, 149.6051051936397 ], "wc_reply_authors_avg": [ 651.75, 380.2067694031762 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.3244428422615251, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=2219570809759591003&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=ALVwQjZRS8", "pdf": "https://openreview.net/pdf?id=ALVwQjZRS8", "email": "augmentcode.com;utexas.edu;utexas.edu", "author_num": 3, "aff_unique_index": "0;1;1", "aff_unique_norm": "Augment Computing;University of Texas at Austin", "aff_unique_dep": ";", "aff_unique_url": ";https://www.utexas.edu", "aff_unique_abbr": ";UT Austin", "aff_campus_unique_index": "1;1", "aff_campus_unique": ";Austin", "aff_country_unique_index": "1;1", "aff_country_unique": ";United States" }, { "id": "AMCaG2TAeg", "title": "Causal Influence-Aware Counterfactual Data Augmentation", "track": "main", "status": "Reject", "tldr": "", "abstract": "Pre-recorded data and human-collected demonstrations are both valuable and practical resources for teaching robots complex behaviors.\nIdeally, learning agents should not be constrained by the scarcity of available demonstrations, but rather generalize to as many new situations as possible.\nHowever, the combinatorial nature of real-world scenarios typically requires a huge amount of data to prevent neural network policies from picking up on spurious and non-causal factors.\nWe propose CAIAC, a data augmentation method that can create feasible synthetic samples from a fixed dataset without the need to perform new environment interactions.\nMotivated by the fact that an agent may only modify the environment through its actions, we swap causally $\\textit{action}$-unaffected parts of the state-space from different observed trajectories in the dataset.\nIn high-dimensional benchmark environments, we observe an increase in generalization capabilities and sample efficiency.", "keywords": "deep reinforcement learning;data augmentation;learning from demonstrations;out-of-distribution generalization", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "N\u00faria Armengol Urp\u00ed;Georg Martius", "authorids": "~N\u00faria_Armengol_Urp\u00ed1;~Georg_Martius1", "gender": "F;M", "homepage": ";https://uni-tuebingen.de/de/264672", "dblp": ";47/2706", "google_scholar": "https://scholar.google.co.uk/citations?user=Cq6i6XwAAAAJ;https://scholar.google.de/citations?user=b-JF-UIAAAAJ", "orcid": ";", "linkedin": "nuriaarmengolurpi;", "or_profile": "~N\u00faria_Armengol_Urp\u00ed1;~Georg_Martius1", "aff": "ETHZ - ETH Zurich;Max Planck Institute for Intelligent Systems", "aff_domain": "ethz.ch;tuebingen.mpg.de", "position": "PhD student;Assistant Professor", "bibtex": "@misc{\nurp{\\'\\i}2024causal,\ntitle={Causal Influence-Aware Counterfactual Data Augmentation},\nauthor={N{\\'u}ria Armengol Urp{\\'\\i} and Georg 
Martius},\nyear={2024},\nurl={https://openreview.net/forum?id=AMCaG2TAeg}\n}", "github": "", "project": "", "reviewers": "LtoA;1iyX;GhVi", "site": "https://openreview.net/forum?id=AMCaG2TAeg", "pdf_size": 8146296, "rating": "3;5;5", "confidence": "4;3;3", "soundness": "2;3;2", "contribution": "2;1;2", "presentation": "3;2;3", "wc_summary": "149;64;71", "wc_strengths": "59;45;78", "wc_weaknesses": "480;544;168", "wc_questions": "263;22;53", "wc_review": "951;675;370", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "2405;1598;881", "reply_reviewers": "0;0;0", "reply_authors": "5;3;2", "rating_avg": [ 4.333333333333333, 0.9428090415820634 ], "confidence_avg": [ 3.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 1.6666666666666667, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 94.66666666666667, 38.5256047612782 ], "wc_strengths_avg": [ 60.666666666666664, 13.523641850067197 ], "wc_weaknesses_avg": [ 397.3333333333333, 164.25454500730126 ], "wc_questions_avg": [ 112.66666666666667, 107.05242744665915 ], "wc_review_avg": [ 665.3333333333334, 237.29072651262393 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 1628.0, 622.5319268921073 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 3.3333333333333335, 1.247219128924647 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.9999999999999998, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:zBA2vid52oUJ:scholar.google.com/&scioq=Causal+Influence-Aware+Counterfactual+Data+Augmentation&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1", "aff_unique_norm": "ETH Zurich;Max Planck Institute for Intelligent Systems", "aff_unique_dep": ";Intelligent Systems", "aff_unique_url": "https://www.ethz.ch;https://www.mpi-is.mpg.de", "aff_unique_abbr": "ETHZ;MPI-IS", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1", "aff_country_unique": "Switzerland;Germany" }, { "id": "AMDKqZcZbi", "title": "Rapid Learning without Catastrophic Forgetting in the Morris Water Maze", "track": "main", "status": "Reject", "tldr": "", "abstract": "Machine learning models typically struggle to swiftly adapt to novel tasks while maintaining proficiency on previously trained tasks. This contrasts starkly with animals, which demonstrate these capabilities easily. The differences between ML models and animals must stem from particular neural architectures and representations for memory and memory-policy interactions. We propose a new task that requires rapid and continual learning, the sequential Morris Water Maze (sWM). Drawing inspiration from biology, we show that 1) a content-addressable heteroassociative memory based on the entorhinal-hippocampal circuit with grid cells that retain knowledge across diverse environments, and 2) a spatially invariant convolutional network architecture for rapid adaptation across unfamiliar environments together perform rapid learning, good generalization, and continual learning without forgetting. Our model simultaneously outperforms ANN baselines from both the continual and few-shot learning contexts. 
It retains knowledge of past environments while rapidly acquiring the skills to navigate new ones, thereby addressing the seemingly opposing challenges of quick knowledge transfer and sustaining proficiency in previously learned tasks.", "keywords": "neuroscience;cognitive science;water maze;continual learning;catastrophic forgetting", "primary_area": "applications to neuroscience & cognitive science", "supplementary_material": "", "author": "Raymond Wang;Jaedong Hwang;Akhilan Boopathy;Ila R Fiete", "authorids": "~Raymond_Wang1;~Jaedong_Hwang1;~Akhilan_Boopathy1;~Ila_R_Fiete1", "gender": ";M;M;F", "homepage": ";https://jd730.github.io/;;https://fietelab.mit.edu/", "dblp": ";239/1982;230/8358;", "google_scholar": ";https://scholar.google.co.kr/citations?user=bITgqEUAAAAJ;;uE-CihIAAAAJ", "orcid": ";;;0000-0003-4738-2539", "linkedin": "raymond-w2/;;;", "or_profile": "~Raymond_Wang1;~Jaedong_Hwang1;~Akhilan_Boopathy1;~Ila_R_Fiete1", "aff": "University of California, Berkeley;Massachusetts Institute of Technology;Amazon;Massachusetts Institute of Technology", "aff_domain": "berkeley.edu;mit.edu;amazon.com;mit.edu", "position": "Undergrad student;PhD student;Intern;Professor", "bibtex": "@misc{\nwang2024rapid,\ntitle={Rapid Learning without Catastrophic Forgetting in the Morris Water Maze},\nauthor={Raymond Wang and Jaedong Hwang and Akhilan Boopathy and Ila R Fiete},\nyear={2024},\nurl={https://openreview.net/forum?id=AMDKqZcZbi}\n}", "github": "", "project": "", "reviewers": "KBVt;3WUm;ndgr;h9UH", "site": "https://openreview.net/forum?id=AMDKqZcZbi", "pdf_size": 5572537, "rating": "3;5;6;6", "confidence": "3;2;3;4", "soundness": "2;2;3;3", "contribution": "1;2;2;3", "presentation": "2;1;4;3", "wc_summary": "75;75;72;55", "wc_strengths": "9;72;66;36", "wc_weaknesses": "37;280;133;160", "wc_questions": "122;106;93;2", "wc_review": "243;533;364;253", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "357;770;905;541", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;2;1", "rating_avg": [ 5.0, 1.224744871391589 ], "confidence_avg": [ 3.0, 0.7071067811865476 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 2.5, 1.118033988749895 ], "wc_summary_avg": [ 69.25, 8.317902379807062 ], "wc_strengths_avg": [ 45.75, 25.222757581200355 ], "wc_weaknesses_avg": [ 152.5, 86.65015868421708 ], "wc_questions_avg": [ 80.75, 46.61209606958263 ], "wc_review_avg": [ 348.25, 116.75910028772918 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 643.25, 210.340646333513 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.28867513459481287, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=16521589547593330114&as_sdt=5,47&sciodt=0,47&hl=en", "gs_version_total": 5, "aff_unique_index": "0;1;2;1", "aff_unique_norm": "University of California, Berkeley;Massachusetts Institute of Technology;Amazon", "aff_unique_dep": ";;Amazon.com, Inc.", "aff_unique_url": "https://www.berkeley.edu;https://web.mit.edu;https://www.amazon.com", "aff_unique_abbr": "UC Berkeley;MIT;Amazon", "aff_campus_unique_index": "0", "aff_campus_unique": "Berkeley;", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "id": "AMivuI7Bnk", "title": "State-wise Constrained Policy Optimization", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Reinforcement Learning (RL) algorithms have shown 
tremendous success in simulation environments, but their application to real-world problems faces significant challenges, with safety being a major concern. In particular, enforcing state-wise constraints is essential for many challenging tasks such as autonomous driving and robot manipulation. However, existing safe RL algorithms under the framework of Constrained Markov Decision Process (CMDP) do not consider state-wise constraints. To address this gap, we propose State-wise Constrained Policy Optimization (SCPO), the first general-purpose policy search algorithm for state-wise constrained reinforcement learning. SCPO provides guarantees for state-wise constraint satisfaction in expectation. In particular, we introduce the framework of Maximum Markov Decision Process, and prove that the worst-case safety violation is bounded under SCPO. We demonstrate the effectiveness of our approach on training neural network policies for extensive robot locomotion tasks, where the agent must satisfy a variety of state-wise safety constraints. Our results show that SCPO significantly outperforms existing methods and can handle state-wise constraints in high-dimensional robotics tasks.", "keywords": "Safe Reinforcement Learning;State-wise Safety Guarantee;Trust Region Optimization", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/293250a7998d5139e445399979e677c4e2d85462.zip", "author": "Weiye Zhao;Rui Chen;Yifan Sun;Feihan Li;Tianhao Wei;Changliu Liu", "authorids": "~Weiye_Zhao1;~Rui_Chen11;~Yifan_Sun9;~Feihan_Li1;~Tianhao_Wei1;~Changliu_Liu1", "gender": "M;M;M;M;M;F", "homepage": "https://github.com/CaesarAndylaw;https://ruichen.pub/;https://yifansun98.github.io/;;;http://www.cs.cmu.edu/~cliu6/index.html", "dblp": "228/6863;;99/10261-11;;222/5386;166/3563", "google_scholar": "P-79KOcAAAAJ;XiUE0wMAAAAJ;DGhQSYUAAAAJ;;V22j1C0AAAAJ;", "orcid": "0000-0002-8426-5238;0000-0002-8671-8771;0009-0007-2073-7789;0000-0003-1770-4664;;", "linkedin": ";;yifansun1/;;;", "or_profile": "~Weiye_Zhao1;~Rui_Chen11;~Yifan_Sun9;~Feihan_Li1;~Tianhao_Wei1;~Changliu_Liu1", "aff": "Carnegie Mellon University;Carnegie Mellon University;Carnegie Mellon University;Tsinghua University;Carnegie Mellon University;Carnegie Mellon University", "aff_domain": "andrew.cmu.edu;andrew.cmu.edu;andrew.cmu.edu;tsinghua.edu.cn;andrew.cmu.edu;cmu.edu", "position": "PhD student;PhD student;PhD student;Undergrad student;PhD student;Assistant Professor", "bibtex": "@misc{\nzhao2024statewise,\ntitle={State-wise Constrained Policy Optimization},\nauthor={Weiye Zhao and Rui Chen and Yifan Sun and Feihan Li and Tianhao Wei and Changliu Liu},\nyear={2024},\nurl={https://openreview.net/forum?id=AMivuI7Bnk}\n}", "github": "", "project": "", "reviewers": "VGHE;bUD6;A4Kd", "site": "https://openreview.net/forum?id=AMivuI7Bnk", "pdf_size": 11387510, "rating": "3;3;8", "confidence": "4;3;3", "soundness": "3;2;3", "contribution": "2;1;2", "presentation": "2;2;3", "wc_summary": "51;122;79", "wc_strengths": "70;180;30", "wc_weaknesses": "158;201;31", "wc_questions": "36;363;36", "wc_review": "315;866;176", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 4.666666666666667, 2.357022603955158 ], "confidence_avg": [ 3.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 1.6666666666666667, 0.4714045207910317 ], "presentation_avg": [ 2.3333333333333335, 0.4714045207910317 ], 
"wc_summary_avg": [ 84.0, 29.20045661743437 ], "wc_strengths_avg": [ 93.33333333333333, 63.42099196813483 ], "wc_weaknesses_avg": [ 130.0, 72.17109301283075 ], "wc_questions_avg": [ 145.0, 154.14927829866735 ], "wc_review_avg": [ 452.3333333333333, 297.96010172877544 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 3, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.5000000000000001, "gs_citation": 11, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=1975768402285703586&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "aff_unique_index": "0;0;0;1;0;0", "aff_unique_norm": "Carnegie Mellon University;Tsinghua University", "aff_unique_dep": ";", "aff_unique_url": "https://www.cmu.edu;https://www.tsinghua.edu.cn", "aff_unique_abbr": "CMU;THU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;1;0;0", "aff_country_unique": "United States;China" }, { "id": "AN5uo4ByWH", "title": "Curve Your Attention: Mixed-Curvature Transformers for Graph Representation Learning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Real-world graphs naturally exhibit hierarchical trees and cyclic structures that are unfit for the typical Euclidean space. While there exist graph neural networks that utilize hyperbolic or spherical spaces towards embedding such structures more accurately, these methods are confined under the message-passing paradigm, making them vulnerable against side-effects such as oversmoothing and oversquashing. More recent work have proposed global attention-based graph Transformers that can alleviate such drawbacks and easily model long-range interactions, but their extensions towards non-Euclidean geometry are yet unexplored. To bridge this gap, we propose Fully Product-Stereographic Transformer, a generalization of Transformers towards operating entirely on the product of constant curvature spaces. When combined with tokenized graph Transformers, our model can learn the curvature appropriate for the input graph in an end-to-end fashion, without any additional tuning on different curvature initializations. We also provide a kernelized approach to non-Euclidean attention, which enables our model to run with computational cost linear to the number of nodes and edges while respecting the underlying geometry. 
Experiments on graph reconstruction and node classification demonstrate the benefits of generalizing Transformers to the non-Euclidean domain.", "keywords": "Non-Euclidean Geometry;Product-Stereographic Space;Transformers", "primary_area": "learning on graphs and other geometries & topologies", "supplementary_material": "/attachment/ad32c9985e6772b7ce2864b91399ef9420469d8d.zip", "author": "Sungjun Cho;Seunghyuk Cho;Sungwoo Park;Hankook Lee;Honglak Lee;Moontae Lee", "authorids": "~Sungjun_Cho1;~Seunghyuk_Cho1;~Sungwoo_Park3;~Hankook_Lee1;~Honglak_Lee2;~Moontae_Lee1", "gender": "M;M;M;;M;M", "homepage": "https://sc782.github.io/;https://seunghyukcho.github.io;https://hankook.github.io;https://moontae.people.uic.edu;http://web.eecs.umich.edu/~honglak;", "dblp": "254/8021;284/8079;223/4393;132/1761;58/2562;92/6585", "google_scholar": "https://scholar.google.com/citations?hl=en;4OOM9_cAAAAJ;CgqswXUAAAAJ;BMvYy9cAAAAJ;fmSHtE8AAAAJ;B1xpjO8AAAAJ", "orcid": ";0000-0002-9124-2712;;0000-0001-5542-3463;;", "linkedin": "sungjun-cho-46982411a/;4stack/;;moontae-lee-975248123/;;", "or_profile": "~Sungjun_Cho1;~Seunghyuk_Cho1;~Hankook_Lee1;~Moontae_Lee1;~Honglak_Lee1;~Sung_Woo_Park2", "aff": "LG AI Research;Pohang University of Science and Technology;LG AI Research;University of Illinois, Chicago;LG AI Research;University of California, Berkeley", "aff_domain": "lgresearch.ai;postech.ac.kr;lgresearch.ai;uic.edu;lgresearch.ai;berkeley.edu", "position": "Researcher;PhD student;Researcher;Assistant Professor;Chief Scientist;Postdoc", "bibtex": "@misc{\ncho2024curve,\ntitle={Curve Your Attention: Mixed-Curvature Transformers for Graph Representation Learning},\nauthor={Sungjun Cho and Seunghyuk Cho and Sungwoo Park and Hankook Lee and Honglak Lee and Moontae Lee},\nyear={2024},\nurl={https://openreview.net/forum?id=AN5uo4ByWH}\n}", "github": "", "project": "", "reviewers": "g83M;c5LD;Wzei", "site": "https://openreview.net/forum?id=AN5uo4ByWH", "pdf_size": 1349155, "rating": "1;5;5", "confidence": "5;4;4", "soundness": "2;3;2", "contribution": "1;3;2", "presentation": "2;3;3", "wc_summary": "48;88;122", "wc_strengths": "27;28;77", "wc_weaknesses": "220;154;537", "wc_questions": "50;88;29", "wc_review": "345;358;765", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 3.6666666666666665, 1.8856180831641267 ], "confidence_avg": [ 4.333333333333333, 0.4714045207910317 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.816496580927726 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 86.0, 30.243456592570013 ], "wc_strengths_avg": [ 44.0, 23.338094752285727 ], "wc_weaknesses_avg": [ 303.6666666666667, 167.17721801197143 ], "wc_questions_avg": [ 55.666666666666664, 24.417662095749915 ], "wc_review_avg": [ 489.3333333333333, 194.99800568780756 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.9999999999999998, "gs_citation": 6, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=15592352316861997658&as_sdt=80000005&sciodt=0,23&hl=en", "gs_version_total": 3, "aff_unique_index": "0;1;0;2;0;3", "aff_unique_norm": "LG;Pohang University of Science and Technology;University of Illinois at Chicago;University of California, Berkeley", "aff_unique_dep": "LG AI Research;;;", "aff_unique_url": 
"https://www.lgaires.com;https://www.postech.ac.kr;https://www.uic.edu;https://www.berkeley.edu", "aff_unique_abbr": "LG AI;POSTECH;UIC;UC Berkeley", "aff_campus_unique_index": "1;2;3", "aff_campus_unique": ";Pohang;Chicago;Berkeley", "aff_country_unique_index": "0;0;0;1;0;1", "aff_country_unique": "South Korea;United States" }, { "id": "ANJxbH4eQQ", "title": "Beyond the training set: an intuitive method for detecting distribution shift in model-based optimization", "track": "main", "status": "Reject", "tldr": "", "abstract": "Model-based optimization (MBO) is increasingly applied to design problems in science and engineering. A common scenario involves using a fixed training set to train models, with the goal of designing new samples that outperform those present in the training data. A major challenge in this setting is distribution shift, where the distributions of training and designed samples are different. While some shift is expected, as the goal is to create better designs, this change can negatively affect model accuracy and subsequently, design quality. Despite the widespread nature of this problem, addressing it demands deep domain knowledge and artful application. To tackle this issue, we propose a straightforward method for design practitioners that detects distribution shifts. This method trains a binary classifier using knowledge of the unlabeled design distribution to separate the training data from the design data. The classifier\u2019s logit scores are then used as a proxy measure of distribution shift. We validate our method in a real-world application by running offline MBO and evaluate the effect of distribution shift on design quality. We find the intensity of the shift in the design distribution varies based on the number of steps taken by the optimization algorithm, and our simple approach identifies these shifts. 
This enables users to constrain their search to regions where the model's predictions are reliable, thereby increasing the quality of designs.", "keywords": "protein engineering;sequence design;model-based optimization;distribution shift", "primary_area": "applications to physical sciences (physics, chemistry, biology, etc.)", "supplementary_material": "", "author": "Farhan Damani;David H Brookes;Theodore Sternlieb;Cameron Webster;Stephen Malina;Rishi Jajoo;Kathy Lin;Sam Sinai", "authorids": "~Farhan_Damani1;~David_H_Brookes1;~Theodore_Sternlieb1;~Cameron_Webster1;~Stephen_Malina1;~Rishi_Jajoo1;~Kathy_Lin1;~Sam_Sinai1", "gender": ";;M;M;;M;;M", "homepage": "http://fdamani.com;;;;https://stephenmalina.com/;;;", "dblp": ";;;;;;;", "google_scholar": ";;;;https://scholar.google.com/citations?hl=en;;;4k0EcsIAAAAJ", "orcid": ";;;;;;;", "linkedin": ";;theodore-sternlieb/;cameron-webster-25a5955a/;;rishi-jajoo-3166166;kathy-lin-05093254/;sam-sinai-710a0221/", "or_profile": "~Farhan_Damani1;~David_H_Brookes1;~Theodore_Sternlieb1;~Cameron_Webster1;~Stephen_Malina1;~Rishi_Jajoo1;~Kathy_Lin1;~Sam_Sinai1", "aff": "Dyno Therapeutics;;;Dyno Therapeutics;;;Dyno Therapeutics;Dyno Therapeutics", "aff_domain": "dynotx.com;;;dynotx.com;;;dynotx.com;dynotx.com", "position": "Researcher;;;Researcher;;;Researcher;Principal Researcher", "bibtex": "@misc{\ndamani2024beyond,\ntitle={Beyond the training set: an intuitive method for detecting distribution shift in model-based optimization},\nauthor={Farhan Damani and David H Brookes and Theodore Sternlieb and Cameron Webster and Stephen Malina and Rishi Jajoo and Kathy Lin and Sam Sinai},\nyear={2024},\nurl={https://openreview.net/forum?id=ANJxbH4eQQ}\n}", "github": "", "project": "", "reviewers": "a8tv;6Sc3;nQCc;jVj2;SeaM", "site": "https://openreview.net/forum?id=ANJxbH4eQQ", "pdf_size": 7382108, "rating": "3;5;6;6;6", "confidence": "5;3;4;3;3", "soundness": "2;2;3;3;4", "contribution": "2;2;2;2;3", "presentation": "2;3;3;3;4", "wc_summary": "104;62;179;88;123", "wc_strengths": "43;116;25;17;74", "wc_weaknesses": "263;123;180;2;61", "wc_questions": "290;55;24;79;86", "wc_review": "700;356;408;186;344", "wc_reply_reviewers": "585;0;279;0;0", "wc_reply_authors": "2125;1181;953;603;1253", "reply_reviewers": "2;0;3;0;0", "reply_authors": "5;3;3;2;3", "rating_avg": [ 5.2, 1.16619037896906 ], "confidence_avg": [ 3.6, 0.8 ], "soundness_avg": [ 2.8, 0.7483314773547882 ], "contribution_avg": [ 2.2, 0.39999999999999997 ], "presentation_avg": [ 3.0, 0.6324555320336759 ], "wc_summary_avg": [ 111.2, 39.36191052273759 ], "wc_strengths_avg": [ 55.0, 36.24913792078372 ], "wc_weaknesses_avg": [ 125.8, 90.87882041487994 ], "wc_questions_avg": [ 106.8, 94.13479696690271 ], "wc_review_avg": [ 398.8, 167.8837693167508 ], "wc_reply_reviewers_avg": [ 172.8, 232.70874500112797 ], "wc_reply_authors_avg": [ 1223.0, 504.6915889927234 ], "reply_reviewers_avg": [ 1.0, 1.2649110640673518 ], "reply_authors_avg": [ 3.2, 0.9797958971132712 ], "replies_avg": [ 29, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": -0.7717436331412899, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10987622068086027041&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "Dyno Therapeutics", "aff_unique_dep": "", "aff_unique_url": "https://www.dynotherapeutics.com", "aff_unique_abbr": "", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { 
"id": "ANK10b0sp9", "title": "Generalization error bounds for iterative learning algorithms with bounded updates", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "This paper explores the generalization characteristics of iterative learning algorithms with bounded updates for non-convex loss functions, employing information-theoretic techniques. Our key contribution is a novel bound for the generalization error of these algorithms with bounded updates. Our approach introduces two main novelties: 1) we reformulate the mutual information as the uncertainty of updates, providing a new perspective, and 2) instead of using the chaining rule of mutual information, we employ a variance decomposition technique to decompose information across iterations, allowing for a simpler surrogate process. We analyze our generalization bound under various settings and demonstrate improved bounds. To bridge the gap between theory and practice, we also examine the previously observed scaling behavior in large language models. Ultimately, our work takes a further step for developing practical generalization theories.", "keywords": "Information theory; generalization bounds; learning algorithm", "primary_area": "learning theory", "supplementary_material": "", "author": "Jingwen Fu;Nanning Zheng", "authorids": "~Jingwen_Fu1;~Nanning_Zheng1", "gender": "M;M", "homepage": "https://www.jw-fu.cn/;", "dblp": "247/5290;07/256-1", "google_scholar": ";https://scholar.google.com/citations?hl=zh-CN", "orcid": ";", "linkedin": ";", "or_profile": "~Jingwen_Fu1;~Nanning_Zheng1", "aff": "Microsoft;Xi'an Jiaotong University", "aff_domain": "microsoft.com;xjtu.edu.cn", "position": "Intern;Full Professor", "bibtex": "@misc{\nfu2024generalization,\ntitle={Generalization error bounds for iterative learning algorithms with bounded updates},\nauthor={Jingwen Fu and Nanning Zheng},\nyear={2024},\nurl={https://openreview.net/forum?id=ANK10b0sp9}\n}", "github": "", "project": "", "reviewers": "j93d;UUy1;QX9v;BS2q", "site": "https://openreview.net/forum?id=ANK10b0sp9", "pdf_size": 404840, "rating": "3;3;3;6", "confidence": "4;3;5;4", "soundness": "2;2;3;3", "contribution": "1;2;2;2", "presentation": "3;2;2;3", "wc_summary": "93;20;51;112", "wc_strengths": "28;20;18;68", "wc_weaknesses": "216;77;245;29", "wc_questions": "119;14;106;78", "wc_review": "456;131;420;287", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 3.75, 1.299038105676658 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 69.0, 35.88175023601831 ], "wc_strengths_avg": [ 33.5, 20.266968199511243 ], "wc_weaknesses_avg": [ 141.75, 90.93782216437779 ], "wc_questions_avg": [ 79.25, 40.48070528041724 ], "wc_review_avg": [ 323.5, 127.72724846327819 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14415402670218393217&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "aff_unique_index": "0;1", "aff_unique_norm": "Microsoft;Xi'an Jiao Tong University", "aff_unique_dep": "Microsoft Corporation;", "aff_unique_url": "https://www.microsoft.com;https://www.xjtu.edu.cn", "aff_unique_abbr": 
"Microsoft;XJTU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1", "aff_country_unique": "United States;China" }, { "title": "Generalization in diffusion models arises from geometry-adaptive harmonic representations", "status": "Oral", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19264", "id": "ANvmVS2Yr0", "author_site": "Zahra Kadkhodaie, Florentin Guth, Eero Simoncelli, St\u00e9phane Mallat", "tldr": "", "abstract": "Deep neural networks (DNNs) trained for image denoising are able to generate high-quality samples with score-based reverse diffusion algorithms. These impressive capabilities seem to imply an escape from the curse of dimensionality, but recent reports of memorization of the training set raise the question of whether these networks are learning the \"true\" continuous density of the data. Here, we show that two DNNs trained on non-overlapping subsets of a dataset learn nearly the same score function, and thus the same density, when the number of training images is large enough. In this regime of strong generalization, diffusion-generated images are distinct from the training set, and are of high visual quality, suggesting that the inductive biases of the DNNs are well-aligned with the data density. We analyze the learned denoising functions and show that the inductive biases give rise to a shrinkage operation in a basis adapted to the underlying image. Examination of these bases reveals oscillating harmonic structures along contours and in homogeneous regions. We demonstrate that trained denoisers are inductively biased towards these geometry-adaptive harmonic bases since they arise not only when the network is trained on photographic images, but also when it is trained on image classes supported on low-dimensional manifolds for which the harmonic basis is suboptimal. 
Finally, we show that when trained on regular image classes for which the optimal basis is known to be geometry-adaptive and harmonic, the denoising performance of the networks is near-optimal.", "keywords": "diffusion models;memorization;generalization;inductive bias;curse of dimensionality;denoising;geometry-adaptive harmonic basis", "primary_area": "generative models", "supplementary_material": "", "author": "Zahra Kadkhodaie;Florentin Guth;Eero P Simoncelli;St\u00e9phane Mallat", "authorids": "~Zahra_Kadkhodaie1;~Florentin_Guth1;~Eero_P_Simoncelli1;~St\u00e9phane_Mallat1", "gender": "F;;M;M", "homepage": ";;https://www.di.ens.fr/~mallat/;https://www.cns.nyu.edu/~eero/", "dblp": "243/3303;223/6081;61/3978;30/5604", "google_scholar": "_b5JdjYAAAAJ;opC_fpQAAAAJ;https://scholar.google.com.tw/citations?user=g_YTmSgAAAAJ;MplR7_cAAAAJ", "orcid": ";;;0000-0002-1206-527X", "linkedin": ";;;eero-simoncelli-445782123", "or_profile": "~Zahra_Kadkhodaie1;~Florentin_Guth1;~St\u00e9phane_Mallat1;~Eero_Peter_Simoncelli1", "aff": "Flatiron Institute;Simons Foundation;;New York University", "aff_domain": "flatironinstitute.org;simonsfoundation.org;;nyu.edu", "position": "Postdoc;Postdoc;;Full Professor", "bibtex": "@inproceedings{\nkadkhodaie2024generalization,\ntitle={Generalization in diffusion models arises from geometry-adaptive harmonic representations},\nauthor={Zahra Kadkhodaie and Florentin Guth and Eero P Simoncelli and St{\\'e}phane Mallat},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=ANvmVS2Yr0}\n}", "github": "", "project": "", "reviewers": "89Fo;SQqg;rH4m;4Rws", "pdf_size": 6910937, "rating": "8;8;8;10", "confidence": "4;4;3;4", "soundness": "3;3;4;4", "contribution": "3;3;4;4", "presentation": "3;4;4;4", "wc_summary": "94;250;238;106", "wc_strengths": "74;169;183;54", "wc_weaknesses": "31;47;85;9", "wc_questions": "1;15;239;178", "wc_review": "200;481;745;347", "wc_reply_reviewers": "0;0;48;4", "wc_reply_authors": "59;61;435;75", "reply_reviewers": "0;0;1;1", "reply_authors": "1;1;1;1", "rating_avg": [ 8.5, 0.8660254037844386 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 3.5, 0.5 ], "contribution_avg": [ 3.5, 0.5 ], "presentation_avg": [ 3.75, 0.4330127018922193 ], "wc_summary_avg": [ 172.0, 72.24956747275377 ], "wc_strengths_avg": [ 120.0, 56.66127425323225 ], "wc_weaknesses_avg": [ 43.0, 27.748873851023216 ], "wc_questions_avg": [ 108.25, 102.66298018273189 ], "wc_review_avg": [ 443.25, 200.56965747590039 ], "wc_reply_reviewers_avg": [ 13.0, 20.273134932713294 ], "wc_reply_authors_avg": [ 157.5, 160.3332467082233 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.3333333333333333, "gs_citation": 96, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11172769844580195677&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 8, "openreview": "https://openreview.net/forum?id=ANvmVS2Yr0", "pdf": "https://openreview.net/pdf?id=ANvmVS2Yr0", "email": "flatironinstitute.org;simonsfoundation.org;;nyu.edu", "author_num": 4, "aff_unique_index": "0;1;2", "aff_unique_norm": "Flatiron Institute;Simons Foundation;New York University", "aff_unique_dep": ";;", "aff_unique_url": "https://flatironinstitute.org;https://www.simonsfoundation.org;https://www.nyu.edu", "aff_unique_abbr": "Flatiron;Simons Foundation;NYU", "aff_campus_unique_index": "", "aff_campus_unique": "", 
"aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "title": "OpenChat: Advancing Open-source Language Models with Mixed-Quality Data", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19263", "id": "AOJyfhWYHf", "author_site": "Guan Wang, Sijie Cheng, Xianyuan Zhan, Xiangang Li, Sen Song, Yang Liu", "tldr": "", "abstract": "Nowadays, open-source large language models like LLaMA have emerged. Recent developments have incorporated supervised fine-tuning (SFT) and reinforcement learning fine-tuning (RLFT) to align these models with human goals. However, SFT methods treat all training data with mixed quality equally, while RLFT methods require high-quality pairwise or ranking-based preference data. In this study, we present a novel framework, named OpenChat, to advance open-source language models with mixed-quality data. Specifically, we consider the general SFT training data, consisting of a small amount of expert data mixed with a large proportion of sub-optimal data, without any preference labels. We propose the C(onditioned)-RLFT, which regards different data sources as coarse-grained reward labels and learns a class-conditioned policy to leverage complementary data quality information. Interestingly, the optimal policy in C-RLFT can be easily solved through single-stage, RL-free supervised learning, which is lightweight and avoids costly human preference labeling.\nThrough extensive experiments on three standard benchmarks, our openchat-13b fine-tuned with C-RLFT achieves the highest average performance among all 13b open-source language models. Moreover, we use AGIEval to validate the model generalization performance, in which only openchat-13b surpasses the base model. Finally, we conduct a series of analyses to shed light on the effectiveness and robustness of OpenChat. 
Our code, data, and models are publicly available at https://github.com/imoneoi/openchat and https://huggingface.co/openchat.", "keywords": "Open-source Language Models;Fine-tuning;Mixed-quality Data", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/ba82bf0464fce3f6226fc5890f5b6949478ddae3.zip", "author": "Guan Wang;Sijie Cheng;Xianyuan Zhan;Xiangang Li;Sen Song;Yang Liu", "authorids": "~Guan_Wang3;~Sijie_Cheng1;~Xianyuan_Zhan1;~Xiangang_Li1;~Sen_Song1;~Yang_Liu19", "gender": ";F;M;M;M;M", "homepage": ";https://adacheng.github.io/;http://zhanxianyuan.xyz/;;https://brain.tsinghua.edu.cn/en/info/1010/1012.htm;http://nlp.csai.tsinghua.edu.cn/~ly/", "dblp": ";160/7320;181/5081;124/9046;33/3456;51/3710-5", "google_scholar": ";pruwctkAAAAJ;pDMnGloAAAAJ;;cYgtRP4AAAAJ;https://scholar.google.com.hk/citations?user=lVhoKNcAAAAJ", "orcid": ";;0000-0002-3683-0554;;0000-0001-5587-0730;0000-0002-3087-242X", "linkedin": ";;;;;", "or_profile": "~Guan_Wang3;~Sijie_Cheng1;~Xianyuan_Zhan1;~Xiangang_Li1;~Sen_Song1;~Yang_Liu19", "aff": ";Tsinghua University;Tsinghua University;;;Tsinghua University", "aff_domain": ";mails.tsinghua.edu.cn;tsinghua.edu.cn;;;tsinghua.edu.cn", "position": ";PhD student;Associate Professor;;;Professor", "bibtex": "@inproceedings{\nwang2024openchat,\ntitle={OpenChat: Advancing Open-source Language Models with Mixed-Quality Data},\nauthor={Guan Wang and Sijie Cheng and Xianyuan Zhan and Xiangang Li and Sen Song and Yang Liu},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=AOJyfhWYHf}\n}", "github": "", "project": "", "reviewers": "g6Xd;yFnS;U8fK;QA7s", "pdf_size": 1454850, "rating": "6;6;6;6", "confidence": "3;3;3;4", "soundness": "3;2;3;4", "contribution": "3;3;2;3", "presentation": "3;3;4;3", "wc_summary": "51;85;91;73", "wc_strengths": "75;54;161;42", "wc_weaknesses": "111;232;94;23", "wc_questions": "76;209;31;52", "wc_review": "313;580;377;190", "wc_reply_reviewers": "15;240;0;0", "wc_reply_authors": "764;1767;874;803", "reply_reviewers": "1;2;0;0", "reply_authors": "2;7;2;2", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 75.0, 15.297058540778355 ], "wc_strengths_avg": [ 83.0, 46.55641738793912 ], "wc_weaknesses_avg": [ 115.0, 75.18310980532794 ], "wc_questions_avg": [ 92.0, 69.40100863820352 ], "wc_review_avg": [ 365.0, 141.1541710329525 ], "wc_reply_reviewers_avg": [ 63.75, 101.9420791430114 ], "wc_reply_authors_avg": [ 1052.0, 414.6848200742342 ], "reply_reviewers_avg": [ 0.75, 0.82915619758885 ], "reply_authors_avg": [ 3.25, 2.165063509461097 ], "replies_avg": [ 23, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 232, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=16578751109969287542&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=AOJyfhWYHf", "pdf": "https://openreview.net/pdf?id=AOJyfhWYHf", "email": ";mails.tsinghua.edu.cn;tsinghua.edu.cn;;;tsinghua.edu.cn", "author_num": 6, "aff_unique_index": "0;0;0", "aff_unique_norm": "Tsinghua University", "aff_unique_dep": "", "aff_unique_url": "https://www.tsinghua.edu.cn", "aff_unique_abbr": "THU", "aff_campus_unique_index": "", "aff_campus_unique": "", 
"aff_country_unique_index": "0;0;0", "aff_country_unique": "China" }, { "id": "AOSsLRKQrX", "title": "DisFormer: Disentangled Object Representations for Learning Visual Dynamics Via Transformers", "track": "main", "status": "Reject", "tldr": "", "abstract": "We focus on the task of visual dynamics prediction. Recent work has shown that object-centric representations can greatly help improve the accuracy of learning such dynamics in an unsupervised way. Building on top of this work, we ask the question: would it help to learn disentangled object representations, possibly separating the attributes which contribute to the motion dynamics vs which don\u2019t? Though there is some prior work which aims to achieve this, we argue in this paper either it is limiting in their setting, or does not use the learned representation explicitly for predicting visual dynamics, making them sub-optimal. In response, we propose DisFormer, an approach for learning disentangled object representation and use them for predicting visual dynamics. Our architecture extends the notion of slots Locatello et al. (2020) to taking attention over individual objectrepresentations: each slot learns the representation for a block by attending over different parts of an object, and each block is expressed as a linear combination\nover a small set of learned concepts. We perform an iterative refinement over\nthese slots to extract a disentangled representation, which is then fed to a trans-\nformer architecture to predict the next set of latent object representations. Since\nour loss is unsupervised, we need to align the output object masks with those ex-\ntracted from the ground truth image, and we design a novel permutation module\nto achieve this alignment by learning a canonical ordering. We perform a series\nof experiments demonstrating that our learned representations help predict future\ndynamics in the standard setting, where we test on the same environment as train-\ning, and in the setting of transfer, where certain object combinations are never\nseen before. Our method outperforms existing baselines in terms of\npixel prediction and deciphering the dynamics, especially in the zero-shot transfer\nsetting where existing approaches fail miserably. 
Further analysis reveals that our\nlearned representations indeed help with significantly better disentanglement of\nobjects compared to existing techniques.", "keywords": "Unsupervised Visual dynamics prediction;object centric representation;disentangled representation", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Sanket Sanjaykumar Gandhi;Vishal Sharma;Rushil Gupta;Arnab Kumar Mondal;Samanyu Mahajan;Parag Singla", "authorids": "~Sanket_Sanjaykumar_Gandhi1;~Vishal_Sharma1;~Rushil_Gupta1;~Arnab_Kumar_Mondal2;mahajansamanyu@gmail.com;~Parag_Singla1", "gender": "M;M;M;M;;M", "homepage": "https://github.com/sanky29;https://www.cse.iitd.ac.in/~vsharma/;;;;http://www.cse.iitd.ac.in/~parags", "dblp": "382/4942;;;;;14/167", "google_scholar": "https://scholar.google.de/citations?hl=en;HBxIco0AAAAJ;EjrTb2wAAAAJ;MZ8N49AAAAAJ;;https://scholar.google.co.in/citations?user=V49BsgMAAAAJ", "orcid": ";;0009-0006-1402-0426;0000-0001-7297-374X;;", "linkedin": "sanketgandhi29/;;rusgupta/;arnab-mondal-a4448a18/;;", "or_profile": "~Sanket_Sanjaykumar_Gandhi1;~Vishal_Sharma1;~Rushil_Gupta1;~Arnab_Kumar_Mondal2;mahajansamanyu@gmail.com;~Parag_Singla1", "aff": "Indian Institute of Technology, Delhi;Indian Institute of Technology Delhi;Universit\u00e9 de Montr\u00e9al;Fujitsu Research and Development Center Co. Ltm.;;Indian Institute of Technology, Delhi", "aff_domain": "iitd.ac.in;iitd.ac.in;umontreal.ca;fujitsu.com;;iitd.ac.in", "position": "PhD student;PhD student;MS student;Researcher;;Full Professor", "bibtex": "@misc{\ngandhi2024disformer,\ntitle={DisFormer: Disentangled Object Representations for Learning Visual Dynamics Via Transformers},\nauthor={Sanket Sanjaykumar Gandhi and Vishal Sharma and Rushil Gupta and Arnab Kumar Mondal and Samanyu Mahajan and Parag Singla},\nyear={2024},\nurl={https://openreview.net/forum?id=AOSsLRKQrX}\n}", "github": "", "project": "", "reviewers": "M2hR;gVGK;987R;HX9L", "site": "https://openreview.net/forum?id=AOSsLRKQrX", "pdf_size": 1414108, "rating": "3;3;3;5", "confidence": "3;4;3;4", "soundness": "2;3;2;3", "contribution": "2;2;2;3", "presentation": "3;2;2;2", "wc_summary": "88;99;251;112", "wc_strengths": "54;47;39;100", "wc_weaknesses": "184;186;701;133", "wc_questions": "9;145;37;717", "wc_review": "335;477;1028;1062", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "58;379;551;295", "reply_reviewers": "0;0;0;0", "reply_authors": "1;2;3;3", "rating_avg": [ 3.5, 0.8660254037844386 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 137.5, 66.07760588883347 ], "wc_strengths_avg": [ 60.0, 23.695991222145572 ], "wc_weaknesses_avg": [ 301.0, 231.91485506538817 ], "wc_questions_avg": [ 227.0, 287.42303317584 ], "wc_review_avg": [ 725.5, 323.64370842023175 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 320.75, 177.55896907788127 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 2.25, 0.82915619758885 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.5773502691896257, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=8213910590279793768&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 0, "aff_unique_index": "0;0;1;2;0", "aff_unique_norm": "Indian Institute of Technology Delhi;Universit\u00e9 de Montr\u00e9al;Fujitsu Research and Development Center", 
"aff_unique_dep": ";;Research and Development", "aff_unique_url": "https://www.iitdelhi.ac.in;https://www.umontreal.ca;https://www.fujitsu.com/global/", "aff_unique_abbr": "IIT Delhi;UdeM;Fujitsu R&D", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Delhi;", "aff_country_unique_index": "0;0;1;2;0", "aff_country_unique": "India;Canada;Japan" }, { "id": "AOpJ3vPNu8", "title": "A Game Theoretic Approach to Meta-Learning: Nash Model-Agnostic Meta-Learning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Meta-learning, or learning to learn, aims to develop algorithms that can quickly adapt to new tasks and environments. Model-agnostic meta-learning (MAML), proposed as a bi-level optimization problem, is widely used as a baseline for gradient-based meta-learning algorithms that learn meta-parameters. In MAML, task-specific parameters are adapted independently in the inner-loop. After learning the task-specific parameters, the meta-parameters are learned in the outer-loop by minimizing the average task loss. After MAML, some gradient-based meta-learning research has explored objectives beyond average task losses, such as minimizing worst-case task losses for risk management and improving zero-shot performance in unadaptable environments. However, if the purpose of learning meta-parameters changes, the inner-loop formulation must change accordingly. Therefore, we propose a novel gradient-based meta-learning framework that imposes joint strategy sets and utility functions among tasks, making each task affected by other tasks. To solve this complex problem, we first show the proposed framework can be formulated as a generalized Stackelberg game. After that, we propose the NashMAML algorithm to compute the generalized Stackelberg equilibrium of this model and theoretically prove its convergence. We validate our approach on sinusoidal regression and few-shot image classification tasks. 
The results demonstrate that our approach outperforms previous methods in handling few-shot learning problems.", "keywords": "Meta learning;Game Theory;Generalized Stackelberg Equilibrium", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "/attachment/9129609b581da5b697389ab759cd0efb9cc84657.zip", "author": "Jihwan Yu;Jaeyeon Jo;Taeyoung Yun;Jinkyoo Park", "authorids": "~Jihwan_Yu1;~Jaeyeon_Jo1;~Taeyoung_Yun1;~Jinkyoo_Park1", "gender": "M;M;M;M", "homepage": ";;https://dbsxodud-11.github.io;http://silab.kaist.ac.kr/", "dblp": ";273/2679;358/5797.html;156/7535", "google_scholar": ";;_51PhLQAAAAJ;sH2a0nkAAAAJ", "orcid": "0000-0003-0505-3956;0000-0002-6058-1594;0009-0001-4602-6367;0000-0003-2620-1479", "linkedin": ";;;", "or_profile": "~Jihwan_Yu1;~Jaeyeon_Jo1;~Taeyoung_Yun1;~Jinkyoo_Park1", "aff": ";Korea Advanced Institute of Science & Technology;Korea Advanced Institute of Science & Technology;Korea Advanced Institute of Science & Technology", "aff_domain": ";kaist.ac.kr;kaist.ac.kr;kaist.ac.kr", "position": ";PhD student;MS student;Associate Professor", "bibtex": "@misc{\nyu2024a,\ntitle={A Game Theoretic Approach to Meta-Learning: Nash Model-Agnostic Meta-Learning},\nauthor={Jihwan Yu and Jaeyeon Jo and Taeyoung Yun and Jinkyoo Park},\nyear={2024},\nurl={https://openreview.net/forum?id=AOpJ3vPNu8}\n}", "github": "", "project": "", "reviewers": "i9rv;azMB;XAaQ;SENj", "site": "https://openreview.net/forum?id=AOpJ3vPNu8", "pdf_size": 750119, "rating": "1;5;5;5", "confidence": "4;4;3;3", "soundness": "2;2;3;3", "contribution": "1;2;2;2", "presentation": "3;3;2;3", "wc_summary": "56;70;53;106", "wc_strengths": "44;34;27;41", "wc_weaknesses": "120;217;266;365", "wc_questions": "4;4;40;4", "wc_review": "224;325;386;516", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.0, 1.7320508075688772 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 71.25, 21.063890903629368 ], "wc_strengths_avg": [ 36.5, 6.576473218982953 ], "wc_weaknesses_avg": [ 242.0, 88.33742128905507 ], "wc_questions_avg": [ 13.0, 15.588457268119896 ], "wc_review_avg": [ 362.75, 105.71512427273592 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:aE9e3quQ1LsJ:scholar.google.com/&scioq=A+Game+Theoretic+Approach+to+Meta-Learning:+Nash+Model-Agnostic+Meta-Learning&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;0", "aff_unique_norm": "Korea Advanced Institute of Science and Technology", "aff_unique_dep": "", "aff_unique_url": "https://www.kaist.ac.kr", "aff_unique_abbr": "KAIST", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "South Korea" }, { "id": "AP779Zy70y", "title": "GATE: How to Keep Out Intrusive Neighbors", "track": "main", "status": "Reject", "tldr": "", "abstract": "Graph Attention Networks (GATs) are designed to provide flexible neighborhood aggregation that assigns weights to neighbors according to their importance. 
In practice, however, GATs are often unable to switch off task-irrelevant neighborhood aggregation, as we show experimentally and analytically. To address this challenge, we propose GATE, a GAT extension that holds three major advantages: i) It alleviates over-smoothing by addressing its root cause of unnecessary neighborhood aggregation. ii) Similarly to perceptrons, it benefits from higher depth as it can still utilize additional layers for (non-)linear feature transformations in case of (nearly) switched-off neighborhood aggregation. iii) By down-weighting connections to unrelated neighbors, it often outperforms GATs on real-world heterophilic datasets. To further validate our claims, we construct a synthetic test bed to analyze a model's ability to utilize the appropriate amount of neighborhood aggregation, which could be of independent interest.", "keywords": "graph attention networks;GNN architecture;neighborhood aggregation", "primary_area": "learning on graphs and other geometries & topologies", "supplementary_material": "/attachment/52a22da891dff12b66675a2383ee60f86966d6ae.zip", "author": "Nimrah Mustafa;Rebekka Burkholz", "authorids": "~Nimrah_Mustafa1;~Rebekka_Burkholz1", "gender": "F;F", "homepage": "https://cispa.de/en/people/c01nimu;https://sites.google.com/view/rebekkaburkholz/startseite", "dblp": ";194/3172", "google_scholar": ";https://scholar.google.ch/citations?user=vkWBb2wAAAAJ", "orcid": ";", "linkedin": ";", "or_profile": "~Nimrah_Mustafa1;~Rebekka_Burkholz1", "aff": "CISPA, saarland university, saarland informatics campus;Helmholtz Center CISPA for Information Security", "aff_domain": "cispa.saarland;cispa.saarland", "position": "PhD student;Associate Professor", "bibtex": "@misc{\nmustafa2024gate,\ntitle={{GATE}: How to Keep Out Intrusive Neighbors},\nauthor={Nimrah Mustafa and Rebekka Burkholz},\nyear={2024},\nurl={https://openreview.net/forum?id=AP779Zy70y}\n}", "github": "", "project": "", "reviewers": "8362;nehk;NiY6;J31R;sCet", "site": "https://openreview.net/forum?id=AP779Zy70y", "pdf_size": 2198281, "rating": "5;5;5;6;6", "confidence": "3;4;3;3;4", "soundness": "3;2;2;3;2", "contribution": "3;3;2;3;2", "presentation": "3;4;2;3;3", "wc_summary": "56;63;101;53;36", "wc_strengths": "38;42;22;18;51", "wc_weaknesses": "102;406;217;35;119", "wc_questions": "15;2;6;83;2", "wc_review": "211;513;346;189;208", "wc_reply_reviewers": "27;339;0;12;0", "wc_reply_authors": "589;1011;426;360;458", "reply_reviewers": "1;2;0;1;0", "reply_authors": "2;2;1;1;1", "rating_avg": [ 5.4, 0.48989794855663565 ], "confidence_avg": [ 3.4, 0.4898979485566356 ], "soundness_avg": [ 2.4, 0.4898979485566356 ], "contribution_avg": [ 2.6, 0.4898979485566356 ], "presentation_avg": [ 3.0, 0.6324555320336759 ], "wc_summary_avg": [ 61.8, 21.51650529244933 ], "wc_strengths_avg": [ 34.2, 12.4 ], "wc_weaknesses_avg": [ 175.8, 128.9858907012701 ], "wc_questions_avg": [ 21.6, 31.065092950126513 ], "wc_review_avg": [ 293.4, 123.2665404722628 ], "wc_reply_reviewers_avg": [ 75.6, 132.07361583601775 ], "wc_reply_authors_avg": [ 568.8, 233.33015235926968 ], "reply_reviewers_avg": [ 0.8, 0.7483314773547883 ], "reply_authors_avg": [ 1.4, 0.4898979485566356 ], "replies_avg": [ 20, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.16666666666666666, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14484222735322731887&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 9, "aff_unique_index": "0;1", "aff_unique_norm": "Saarland University;Helmholtz Center CISPA", 
"aff_unique_dep": "CISPA;Information Security", "aff_unique_url": "https://www.uni-saarland.de;https://www.cispa.de/", "aff_unique_abbr": "Saarland U;CISPA", "aff_campus_unique_index": "0", "aff_campus_unique": "Saarland Informatics Campus;", "aff_country_unique_index": "0;0", "aff_country_unique": "Germany" }, { "id": "ARFRZh6pzI", "title": "Tuning-Free Accountable Intervention for LLM Deployment - A Metacognitive Approach", "track": "main", "status": "Reject", "tldr": "", "abstract": "Large Language Models (LLMs) have catalyzed transformative advances across a spectrum of natural language processing tasks through few-shot or zero-shot prompting, bypassing the need for parameter tuning. While convenient, this modus operandi aggravates \"hallucination\" concerns, particularly given the enigmatic \"black-box\" nature behind their gigantic model sizes. Such concerns are exacerbated in high-stakes applications (e.g., healthcare), where unaccountable decision errors can lead to devastating consequences. \nIn contrast, human decision-making relies on nuanced cognitive processes, such as the ability to sense and adaptively correct misjudgments through conceptual understanding. Drawing inspiration from human cognition, we propose an innovative *metacognitive* approach, dubbed **CLEAR**, to equip LLMs with capabilities for self-aware error identification and correction. Our framework facilitates the construction of concept-specific sparse subnetworks that illuminate transparent decision pathways. This provides a novel interface for model *intervention* after deployment. Our intervention offers compelling advantages:\n(*i*) at deployment or inference time, our metacognitive LLMs can self-consciously identify potential mispredictions with minimum human involvement, (*ii*) the model has the capability to self-correct its errors efficiently, obviating the need for additional tuning, and (*iii*) the rectification procedure is not only self-explanatory but also user-friendly, enhancing the interpretability and accessibility of the model. 
By integrating these metacognitive features, our approach pioneers a new path toward engendering greater trustworthiness and accountability in the deployment of LLMs.", "keywords": "Large Language Models;Trustworthiness;Interpretability", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "Zhen Tan;Jie Peng;Tianlong Chen;huan liu", "authorids": "~Zhen_Tan2;~Jie_Peng4;~Tianlong_Chen1;~huan_liu1", "gender": "M;M;M;", "homepage": "https://zhen-tan-dmml.github.io/;http://home.ustc.edu.cn/~pengjieb/;https://tianlong-chen.github.io;", "dblp": "13/10345-1.html;;;", "google_scholar": "yMV7JtIAAAAJ;;LE3ctn0AAAAJ;", "orcid": "0009-0006-9548-2330;;0000-0001-7774-8197;", "linkedin": ";;tianlong-chen-783862167/;", "or_profile": "~Zhen_Tan2;~Jie_Peng4;~Tianlong_Chen1;~huan_liu1", "aff": "Amazon;University of Science and Technology of China;Harvard University;", "aff_domain": "amazon.com;ustc.edu.cn;harvard.edu;", "position": "Intern;PhD student;Postdoc;", "bibtex": "@misc{\ntan2024tuningfree,\ntitle={Tuning-Free Accountable Intervention for {LLM} Deployment - A Metacognitive Approach},\nauthor={Zhen Tan and Jie Peng and Tianlong Chen and huan liu},\nyear={2024},\nurl={https://openreview.net/forum?id=ARFRZh6pzI}\n}", "github": "", "project": "", "reviewers": "4fqZ;movx;7QQj;DFsm", "site": "https://openreview.net/forum?id=ARFRZh6pzI", "pdf_size": 1763932, "rating": "5;5;6;8", "confidence": "4;3;2;3", "soundness": "3;3;2;4", "contribution": "3;2;2;3", "presentation": "2;4;3;4", "wc_summary": "135;106;93;91", "wc_strengths": "70;11;52;77", "wc_weaknesses": "52;197;167;80", "wc_questions": "43;7;125;16", "wc_review": "300;321;437;264", "wc_reply_reviewers": "0;16;0;62", "wc_reply_authors": "789;1348;2072;740", "reply_reviewers": "0;1;0;1", "reply_authors": "4;5;5;2", "rating_avg": [ 6.0, 1.224744871391589 ], "confidence_avg": [ 3.0, 0.7071067811865476 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.25, 0.82915619758885 ], "wc_summary_avg": [ 106.25, 17.5695048308141 ], "wc_strengths_avg": [ 52.5, 25.636887486588538 ], "wc_weaknesses_avg": [ 124.0, 59.787122359250574 ], "wc_questions_avg": [ 47.75, 46.5262022950509 ], "wc_review_avg": [ 330.5, 64.77846864506755 ], "wc_reply_reviewers_avg": [ 19.5, 25.391927851189244 ], "wc_reply_authors_avg": [ 1237.25, 537.8798076708216 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 4.0, 1.224744871391589 ], "replies_avg": [ 25, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.28867513459481287, "gs_citation": 8, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14447195481248609480&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "aff_unique_index": "0;1;2", "aff_unique_norm": "Amazon;University of Science and Technology of China;Harvard University", "aff_unique_dep": "Amazon.com, Inc.;;", "aff_unique_url": "https://www.amazon.com;http://www.ustc.edu.cn;https://www.harvard.edu", "aff_unique_abbr": "Amazon;USTC;Harvard", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;0", "aff_country_unique": "United States;China" }, { "id": "ARP0xaE6od", "title": "Adapting Large Language Models for Content Moderation: Pitfalls in Data Engineering and Supervised Fine-tuning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Nowadays, billions of people engage in communication and express their opinions on the internet daily. 
Unfortunately, not all of these expressions are friendly or compliant, making content moderation an indispensable task. With the successful development of Large Language Models (LLMs) in recent years, LLM-based methods have become a feasible solution for handling tasks in various domains. However, in the field of content moderation, there is still a lack of detailed work that systematically introduces implementation details. In this paper, we introduce how to fine-tune an LLM model that can be privately deployed for content moderation. Specifically, we discuss whether incorporating reasons during the fine-tuning process would be better or if it should be treated as a classification task directly. We also explore the benefits of utilizing reasons generated by more powerful LLMs for fine-tuning privately deployed models and the impact of different processing approaches when the answers generated by the more powerful LLMs are incorrect. We report the entire research process and the key findings in this paper, hoping to provide valuable experience for researchers who are fine-tuning privately deployed models in their domain-specific research.", "keywords": "large language models;content moderation;fine-tuning", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Huan Ma;Changqing Zhang;Huazhu Fu;Peilin Zhao;Bingzhe Wu", "authorids": "~Huan_Ma1;~Changqing_Zhang1;~Huazhu_Fu4;~Peilin_Zhao2;~Bingzhe_Wu1", "gender": "M;M;M;;M", "homepage": "https://github.com/MaHuanAAA;http://cic.tju.edu.cn/faculty/zhangchangqing/index.html;https://hzfu.github.io;;", "dblp": ";78/2668;63/7767;84/8411;207/4843", "google_scholar": ";yJGhdykAAAAJ;https://scholar.google.com/citations?hl=en;https://scholar.google.com.hk/citations?user=HPeX_YcAAAAJ;_3hgtf8AAAAJ", "orcid": "0009-0000-4448-9897;;0000-0002-9702-5524;0000-0001-8543-3953;", "linkedin": "huan-ma-037711276/;;;;", "or_profile": "~Huan_Ma1;~Changqing_Zhang1;~Huazhu_Fu4;~Peilin_Zhao2;~Bingzhe_Wu1", "aff": "Tencent AI Lab;Tianjin University;Institute of High Performance Computing, Singapore, A*STAR;Tencent;Tencent AI Lab", "aff_domain": "tencent.com;tju.edu.cn;ihpc.a-star.edu.sg;tencent.com;tencent.com", "position": "Intern;Associate Professor;Principal Scientist;Researcher;Researcher", "bibtex": "@misc{\nma2024adapting,\ntitle={Adapting Large Language Models for Content Moderation: Pitfalls in Data Engineering and Supervised Fine-tuning},\nauthor={Huan Ma and Changqing Zhang and Huazhu Fu and Peilin Zhao and Bingzhe Wu},\nyear={2024},\nurl={https://openreview.net/forum?id=ARP0xaE6od}\n}", "github": "", "project": "", "reviewers": "65ce;7bgL;8Sfa", "site": "https://openreview.net/forum?id=ARP0xaE6od", "pdf_size": 733690, "rating": "3;3;6", "confidence": "3;4;3", "soundness": "2;2;3", "contribution": "2;2;3", "presentation": "2;2;2", "wc_summary": "107;43;68", "wc_strengths": "51;20;129", "wc_weaknesses": "264;317;127", "wc_questions": "76;3;3", "wc_review": "498;383;327", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 4.0, 1.4142135623730951 ], "confidence_avg": [ 3.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.0, 0.0 ], "wc_summary_avg": [ 72.66666666666667, 26.335442953471574 ], "wc_strengths_avg": [ 66.66666666666667, 45.85726647859518 ], "wc_weaknesses_avg": [ 236.0, 
80.05414834139869 ], "wc_questions_avg": [ 27.333333333333332, 34.41253001774532 ], "wc_review_avg": [ 402.6666666666667, 71.1820826394458 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 3, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.5, "gs_citation": 24, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=9620926999652194412&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 3, "aff_unique_index": "0;1;2;0;0", "aff_unique_norm": "Tencent;Tianjin University;Institute of High Performance Computing", "aff_unique_dep": "Tencent AI Lab;;", "aff_unique_url": "https://ai.tencent.com;http://www.tju.edu.cn;https://www.ihpc.a-star.edu.sg", "aff_unique_abbr": "Tencent AI Lab;TJU;IHPC", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;1;0;0", "aff_country_unique": "China;Singapore" }, { "title": "On the hardness of learning under symmetries", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19262", "id": "ARPrtuzAnQ", "author_site": "Bobak Kiani, Thien Le, Hannah Lawrence, Stefanie Jegelka, Melanie Weber", "tldr": "", "abstract": "We study the problem of learning equivariant neural networks via gradient descent. The incorporation of known symmetries (\"equivariance\") into neural nets has empirically improved the performance of learning pipelines, in domains ranging from biology to computer vision. However, a rich yet separate line of learning theoretic research has demonstrated that actually learning shallow, fully-connected (i.e. non-symmetric) networks has exponential complexity in the correlational statistical query (CSQ) model, a framework encompassing gradient descent. In this work, we ask: are known problem symmetries sufficient to alleviate the fundamental hardness of learning neural nets with gradient descent? We answer this question in the negative. In particular, we give lower bounds for shallow graph neural networks, convolutional networks, invariant polynomials, and frame-averaged networks for permutation subgroups, which all scale either superpolynomially or exponentially in the relevant input dimension. 
Therefore, in spite of the significant inductive bias imparted via symmetry, actually learning the complete classes of functions represented by equivariant neural networks via gradient descent remains hard.", "keywords": "Equivariance;statistical query;lower bound;computational hardness;invariance;symmetry;neural networks", "primary_area": "learning theory", "supplementary_material": "/attachment/31c55803ff649b8bb0d1d92205dad839c65e06f8.pdf", "author": "Bobak Kiani;Thien Le;Hannah Lawrence;Stefanie Jegelka;Melanie Weber", "authorids": "~Bobak_Kiani1;~Thien_Le1;~Hannah_Lawrence1;~Stefanie_Jegelka3;~Melanie_Weber1", "gender": ";M;F;F;", "homepage": ";https://steven-le-thien.github.io;https://hannahlawrence.github.io/;http://people.csail.mit.edu/stefje/;", "dblp": "232/4086;194/5549;251/5474;38/7003;", "google_scholar": ";WhFGh74AAAAJ;;gTWUZlsAAAAJ;", "orcid": ";0000-0001-5476-8451;;;", "linkedin": "bobak-kiani;;hannah-lawrence-417b5a130/;;", "or_profile": "~Bobak_Kiani1;~Thien_Le1;~Hannah_Lawrence1;~Stefanie_Jegelka3;~Melanie_Weber1", "aff": "Massachusetts Institute of Technology;Massachusetts Institute of Technology;Massachusetts Institute of Technology;Massachusetts Institute of Technology;", "aff_domain": "mit.edu;mit.edu;mit.edu;mit.edu;", "position": "PhD student;PhD student;PhD student;Associate Professor;", "bibtex": "@inproceedings{\nkiani2024on,\ntitle={On the hardness of learning under symmetries},\nauthor={Bobak Kiani and Thien Le and Hannah Lawrence and Stefanie Jegelka and Melanie Weber},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=ARPrtuzAnQ}\n}", "github": "", "project": "", "reviewers": "Fgas;kFXh;aiE7", "pdf_size": 845675, "rating": "6;8;8", "confidence": "5;3;3", "soundness": "4;4;4", "contribution": "3;4;3", "presentation": "4;4;3", "wc_summary": "401;86;73", "wc_strengths": "111;80;124", "wc_weaknesses": "39;30;106", "wc_questions": "45;62;1", "wc_review": "596;258;304", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "317;511;112", "reply_reviewers": "0;0;0", "reply_authors": "1;1;1", "rating_avg": [ 7.333333333333333, 0.9428090415820634 ], "confidence_avg": [ 3.6666666666666665, 0.9428090415820634 ], "soundness_avg": [ 4.0, 0.0 ], "contribution_avg": [ 3.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 3.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 186.66666666666666, 151.64944957221425 ], "wc_strengths_avg": [ 105.0, 18.457157599876172 ], "wc_weaknesses_avg": [ 58.333333333333336, 33.9050963065371 ], "wc_questions_avg": [ 36.0, 25.703436864876 ], "wc_review_avg": [ 386.0, 149.67520391389706 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 313.3333333333333, 162.91170069157778 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 9, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -1.0, "gs_citation": 13, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=18055256462617413365&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=ARPrtuzAnQ", "pdf": "https://openreview.net/pdf?id=ARPrtuzAnQ", "email": "mit.edu;mit.edu;mit.edu;mit.edu;", "author_num": 5, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "Massachusetts Institute of Technology", "aff_unique_dep": "", "aff_unique_url": "https://web.mit.edu", "aff_unique_abbr": "MIT", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", 
"aff_country_unique": "United States" }, { "id": "ASppt1L3hx", "title": "Cooperative Minibatching in Graph Neural Networks", "track": "main", "status": "Reject", "tldr": "", "abstract": "Significant computational resources are required to train Graph Neural Networks (GNNs) at a large scale,\nand the process is highly data-intensive.\nOne of the most effective ways to reduce resource requirements is minibatch training \ncoupled with graph sampling.\nGNNs have the unique property that items in a minibatch have overlapping data. \nHowever, the commonly implemented Independent Minibatching approach assigns each Processing \nElement (PE) its own minibatch to process, leading to duplicated computations and input data access across PEs. \nThis amplifies the Neighborhood Explosion Phenomenon (NEP), which is the main bottleneck limiting scaling. \nTo reduce the effects of NEP in the multi-PE setting,\nwe propose a new approach called Cooperative Minibatching. \nOur approach capitalizes on the fact that the size of the sampled subgraph is a concave function of the batch size, leading to \nsignificant reductions in the amount of work per seed vertex as batch sizes increase. Hence, it is favorable for \nprocessors to work on a large minibatch together as a single larger processor, instead of working on separate smaller \nminibatches, even though global batch size is identical.\nWe also show how to take advantage of the same phenomenon in serial execution by generating dependent consecutive minibatches. \nOur experimental evaluations show up to 4x bandwidth savings for fetching vertex embeddings, by simply increasing \nthis dependency without harming model convergence. Combining our proposed approaches, we achieve up to 64\\% \nspeedup over Independent Minibatching on single-node multi-GPU systems and show \nthat load balancing is not an issue despite the use of lock-step communication.", "keywords": "graph learning;graph neural networks;gnn;multigpu training", "primary_area": "learning on graphs and other geometries & topologies", "supplementary_material": "/attachment/6dfd498f249f8487991ed90b471e5f8be5df2b12.zip", "author": "Muhammed Fatih Balin;Dominique LaSalle;Umit Catalyurek", "authorids": "~Muhammed_Fatih_Balin1;~Dominique_LaSalle1;~Umit_Catalyurek1", "gender": "M;;M", "homepage": "http://mfbal.in;;https://www.cc.gatech.edu/~umit/", "dblp": "234/8533;;https://dblp.uni-trier.de/pid/c/UmitVCatalyurek.html", "google_scholar": "https://scholar.google.com.tr/citations?user=xfzbywYAAAAJ;;OLDMURQAAAAJ", "orcid": "0000-0001-9935-2687;;", "linkedin": "mfbalin/;;catalyurek/", "or_profile": "~Muhammed_Fatih_Balin1;~Dominique_LaSalle1;~Umit_Catalyurek1", "aff": "Georgia Institute of Technology;;Georgia Institute of Technology", "aff_domain": "gatech.edu;;gatech.edu", "position": "PhD student;;Full Professor", "bibtex": "@misc{\nbalin2024cooperative,\ntitle={Cooperative Minibatching in Graph Neural Networks},\nauthor={Muhammed Fatih Balin and Dominique LaSalle and Umit Catalyurek},\nyear={2024},\nurl={https://openreview.net/forum?id=ASppt1L3hx}\n}", "github": "", "project": "", "reviewers": "LvyT;m5Sh;GNH8", "site": "https://openreview.net/forum?id=ASppt1L3hx", "pdf_size": 2004684, "rating": "1;6;6", "confidence": "5;3;3", "soundness": "1;3;2", "contribution": "1;3;2", "presentation": "1;3;3", "wc_summary": "28;109;60", "wc_strengths": "10;48;67", "wc_weaknesses": "212;40;205", "wc_questions": "80;216;71", "wc_review": "330;413;403", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "695;676;873", 
"reply_reviewers": "0;0;0", "reply_authors": "1;2;2", "rating_avg": [ 4.333333333333333, 2.357022603955158 ], "confidence_avg": [ 3.6666666666666665, 0.9428090415820634 ], "soundness_avg": [ 2.0, 0.816496580927726 ], "contribution_avg": [ 2.0, 0.816496580927726 ], "presentation_avg": [ 2.3333333333333335, 0.9428090415820634 ], "wc_summary_avg": [ 65.66666666666667, 33.30999182761166 ], "wc_strengths_avg": [ 41.666666666666664, 23.697163449568293 ], "wc_weaknesses_avg": [ 152.33333333333334, 79.48305200201835 ], "wc_questions_avg": [ 122.33333333333333, 66.33417084898419 ], "wc_review_avg": [ 382.0, 36.995495221265344 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 748.0, 88.72804892854721 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.6666666666666667, 0.4714045207910317 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -1.0, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=18112592828352537730&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 6, "aff_unique_index": "0;0", "aff_unique_norm": "Georgia Institute of Technology", "aff_unique_dep": "", "aff_unique_url": "https://www.gatech.edu", "aff_unique_abbr": "Georgia Tech", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "title": "GAIA: Zero-shot Talking Avatar Generation", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19261", "id": "ATEawsFUj4", "author_site": "Tianyu He, Junliang Guo, Runyi Yu, Yuchi Wang, jialiang zhu, Kaikai An, Leyi Li, Xu Tan, Chunyu Wang, Han Hu, HsiangTao Wu, sheng zhao, Jiang Bian", "tldr": "", "abstract": "Zero-shot talking avatar generation aims at synthesizing natural talking videos from speech and a single portrait image. Previous methods have relied on domain-specific heuristics such as warping-based motion representation and 3D Morphable Models, which limit the naturalness and diversity of the generated avatars. In this work, we introduce GAIA (Generative AI for Avatar), which eliminates the domain priors in talking avatar generation. In light of the observation that the speech only drives the motion of the avatar while the appearance of the avatar and the background typically remain the same throughout the entire video, we divide our approach into two stages: 1) disentangling each frame into motion and appearance representations; 2) generating motion sequences conditioned on the speech and reference portrait image. We collect a large-scale high-quality talking avatar dataset and train the model on it with different scales (up to 2B parameters). 
Experimental results verify the superiority, scalability, and flexibility of GAIA as 1) the resulting model beats previous baseline models in terms of naturalness, diversity, lip-sync quality, and visual quality; 2) the framework is scalable since larger models yield better results; 3) it is general and enables different applications like controllable talking avatar generation and text-instructed avatar generation.", "keywords": "Talking Avatar Generation;Video Generation;Disentanglement;Diffusion Models", "primary_area": "generative models", "supplementary_material": "/attachment/5e232f403fc3dd96d63591c6871d42425e9a6f46.zip", "author": "Tianyu He;Junliang Guo;Runyi Yu;Yuchi Wang;jialiang zhu;Kaikai An;Leyi Li;Xu Tan;Chunyu Wang;Han Hu;HsiangTao Wu;sheng zhao;Jiang Bian", "authorids": "~Tianyu_He1;~Junliang_Guo1;~Runyi_Yu1;~Yuchi_Wang1;~jialiang_zhu2;~Kaikai_An1;~Leyi_Li1;~Xu_Tan1;~Chunyu_Wang1;~Han_Hu1;~HsiangTao_Wu1;~sheng_zhao1;~Jiang_Bian1", "gender": "M;M;F;M;M;M;;M;M;M;M;M;M", "homepage": "https://www.microsoft.com/en-us/research/people/tianyuhe/;https://leoguojl.me/;https://ingrid789.github.io/IngridYu/;https://wangyuchi369.github.io/;https://github.com/jialiang-zhu;https://github.com/kkk-an;https://xunmeibuyue.github.io/;https://tan-xu.github.io/;https://www.chunyuwang.org/;https://ancientmooner.github.io/;https://www.microsoft.com/en-us/research/people/musclewu/;https://www.aaai.org/ojs/index.php/AAAI/article/view/4642;https://sites.google.com/view/jiangbian", "dblp": "198/4010;209/9674;94/6433-2;358/5700;;;;96/10484-3;63/7235;;;;09/851-2.html", "google_scholar": "P08KU1YAAAAJ;https://scholar.google.com.sg/citations?user=S88C9ewAAAAJ;https://scholar.google.com.hk/citations?user=jUSqsWkAAAAJ;RxuU_0YAAAAJ;;6TrBRiEAAAAJ;;tob-U1oAAAAJ;https://scholar.google.co.jp/citations?user=VXQV5xwAAAAJ;Jkss014AAAAJ;;689bIIwAAAAJ;pZBEnY8AAAAJ", "orcid": "0000-0002-4828-3228;0000-0001-8360-5483;;;;;;0000-0001-5631-0639;;;;;0000-0002-9472-600X", "linkedin": ";;;;;;;;;;;;jbian/", "or_profile": "~Tianyu_He1;~Junliang_Guo1;~Runyi_Yu1;~Yuchi_Wang1;~jialiang_zhu2;~Kaikai_An1;~Leyi_Li1;~Xu_Tan1;~Chunyu_Wang1;~Han_Hu1;~HsiangTao_Wu1;~sheng_zhao1;~Jiang_Bian1", "aff": "Microsoft Research Asia;Microsoft;Peking University;Peking University;Southeast University;Peking University;Zhejiang University;Microsoft;Microsoft Research Asia;Microsft Research Asia;Microsoft;Microsoft;Microsoft", "aff_domain": "microsoft.com;microsoft.com;pku.edu.cn;pku.edu.cn;seu.edu.cn;pku.edu.cn;zju.edu.cn;microsoft.com;microsoft.com;microsoft.com;microsoft.com;microsoft.com;microsoft.com", "position": "Researcher;Researcher;MS student;MS student;PhD student;MS student;MS student;Principal Researcher;Researcher;Researcher;Principal Researcher;Researcher;Partner Research Manager", "bibtex": "@inproceedings{\nhe2024gaia,\ntitle={{GAIA}: Zero-shot Talking Avatar Generation},\nauthor={Tianyu He and Junliang Guo and Runyi Yu and Yuchi Wang and jialiang zhu and Kaikai An and Leyi Li and Xu Tan and Chunyu Wang and Han Hu and HsiangTao Wu and sheng zhao and Jiang Bian},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=ATEawsFUj4}\n}", "github": "", "project": "", "reviewers": "tNS3;Lkke;ft55;1S6P", "pdf_size": 12849431, "rating": "6;6;6;8", "confidence": "4;3;5;4", "soundness": "3;3;3;3", "contribution": "3;3;2;3", "presentation": "3;3;3;3", "wc_summary": "60;33;57;109", "wc_strengths": "82;71;41;34", "wc_weaknesses": "49;40;97;190", "wc_questions": 
"23;44;222;26", "wc_review": "214;188;417;359", "wc_reply_reviewers": "0;25;46;54", "wc_reply_authors": "363;590;1326;1096", "reply_reviewers": "0;1;1;1", "reply_authors": "2;2;4;4", "rating_avg": [ 6.5, 0.8660254037844386 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 64.75, 27.60774347895894 ], "wc_strengths_avg": [ 57.0, 20.03746490951388 ], "wc_weaknesses_avg": [ 94.0, 59.510503274632114 ], "wc_questions_avg": [ 78.75, 83.09444927310128 ], "wc_review_avg": [ 294.5, 96.16262267638086 ], "wc_reply_reviewers_avg": [ 31.25, 20.92098229051399 ], "wc_reply_authors_avg": [ 843.75, 384.6117360403866 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 3.0, 1.0 ], "replies_avg": [ 24, 0 ], "authors#_avg": [ 13, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 21, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11354634788031823120&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=ATEawsFUj4", "pdf": "https://openreview.net/pdf?id=ATEawsFUj4", "email": "microsoft.com;microsoft.com;pku.edu.cn;pku.edu.cn;seu.edu.cn;pku.edu.cn;zju.edu.cn;microsoft.com;microsoft.com;microsoft.com;microsoft.com;microsoft.com;microsoft.com", "author_num": 13, "aff_unique_index": "0;0;1;1;2;1;3;0;0;0;0;0;0", "aff_unique_norm": "Microsoft;Peking University;Southeast University;Zhejiang University", "aff_unique_dep": "Research;;;", "aff_unique_url": "https://www.microsoft.com/en-us/research/group/asia;http://www.pku.edu.cn;https://www.seu.edu.cn/;https://www.zju.edu.cn", "aff_unique_abbr": "MSR Asia;Peking U;SEU;ZJU", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Asia;", "aff_country_unique_index": "0;1;0;0;0;0;0;1;0;0;1;1;1", "aff_country_unique": "China;United States" }, { "id": "ATFPZbSZia", "title": "Grouplane: End-to-End 3D Lane Detection with Channel-Wise Grouping", "track": "main", "status": "Reject", "tldr": "", "abstract": "Efficiency is quite important for 3D lane detection while previous detectors are either computationally expensive or difficult for optimization. To bridge this gap, we propose a fully convolutional detector named GroupLane, which is simple, fast, and still maintains high detection precision. Specifically, we first propose to split extracted feature into multiple groups along the channel dimension and employ every group to represent a prediction. In this way, GroupLane realizes end-to-end detection like DETR based on pure convolutional neural network. Then, we propose to represent lanes by performing row-wise classification in bird\u2019s eye view and devise a set of corresponding detection heads. Compared with existing row-wise classification implementations that only support recognizing vertical lanes, ours can detect both vertical and horizontal ones. Additionally, a matching algorithm named single-win one-to-one matching is developed to associate prediction with labels during training. Evaluated on 3 benchmarks, OpenLane, Once-3DLanes, and OpenLane-Huawei, GroupLane adopting ConvNext-Base as the backbone outperforms the published state-of-the-art PersFormer by 13.6% F1 score in the OpenLane validation set. 
Besides, GroupLane with ResNet18 still surpasses PersFormer by 4.9% F1 score, while the inference speed is 7$\\times$ faster.", "keywords": "3D lane detection;end-to-end;row-wise classification;fully convolutional", "primary_area": "applications to robotics, autonomy, planning", "supplementary_material": "/attachment/4f580cb11e17a27feb9056536ca7021a480fb213.zip", "author": "Zhuoling Li;chunrui han;Zheng Ge;Jinrong Yang;En Yu;Haoqian Wang;Hengshuang Zhao;Xiangyu Zhang", "authorids": "~Zhuoling_Li1;~chunrui_han1;~Zheng_Ge1;~Jinrong_Yang1;~En_Yu1;~Haoqian_Wang1;~Hengshuang_Zhao2;~Xiangyu_Zhang1", "gender": "M;F;M;M;M;M;M;M", "homepage": "https://lizhuoling.github.io/;https://github.com/hanchunrui;;https://yancie-yjr.github.io/;https://www.zhihu.com/people/yu-en-47-48;;https://hszhao.github.io;", "dblp": "243/1499;;231/1007;286/5463;213/4929;;185/7848;95/3760-5.html", "google_scholar": "2r6ejykAAAAJ;;hJ-VrrIAAAAJ;8Of_NYQAAAAJ;https://scholar.google.com.hk/citations?user=rWCQMNgAAAAJ;;4uE10I0AAAAJ;yuB-cfoAAAAJ", "orcid": ";;;;;0000-0003-2792-8469;0000-0001-8277-2706;0000-0003-2138-4608", "linkedin": ";;;;;;hengshuang-zhao-347b8391/?originalSubdomain=hk;", "or_profile": "~Zhuoling_Li1;~chunrui_han1;~Zheng_Ge1;~Jinrong_Yang1;~En_Yu1;~Haoqian_Wang1;~Hengshuang_Zhao2;~Xiangyu_Zhang1", "aff": "University of Hong Kong;Megvii Technology Inc.;Megvii Technology Inc.;Huazhong University of Science and Technology;Huazhong University of Science and Technology;Tsinghua University;The University of Hong Kong;MEGVII Technology", "aff_domain": "hku.hk;megvii.com;megvii.com;hust.edu.cn;hust.edu;tsinghua.edu.cn;hku.hk;megvii.com", "position": "PhD student;Researcher;Researcher;PhD student;PhD student;Full Professor;Assistant Professor;Principal Researcher", "bibtex": "@misc{\nli2024grouplane,\ntitle={Grouplane: End-to-End 3D Lane Detection with Channel-Wise Grouping},\nauthor={Zhuoling Li and chunrui han and Zheng Ge and Jinrong Yang and En Yu and Haoqian Wang and Hengshuang Zhao and Xiangyu Zhang},\nyear={2024},\nurl={https://openreview.net/forum?id=ATFPZbSZia}\n}", "github": "", "project": "", "reviewers": "5Kts;RkdN;dGoq", "site": "https://openreview.net/forum?id=ATFPZbSZia", "pdf_size": 3193343, "rating": "5;5;6", "confidence": "4;5;3", "soundness": "3;3;2", "contribution": "2;2;3", "presentation": "3;2;3", "wc_summary": "87;63;62", "wc_strengths": "37;11;84", "wc_weaknesses": "37;75;151", "wc_questions": "82;1;35", "wc_review": "243;150;332", "wc_reply_reviewers": "0;12;125", "wc_reply_authors": "648;796;897", "reply_reviewers": "0;1;1", "reply_authors": "2;4;3", "rating_avg": [ 5.333333333333333, 0.4714045207910317 ], "confidence_avg": [ 4.0, 0.816496580927726 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 70.66666666666667, 11.55662388223981 ], "wc_strengths_avg": [ 44.0, 30.21037349432586 ], "wc_weaknesses_avg": [ 87.66666666666667, 47.39432689913659 ], "wc_questions_avg": [ 39.333333333333336, 33.209770985191824 ], "wc_review_avg": [ 241.66666666666666, 74.3071702835975 ], "wc_reply_reviewers_avg": [ 45.666666666666664, 56.31064631922536 ], "wc_reply_authors_avg": [ 780.3333333333334, 102.25567085605678 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 3.0, 0.816496580927726 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": -0.8660254037844385, "gs_citation": 13, 
"gs_cited_by_link": "https://scholar.google.com/scholar?cites=11111051036937699351&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "aff_unique_index": "0;1;1;2;2;3;0;1", "aff_unique_norm": "University of Hong Kong;Megvii Technology;Huazhong University of Science and Technology;Tsinghua University", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.hku.hk;https://www.megvii.com;http://www.hust.edu.cn;https://www.tsinghua.edu.cn", "aff_unique_abbr": "HKU;Megvii;HUST;THU", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Hong Kong SAR;", "aff_country_unique_index": "0;0;0;0;0;0;0;0", "aff_country_unique": "China" }, { "id": "ATQSDgYwqA", "title": "Diffusion Random Feature Model", "track": "main", "status": "Reject", "tldr": "", "abstract": "Diffusion probabilistic models have been successfully used to generate data from noise. However, most diffusion models are computationally expensive and difficult to interpret with a lack of theoretical justification. Random feature models (RFMs) on the other hand have gained popularity due to their interpretability but their application to complex machine learning tasks remains limited. In this work, we present a diffusion model-inspired deep random feature model that is interpretable and gives comparable numerical results to a fully connected neural network having the same number of trainable parameters. Specifically, we extend existing results for random features and derive generalization bounds between the distribution of sampled data and the true distribution using properties of score matching. We validate our findings by generating samples on the fashion MNIST dataset and instrumental audio data.", "keywords": "Diffusion Models;Deep Random Feature Models;Generalization Bounds", "primary_area": "learning theory", "supplementary_material": "/attachment/90d99ba01a4642577c4724dcead598157e441d63.pdf", "author": "Esha Saha;Giang Tran", "authorids": "~Esha_Saha1;~Giang_Tran2", "gender": "F;", "homepage": ";https://uwaterloo.ca/applied-mathematics/people-profiles/giang-tran", "dblp": "254/3655;", "google_scholar": "https://scholar.google.com/citations?hl=en;-zCxA1AAAAAJ", "orcid": "0000-0002-1548-5712;0000-0002-3518-153X", "linkedin": "esha-saha-bb86171b6/?originalSubdomain=ca;", "or_profile": "~Esha_Saha1;~Giang_Tran2", "aff": "University of Waterloo;University of Waterloo", "aff_domain": "uwaterloo.ca;uwaterloo.ca", "position": "PhD student;Assistant Professor", "bibtex": "@misc{\nsaha2024diffusion,\ntitle={Diffusion Random Feature Model},\nauthor={Esha Saha and Giang Tran},\nyear={2024},\nurl={https://openreview.net/forum?id=ATQSDgYwqA}\n}", "github": "", "project": "", "reviewers": "2YaV;3pnu;vFu7;crxL;58mK;2JVx", "site": "https://openreview.net/forum?id=ATQSDgYwqA", "pdf_size": 966474, "rating": "3;3;3;5;5;6", "confidence": "5;4;4;4;3;3", "soundness": "1;3;1;3;3;3", "contribution": "1;3;1;2;3;3", "presentation": "3;4;3;2;2;3", "wc_summary": "77;54;70;92;100;46", "wc_strengths": "42;44;33;76;79;28", "wc_weaknesses": "172;281;147;415;222;68", "wc_questions": "93;3;20;9;305;2", "wc_review": "384;382;270;592;706;144", "wc_reply_reviewers": "57;26;22;92;0;0", "wc_reply_authors": "539;1217;725;1325;1460;405", "reply_reviewers": "1;1;1;1;0;0", "reply_authors": "2;3;1;4;3;1", "rating_avg": [ 4.166666666666667, 1.2133516482134197 ], "confidence_avg": [ 3.8333333333333335, 0.6871842709362768 ], "soundness_avg": [ 2.3333333333333335, 0.9428090415820634 ], "contribution_avg": [ 2.1666666666666665, 0.8975274678557507 ], "presentation_avg": [ 
2.8333333333333335, 0.6871842709362768 ], "wc_summary_avg": [ 73.16666666666667, 19.169564998252365 ], "wc_strengths_avg": [ 50.333333333333336, 19.955506062794353 ], "wc_weaknesses_avg": [ 217.5, 109.88592569872934 ], "wc_questions_avg": [ 72.0, 108.83014288330233 ], "wc_review_avg": [ 413.0, 188.194048790072 ], "wc_reply_reviewers_avg": [ 32.833333333333336, 32.672193410027155 ], "wc_reply_authors_avg": [ 945.1666666666666, 405.882748531587 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 2.3333333333333335, 1.1055415967851334 ], "replies_avg": [ 26, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.766241095350685, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:cZDvD6V_pBkJ:scholar.google.com/&scioq=Diffusion+Random+Feature+Model&hl=en&as_sdt=0,5", "gs_version_total": 3, "aff_unique_index": "0;0", "aff_unique_norm": "University of Waterloo", "aff_unique_dep": "", "aff_unique_url": "https://uwaterloo.ca", "aff_unique_abbr": "UW", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "Canada" }, { "id": "ATaE46G1eJ", "title": "CosPGD: an efficient white-box adversarial attack for pixel-wise prediction tasks", "track": "main", "status": "Reject", "tldr": "", "abstract": "While neural networks allow highly accurate predictions in many tasks, their lack of robustness towards even slight input perturbations hampers their deployment in many real-world applications.\nWhite-box adversarial attacks such as the seminal projected gradient descent (PGD) offer an effective means to evaluate the model robustness and dedicated solutions have been proposed for example for attacks on semantic segmentation or on optical flow. \nTo streamline the evaluation process, we propose an efficient white-box adversarial attack, termed CosPGD, that can be applied to any pixel-wise prediction task in a unified setting.\nTo this end, CosPGD employs a simple loss scaling based on the cosine similarity between the distributions over the predictions and ground truth (or target, for targeted attacks).\nThis leads to efficient evaluations of a model's robustness for pixelwise classification as well as regression models, providing new insights into their performance at earlier attack stages.\nWe outperform the SotA on semantic segmentation attacks in our experiments on PASCAL VOC2012 and CityScapes.\nFurther, we showcase CosPGD's versatility by evaluating optical flow as well as image restoration models. 
\nWe provide code for the CosPGD algorithm and example usage at https://anonymous.4open.science/r/cospgd-iclr2024-909/.", "keywords": "adversarial attacks;pgd;fgsm;cospgd;cosine similarity;semantic segmentation;optical flow;benchmarking tool;benchmark adversarial attack;lp norm;l-inf norm;l-2 norm", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Shashank Agnihotri;Steffen Jung;Margret Keuper", "authorids": "~Shashank_Agnihotri1;~Steffen_Jung1;~Margret_Keuper1", "gender": "M;M;F", "homepage": "https://www.uni-mannheim.de/dws/people/researchers/phd-students/shashank/;http://jung.vision;https://www.vc.informatik.uni-siegen.de/en/keuper-margret", "dblp": ";252/0087-1;95/7589", "google_scholar": "vhm_xu8AAAAJ;x5ovaJcAAAAJ;https://scholar.google.de/citations?user=KMqMQAcAAAAJ", "orcid": "0000-0001-6097-8551;0000-0001-8021-791X;0000-0002-8437-7993", "linkedin": "shashank-agnihotri/;jung-vision/;", "or_profile": "~Shashank_Agnihotri1;~Steffen_Jung1;~Margret_Keuper1", "aff": "Universit\u00e4t Siegen;Saarland Informatics Campus, Max-Planck Institute;Max Planck Institute for Informatics", "aff_domain": "uni-siegen.de;mpi-inf.mpg.de;mpi-inf.mpg", "position": "PhD student;PhD student;Researcher", "bibtex": "@misc{\nagnihotri2024cospgd,\ntitle={Cos{PGD}: an efficient white-box adversarial attack for pixel-wise prediction tasks},\nauthor={Shashank Agnihotri and Steffen Jung and Margret Keuper},\nyear={2024},\nurl={https://openreview.net/forum?id=ATaE46G1eJ}\n}", "github": "", "project": "", "reviewers": "3VUb;E2Ss;kcAq;YMdT", "site": "https://openreview.net/forum?id=ATaE46G1eJ", "pdf_size": 11646064, "rating": "5;5;5;8", "confidence": "4;4;4;5", "soundness": "3;2;3;3", "contribution": "2;2;3;3", "presentation": "3;3;2;4", "wc_summary": "61;64;52;123", "wc_strengths": "37;34;65;167", "wc_weaknesses": "91;367;90;176", "wc_questions": "2;4;151;3", "wc_review": "191;469;358;469", "wc_reply_reviewers": "74;0;0;11", "wc_reply_authors": "1037;1328;751;1697", "reply_reviewers": "1;0;0;1", "reply_authors": "4;3;3;4", "rating_avg": [ 5.75, 1.299038105676658 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 75.0, 28.062430400804562 ], "wc_strengths_avg": [ 75.75, 54.05263638343647 ], "wc_weaknesses_avg": [ 181.0, 112.91811192187018 ], "wc_questions_avg": [ 40.0, 64.08978077665736 ], "wc_review_avg": [ 371.75, 113.77032785397078 ], "wc_reply_reviewers_avg": [ 21.25, 30.784533454317607 ], "wc_reply_authors_avg": [ 1203.25, 350.54270424585934 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 3.5, 0.5 ], "replies_avg": [ 25, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 1.0, "gs_citation": 10, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=2686630512059451311&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 9, "aff_unique_index": "0;1;2", "aff_unique_norm": "University of Siegen;Max-Planck Institute;Max Planck Institute for Informatics", "aff_unique_dep": ";Informatics;", "aff_unique_url": "https://www.uni-siegen.de;https://www.mpi-sws.org;https://mpi-inf.mpg.de", "aff_unique_abbr": "Uni Siegen;MPI-SWS;MPII", "aff_campus_unique_index": "1", "aff_campus_unique": ";Saarland", "aff_country_unique_index": "0;0;0", "aff_country_unique": "Germany" }, { "id": "ATuX4zRnJo", "title": "NoiseOut: Learning to Gate Improves Robustness in Deep Neural Networks", "track": "main", 
"status": "Withdraw", "tldr": "", "abstract": "Deep Neural Networks (DNNs) achieve impressive performance, when trained on datasets of similar distributions. However, they struggle to generalize to novel data, such as image perturbations, when they differ from the training distribution. Using the Integrated Gradients method, we visualize several perturbed features contributing to the higher classification errors. To filter out such distractor features, we take inspiration from the thalamus, which is a biological gating mechanism that improves the signal fidelity of novel stimuli for task completion. Similarly, we propose a novel method called NoiseOut which is a lightweight modular gating mechanism that can be easily integrated with existing DNNs to enhance its robustness to novel image perturbations. When training on the clean datasets, we randomly replaced a subset of the hidden states with normally-sampled values and, augmented the Integrated Gradients analysis method into an additional objective function. With these processes, NoiseOut gradually learned suitable dynamic gating policies to filter out distractor signals and pass task relevant information to the classifier. When evaluating on perturbed datasets, NoiseOut uses the prior learned gating policies to filter out features that negatively influence classification. We demonstrate that our modular NoiseOut mechanism improves existing DNN's robustness to novel perturbations by achieving strong results on the MNIST-C and ImageNet-C benchmarks.", "keywords": "robust classifiers; bionic algorithms", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Leon Guertler;M Ganesh Kumar;Cheston Tan", "authorids": "~Leon_Guertler1;~M_Ganesh_Kumar1;~Cheston_Tan1", "gender": "M;M;M", "homepage": ";https://mgkumar138.github.io/;", "dblp": ";230/0379;136/9366", "google_scholar": ";sFfy1q4AAAAJ;Up0UYEYAAAAJ", "orcid": ";0000-0001-5559-6428;", "linkedin": "leon-gurtler-6b3847165/;m-ganesh-kumar-28682792/;cheston-tan/", "or_profile": "~Leon_Guertler1;~M_Ganesh_Kumar1;~Cheston_Tan1", "aff": "Nanyang Technological University;Harvard University;Singapore University of Technology and Design", "aff_domain": "ntu.edu.sg;harvard.edu;sutd.edu.sg", "position": "Undergrad student;Postdoc;Assistant Professor", "bibtex": "@misc{\nguertler2024noiseout,\ntitle={NoiseOut: Learning to Gate Improves Robustness in Deep Neural Networks},\nauthor={Leon Guertler and M Ganesh Kumar and Cheston Tan},\nyear={2024},\nurl={https://openreview.net/forum?id=ATuX4zRnJo}\n}", "github": "", "project": "", "reviewers": "ZBE7;zW13;G3rD;oCeg", "site": "https://openreview.net/forum?id=ATuX4zRnJo", "pdf_size": 2996681, "rating": "3;3;3;3", "confidence": "3;5;4;3", "soundness": "2;2;2;2", "contribution": "1;2;2;2", "presentation": "3;3;2;3", "wc_summary": "100;98;47;71", "wc_strengths": "38;131;36;48", "wc_weaknesses": "302;262;67;250", "wc_questions": "4;2;39;44", "wc_review": "444;493;189;413", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 3.0, 0.0 ], "confidence_avg": [ 3.75, 0.82915619758885 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 79.0, 21.737065119284157 ], "wc_strengths_avg": [ 63.25, 39.37876966082104 ], "wc_weaknesses_avg": [ 220.25, 90.54936498949068 ], "wc_questions_avg": [ 22.25, 19.343926695477318 ], "wc_review_avg": 
[ 384.75, 116.55980224760164 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:7xX8jFi8Fd8J:scholar.google.com/&scioq=NoiseOut:+Learning+to+Gate+Improves+Robustness+in+Deep+Neural+Networks&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1;2", "aff_unique_norm": "Nanyang Technological University;Harvard University;Singapore University of Technology and Design", "aff_unique_dep": ";;", "aff_unique_url": "https://www.ntu.edu.sg;https://www.harvard.edu;https://www.sutd.edu.sg", "aff_unique_abbr": "NTU;Harvard;SUTD", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;0", "aff_country_unique": "Singapore;United States" }, { "title": "A differentiable brain simulator bridging brain simulation and brain-inspired computing", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19260", "id": "AU2gS9ut61", "author_site": "Chaoming Wang, Tianqiu Zhang, Sichao He, Hongyaoxing Gu, Shangyang Li, Si Wu", "tldr": "", "abstract": "Brain simulation builds dynamical models to mimic the structure and functions of the brain, while brain-inspired computing (BIC) develops intelligent systems by learning from the structure and functions of the brain. The two fields are intertwined and should share a common programming framework to facilitate each other's development. However, none of the existing software in the fields can achieve this goal, because traditional brain simulators lack differentiability for training, while existing deep learning (DL) frameworks fail to capture the biophysical realism and complexity of brain dynamics. In this paper, we introduce BrainPy, a differentiable brain simulator developed using JAX and XLA, with the aim of bridging the gap between brain simulation and BIC. BrainPy expands upon the functionalities of JAX, a powerful AI framework, by introducing complete capabilities for flexible, efficient, and scalable brain simulation. It offers a range of sparse and event-driven operators for efficient and scalable brain simulation, an abstraction for managing the intricacies of synaptic computations, a modular and flexible interface for constructing multi-scale brain models, and an object-oriented just-in-time compilation approach to handle the memory-intensive nature of brain dynamics. 
We showcase the efficiency and scalability of BrainPy on benchmark tasks, and highlight its differentiable simulation for biologically plausible spiking models.", "keywords": "brain simulator;brain simulation;computational neuroscience;brain-inspired computing", "primary_area": "applications to neuroscience & cognitive science", "supplementary_material": "/attachment/943a8eb1c80560e7df5cc2d12a0bb25667d6e630.zip", "author": "Chaoming Wang;Tianqiu Zhang;Sichao He;Hongyaoxing Gu;Shangyang Li;Si Wu", "authorids": "~Chaoming_Wang1;~Tianqiu_Zhang1;~Sichao_He1;~Hongyaoxing_Gu1;~Shangyang_Li1;~Si_Wu1", "gender": "M;M;M;M;M;M", "homepage": "https://brainpy.tech/;https://ztqakita.github.io/;https://routhleck.com;;https://mgv.pku.edu.cn/english/people/lbd/soeeace/267528.htm;https://gitee.com/guhongyaoxing", "dblp": ";356/8708;;274/8227;25/437-1;360/4816.html", "google_scholar": ";https://scholar.google.co.jp/citations?user=q-7tMTwAAAAJ;;g77hKJcAAAAJ;;", "orcid": ";0009-0000-6418-1961;;;;", "linkedin": ";;;;;", "or_profile": "~Chaoming_Wang1;~Tianqiu_Zhang1;~Sichao_He1;~Shangyang_Li1;~Si_Wu1;~Gu_Hongyaoxing1", "aff": ";Peking University;Beijing Jiaotong University;Peking University;Peking University;University of Chinese Academy of Sciences", "aff_domain": ";pku.edu.cn;bjtu.edu.cn;pku.edu.cn;pku.edu.cn;ucas.edu.cn", "position": ";PhD student;Undergrad student;PhD student;Full Professor;MS student", "bibtex": "@inproceedings{\nwang2024a,\ntitle={A differentiable brain simulator bridging brain simulation and brain-inspired computing},\nauthor={Chaoming Wang and Tianqiu Zhang and Sichao He and Hongyaoxing Gu and Shangyang Li and Si Wu},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=AU2gS9ut61}\n}", "github": "", "project": "", "reviewers": "zrYr;g6hc;kvGz;wQtY;afG7", "pdf_size": 13405406, "rating": "6;6;6;8;10", "confidence": "3;3;4;4;4", "soundness": "2;2;3;3;4", "contribution": "3;2;2;3;4", "presentation": "3;3;3;3;4", "wc_summary": "66;64;34;40;49", "wc_strengths": "56;40;18;33;27", "wc_weaknesses": "117;68;108;182;36", "wc_questions": "127;40;4;2;90", "wc_review": "366;212;164;257;202", "wc_reply_reviewers": "0;0;143;0;4", "wc_reply_authors": "682;680;614;681;299", "reply_reviewers": "0;0;1;0;1", "reply_authors": "1;1;2;1;1", "rating_avg": [ 7.2, 1.6 ], "confidence_avg": [ 3.6, 0.4898979485566356 ], "soundness_avg": [ 2.8, 0.7483314773547882 ], "contribution_avg": [ 2.8, 0.7483314773547882 ], "presentation_avg": [ 3.2, 0.39999999999999997 ], "wc_summary_avg": [ 50.6, 12.705904139414873 ], "wc_strengths_avg": [ 34.8, 12.82809416865966 ], "wc_weaknesses_avg": [ 102.2, 49.34126062434968 ], "wc_questions_avg": [ 52.6, 49.02081190678098 ], "wc_review_avg": [ 240.2, 69.52524721279313 ], "wc_reply_reviewers_avg": [ 29.4, 56.82112283297471 ], "wc_reply_authors_avg": [ 591.2, 148.38787012421196 ], "reply_reviewers_avg": [ 0.4, 0.48989794855663565 ], "reply_authors_avg": [ 1.2, 0.4 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.6123724356957946, "gs_citation": 4, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=17450486356494803188&as_sdt=5,47&sciodt=0,47&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=AU2gS9ut61", "pdf": "https://openreview.net/pdf?id=AU2gS9ut61", "email": ";pku.edu.cn;bjtu.edu.cn;pku.edu.cn;pku.edu.cn;ucas.edu.cn", "author_num": 6, "aff_unique_index": "0;1;0;0;2", "aff_unique_norm": "Peking University;Beijing Jiao Tong 
University;University of Chinese Academy of Sciences", "aff_unique_dep": ";;", "aff_unique_url": "http://www.pku.edu.cn;http://www.njtu.edu.cn/en;http://www.ucas.ac.cn", "aff_unique_abbr": "Peking U;BJTU;UCAS", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "China" }, { "id": "AVBw2Ul4X9", "title": "Towards Precise Prediction Uncertainty in GNNs: Refining GNNs with Topology-grouping Strategy", "track": "main", "status": "Reject", "tldr": "", "abstract": "The calibration of model predictions has recently gained increasing attention in the domain of graph neural networks (GNNs), with a particular emphasis on the underconfidence exhibited by these networks. Among the critical factors identified to be associated with GNN calibration, the concept of neighborhood prediction similarity has been recognized as a pivotal component. Building upon this insight, modern GNN calibration techniques adapt GNNs by smoothing the confidence of individual nodes with those of adjacent nodes. However, these approaches often engage in superficial learning across varying affinity levels, thereby failing to effectively accommodate diverse local topologies. Through an in-depth analysis, we unveil that calibrated logits from preceding research significantly contradict their foundational assumption of nearby affinity, necessitating a re-evaluation of the existing GNN-founded calibration strategies. To address this, we introduce Simi-Mailbox, which categorizes nodes based on both neighborhood representational similarity and their own confidence, irrespective of proximity or connectivity. Our method effectively mitigates miscalibration for nodes exhibiting analogous similarity levels by adjusting their predictions with group-specific temperatures. This encourages a more sophisticated calibration, where each group-wise temperature is tailored to address affiliated nodes with similar topology. 
Extensive experiments demonstrate the effectiveness of Simi-Mailbox across diverse datasets on different GNN architectures.", "keywords": "Graph Neural Networks;Post-hoc Calibration", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/532ff41721a330d7a6ff13286c6cc462d3ac895f.zip", "author": "Hyunjin Seo;Kyusung Seo;Joonhyung Park;Eunho Yang", "authorids": "~Hyunjin_Seo2;~Kyusung_Seo1;~Joonhyung_Park1;~Eunho_Yang1", "gender": "F;M;M;M", "homepage": "https://github.com/hyunjin72;;;https://sites.google.com/site/hleehome2/", "dblp": ";;306/1374;96/2621", "google_scholar": "MFDOhRUAAAAJ;;https://scholar.google.com/citations?hl=ko;", "orcid": ";;;", "linkedin": "hyunjin-seo-97525629a/?originalSubdomain=kr;kyusung-seo-513137172/;joonhyung-park-495527145/;", "or_profile": "~Hyunjin_Seo2;~Kyusung_Seo1;~Joonhyung_Park1;~Eunho_Yang1", "aff": "Korea Advanced Institute of Science & Technology;Korea Advanced Institute of Science & Technology;Korea Advanced Institute of Science & Technology;Korea Advanced Institute of Science & Technology", "aff_domain": "kaist.ac.kr;kaist.ac.kr;kaist.ac.kr;kaist.ac.kr", "position": "MS student;MS student;PhD student;Associate Professor", "bibtex": "@misc{\nseo2024towards,\ntitle={Towards Precise Prediction Uncertainty in {GNN}s: Refining {GNN}s with Topology-grouping Strategy},\nauthor={Hyunjin Seo and Kyusung Seo and Joonhyung Park and Eunho Yang},\nyear={2024},\nurl={https://openreview.net/forum?id=AVBw2Ul4X9}\n}", "github": "", "project": "", "reviewers": "75Vm;jzwr;3Tgz", "site": "https://openreview.net/forum?id=AVBw2Ul4X9", "pdf_size": 16214180, "rating": "6;6;6", "confidence": "5;3;2", "soundness": "3;3;3", "contribution": "2;2;2", "presentation": "3;3;3", "wc_summary": "74;88;56", "wc_strengths": "67;38;54", "wc_weaknesses": "244;200;60", "wc_questions": "8;31;73", "wc_review": "393;357;243", "wc_reply_reviewers": "142;82;57", "wc_reply_authors": "1427;2097;1193", "reply_reviewers": "1;2;1", "reply_authors": "4;8;5", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 3.3333333333333335, 1.247219128924647 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 72.66666666666667, 13.097921802925667 ], "wc_strengths_avg": [ 53.0, 11.86029791643813 ], "wc_weaknesses_avg": [ 168.0, 78.45168364456347 ], "wc_questions_avg": [ 37.333333333333336, 26.911377189252544 ], "wc_review_avg": [ 331.0, 63.93746945258312 ], "wc_reply_reviewers_avg": [ 93.66666666666667, 35.6682242650545 ], "wc_reply_authors_avg": [ 1572.3333333333333, 383.09731864835015 ], "reply_reviewers_avg": [ 1.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 5.666666666666667, 1.699673171197595 ], "replies_avg": [ 27, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:YQssGAScMasJ:scholar.google.com/&scioq=Towards+Precise+Prediction+Uncertainty+in+GNNs:+Refining+GNNs+with+Topology-grouping+Strategy&hl=en&as_sdt=0,5", "gs_version_total": 3, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "Korea Advanced Institute of Science and Technology", "aff_unique_dep": "", "aff_unique_url": "https://www.kaist.ac.kr", "aff_unique_abbr": "KAIST", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "South Korea" }, { "title": "M3C: A Framework towards Convergent, Flexible, and Unsupervised Learning of Mixture Graph 
Matching and Clustering", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19259", "id": "AXC9KydyZq", "author_site": "Jiaxin Lu, Zetian Jiang, Tianzhe Wang, Junchi Yan", "tldr": "", "abstract": "Existing graph matching methods typically assume that there are similar structures between graphs and they are matchable. This work addresses a more realistic scenario where graphs exhibit diverse modes, requiring graph grouping before or along with matching, a task termed mixture graph matching and clustering. Specifically, we introduce Minorize-Maximization Matching and Clustering (M3C), a learning-free algorithm that guarantees theoretical convergence through the Minorize-Maximization framework and offers enhanced flexibility via relaxed clustering. Building on M3C, we further develop UM3C, an unsupervised model that incorporates novel edge-wise affinity learning and pseudo label selection. Extensive experimental results on public benchmarks demonstrate that our method outperforms state-of-the-art graph matching and mixture graph matching and clustering approaches in both accuracy and efficiency.", "keywords": "Graph Matching; Joint Optimization; Unsupervised Learning", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Jiaxin Lu;Zetian Jiang;Tianzhe Wang;Junchi Yan", "authorids": "~Jiaxin_Lu1;~Zetian_Jiang1;~Tianzhe_Wang1;~Junchi_Yan2", "gender": "F;M;M;M", "homepage": "https://jiaxin-lu.github.io/;http://thinklab.sjtu.edu.cn/member.html;https://sites.google.com/view/tianzhe-wang/home;http://thinklab.sjtu.edu.cn/", "dblp": ";;243/6770;60/7949.html", "google_scholar": "VWTpWhEAAAAJ;;;ga230VoAAAAJ", "orcid": "0009-0004-4485-9615;;;0000-0001-9639-7679", "linkedin": "jiaxin-lu-9a422127a/;;;", "or_profile": "~Jiaxin_Lu1;~Zetian_Jiang1;~Tianzhe_Wang1;~Junchi_Yan1", "aff": "University of Texas at Austin;Shanghai Jiaotong University;Georgia Institute of Technology;Shanghai Jiaotong University", "aff_domain": "utexas.edu;sjtu.edu.cn;gatech.edu;sjtu.edu.cn", "position": "PhD student;PhD student;PhD student;Full Professor", "bibtex": "@inproceedings{\nlu2024mc,\ntitle={M3C: A Framework towards Convergent, Flexible, and Unsupervised Learning of Mixture Graph Matching and Clustering},\nauthor={Jiaxin Lu and Zetian Jiang and Tianzhe Wang and Junchi Yan},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=AXC9KydyZq}\n}", "github": "", "project": "", "reviewers": "euAu;uZV9;ra71;sBU3", "pdf_size": 11516658, "rating": "6;6;8;8", "confidence": "4;3;5;3", "soundness": "2;3;3;3", "contribution": "2;3;3;3", "presentation": "1;2;4;3", "wc_summary": "47;145;48;91", "wc_strengths": "28;72;54;49", "wc_weaknesses": "49;265;192;31", "wc_questions": "310;183;127;70", "wc_review": "434;665;421;241", "wc_reply_reviewers": "47;48;70;0", "wc_reply_authors": "1291;930;1123;685", "reply_reviewers": "1;1;1;0", "reply_authors": "3;2;2;1", "rating_avg": [ 7.0, 1.0 ], "confidence_avg": [ 3.75, 0.82915619758885 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 2.5, 1.118033988749895 ], "wc_summary_avg": [ 82.75, 40.08974307725107 ], "wc_strengths_avg": [ 50.75, 15.674421839417235 ], "wc_weaknesses_avg": [ 134.25, 97.926949814645 ], "wc_questions_avg": [ 172.5, 88.87209910877542 ], "wc_review_avg": [ 440.25, 150.51806370000912 ], "wc_reply_reviewers_avg": [ 
41.25, 25.52817071393875 ], "wc_reply_authors_avg": [ 1007.25, 225.67939095096833 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 2.0, 0.7071067811865476 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.30151134457776363, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6076462582348668008&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=AXC9KydyZq", "pdf": "https://openreview.net/pdf?id=AXC9KydyZq", "email": "utexas.edu;sjtu.edu.cn;gatech.edu;sjtu.edu.cn", "author_num": 4, "aff_unique_index": "0;1;2;1", "aff_unique_norm": "University of Texas at Austin;Shanghai Jiao Tong University;Georgia Institute of Technology", "aff_unique_dep": ";;", "aff_unique_url": "https://www.utexas.edu;https://www.sjtu.edu.cn;https://www.gatech.edu", "aff_unique_abbr": "UT Austin;SJTU;Georgia Tech", "aff_campus_unique_index": "0", "aff_campus_unique": "Austin;", "aff_country_unique_index": "0;1;0;1", "aff_country_unique": "United States;China" }, { "title": "Protein-ligand binding representation learning from fine-grained interactions", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19258", "id": "AXbN2qMNiW", "author_site": "Shikun Feng, Minghao Li, Yinjun JIA, Wei-Ying Ma, Yanyan Lan", "tldr": "", "abstract": "The binding between proteins and ligands plays a crucial role in the realm of drug discovery. Previous deep learning approaches have shown promising results over traditional computationally intensive methods, but resulting in poor generalization due to limited supervised data. In this paper, we propose to learn protein-ligand binding representation in a self-supervised learning manner. Different from existing pre-training approaches which treat proteins and ligands individually, we emphasize to discern the intricate binding patterns from fine-grained interactions. Specifically, this self-supervised learning problem is formulated as a prediction of the conclusive binding complex structure given a pocket and ligand with a Transformer based interaction module, which naturally emulates the binding process. To ensure the representation of rich binding information, we introduce two pre-training tasks, i.e. atomic pairwise distance map prediction and mask ligand reconstruction, which comprehensively model the fine-grained interactions from both structure and feature space. 
Extensive experiments have demonstrated the superiority of our method across various binding tasks, including protein-ligand affinity prediction, virtual screening and protein-ligand docking.", "keywords": "Protein-ligand binding;representation learning;self-supervised", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Shikun Feng;Minghao Li;Yinjun Jia;Wei-Ying Ma;Yanyan Lan", "authorids": "~Shikun_Feng3;~Minghao_Li8;~Yinjun_Jia1;~Wei-Ying_Ma2;~Yanyan_Lan2", "gender": "M;M;M;;M", "homepage": "https://fengshikun.github.io;https://github.com/limh1317;https://air.tsinghua.edu.cn/en/info/1046/1189.htm;;https://github.com/EBGU", "dblp": ";;m/WYMa.html;00/6040.html;", "google_scholar": ";;SToCbu8AAAAJ;;", "orcid": ";;;;", "linkedin": ";;wei-ying-ma-16a0171/;;", "or_profile": "~Shikun_Feng3;~Minghao_Li8;~Wei-Ying_Ma2;~Yanyan_Lan2;~Yinjun_Harold_Jia1", "aff": "Tsinghua University;University of Chinese Academy of Sciences;Tsinghua University;Tsinghua University;Tsinghua University", "aff_domain": "tsinghua.edu.cn;ucas.ac.cn;tsinghua.edu.cn;tsinghua.edu.cn;mails.tsinghua.edu.cn", "position": "PhD student;MS student;Full Professor;Full Professor;PhD student", "bibtex": "@inproceedings{\nfeng2024proteinligand,\ntitle={Protein-ligand binding representation learning from fine-grained interactions},\nauthor={Shikun Feng and Minghao Li and Yinjun Jia and Wei-Ying Ma and Yanyan Lan},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=AXbN2qMNiW}\n}", "github": "", "project": "", "reviewers": "kw5e;7LCi;PEGf", "pdf_size": 3069624, "rating": "5;6;6", "confidence": "4;5;3", "soundness": "2;3;2", "contribution": "2;3;2", "presentation": "2;4;1", "wc_summary": "110;190;41", "wc_strengths": "24;96;21", "wc_weaknesses": "136;187;120", "wc_questions": "80;86;39", "wc_review": "350;559;221", "wc_reply_reviewers": "109;92;14", "wc_reply_authors": "2186;1882;2277", "reply_reviewers": "1;1;1", "reply_authors": "8;7;7", "rating_avg": [ 5.666666666666667, 0.4714045207910317 ], "confidence_avg": [ 4.0, 0.816496580927726 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.3333333333333335, 1.247219128924647 ], "wc_summary_avg": [ 113.66666666666667, 60.88422528774501 ], "wc_strengths_avg": [ 47.0, 34.66987164671943 ], "wc_weaknesses_avg": [ 147.66666666666666, 28.56960311628816 ], "wc_questions_avg": [ 68.33333333333333, 20.885933597094056 ], "wc_review_avg": [ 376.6666666666667, 139.27032067968474 ], "wc_reply_reviewers_avg": [ 71.66666666666667, 41.362892656206824 ], "wc_reply_authors_avg": [ 2115.0, 168.89247072225177 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 7.333333333333333, 0.4714045207910317 ], "replies_avg": [ 30, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 11, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10146790950636761999&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=AXbN2qMNiW", "pdf": "https://openreview.net/pdf?id=AXbN2qMNiW", "email": "tsinghua.edu.cn;ucas.ac.cn;tsinghua.edu.cn;tsinghua.edu.cn;mails.tsinghua.edu.cn", "author_num": 5, "aff_unique_index": "0;1;0;0;0", "aff_unique_norm": "Tsinghua University;University of Chinese Academy of Sciences", "aff_unique_dep": ";", "aff_unique_url": 
"https://www.tsinghua.edu.cn;http://www.ucas.ac.cn", "aff_unique_abbr": "THU;UCAS", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "China" }, { "title": "Unleashing the Power of Pre-trained Language Models for Offline Reinforcement Learning", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19257", "id": "AY6aM13gGF", "author_site": "Ruizhe Shi, Yuyao Liu, Yanjie Ze, Simon Du, Huazhe Xu", "tldr": "", "abstract": "Offline reinforcement learning (RL) aims to find a near-optimal policy using pre-collected datasets. Given recent advances in Large Language Models (LLMs) and their few-shot learning prowess, this paper introduces $\\textbf{La}$nguage Models for $\\textbf{Mo}$tion Control ($\\textbf{LaMo}$), a general framework based on Decision Transformers to effectively use pre-trained Language Models (LMs) for offline RL. Our framework highlights four crucial components: (1) Initializing Decision Transformers with sequentially pre-trained LMs, (2) employing the LoRA fine-tuning method, in contrast to full-weight fine-tuning, to combine the pre-trained knowledge from LMs and in-domain knowledge effectively, (3) using the non-linear MLP transformation instead of linear projections, to generate embeddings, and (4) integrating an auxiliary language prediction loss during fine-tuning to stabilize the LMs and retain their original abilities on languages. Empirical results indicate $\\textbf{LaMo}$ achieves state-of-the-art performance in sparse-reward tasks and closes the gap between value-based offline RL methods and decision transformers in dense-reward tasks. In particular, our method demonstrates superior performance in scenarios with limited data samples.", "keywords": "Offline Reinforcement Learning;Decision Transformer;Motion Control", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/a32db095adf9241993ade6a962055977b99c0bcb.pdf", "author": "Ruizhe Shi;Yuyao Liu;Yanjie Ze;Simon Shaolei Du;Huazhe Xu", "authorids": "~Ruizhe_Shi1;~Yuyao_Liu1;~Yanjie_Ze1;~Simon_Shaolei_Du1;~Huazhe_Xu1", "gender": "M;M;M;M;M", "homepage": "http://srzer.github.io;;http://yanjieze.com;http://simonshaoleidu.com;http://hxu.rocks", "dblp": "304/0634.html;;312/5407;176/5602;164/9006", "google_scholar": "0tlXSPkAAAAJ;https://scholar.google.com/citations?hl=en;BO_b2O8AAAAJ;OttawxUAAAAJ;t9HPFawAAAAJ", "orcid": ";;;;", "linkedin": ";;yanjie-ze-a71a0a247/;;", "or_profile": "~Ruizhe_Shi1;~Yuyao_Liu1;~Yanjie_Ze1;~Simon_Shaolei_Du1;~Huazhe_Xu1", "aff": "University of Washington;Massachusetts Institute of Technology;Stanford University;University of Washington;Tsinghua University", "aff_domain": "uw.edu;mit.edu;stanford.edu;washington.edu;tsinghua.edu.cn", "position": "Intern;Visiting Student;PhD student;Assistant Professor;Assistant Professor", "bibtex": "@inproceedings{\nshi2024unleashing,\ntitle={Unleashing the Power of Pre-trained Language Models for Offline Reinforcement Learning},\nauthor={Ruizhe Shi and Yuyao Liu and Yanjie Ze and Simon Shaolei Du and Huazhe Xu},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=AY6aM13gGF}\n}", "github": "", "project": "", "reviewers": "mYMk;ei7j;1Dwk;GHKm", "pdf_size": 1915431, "rating": "5;6;6;8", "confidence": "4;4;4;4", "soundness": "3;3;3;3", "contribution": "2;2;2;3", "presentation": "4;3;3;4", "wc_summary": "96;101;88;107", "wc_strengths": "142;113;58;205", 
"wc_weaknesses": "128;43;212;560", "wc_questions": "16;104;42;199", "wc_review": "382;361;400;1071", "wc_reply_reviewers": "0;17;62;420", "wc_reply_authors": "1065;520;862;2283", "reply_reviewers": "0;1;1;2", "reply_authors": "3;1;2;6", "rating_avg": [ 6.25, 1.0897247358851685 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 3.5, 0.5 ], "wc_summary_avg": [ 98.0, 6.96419413859206 ], "wc_strengths_avg": [ 129.5, 53.011791141216875 ], "wc_weaknesses_avg": [ 235.75, 196.51001882855743 ], "wc_questions_avg": [ 90.25, 70.45699042678449 ], "wc_review_avg": [ 553.5, 299.0973921651608 ], "wc_reply_reviewers_avg": [ 124.75, 171.96129651755945 ], "wc_reply_authors_avg": [ 1182.5, 664.5549262476353 ], "reply_reviewers_avg": [ 1.0, 0.7071067811865476 ], "reply_authors_avg": [ 3.0, 1.8708286933869707 ], "replies_avg": [ 23, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 27, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=8269125061704282950&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=AY6aM13gGF", "pdf": "https://openreview.net/pdf?id=AY6aM13gGF", "email": "uw.edu;mit.edu;stanford.edu;washington.edu;tsinghua.edu.cn", "author_num": 5, "aff_unique_index": "0;1;2;0;3", "aff_unique_norm": "University of Washington;Massachusetts Institute of Technology;Stanford University;Tsinghua University", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.washington.edu;https://web.mit.edu;https://www.stanford.edu;https://www.tsinghua.edu.cn", "aff_unique_abbr": "UW;MIT;Stanford;THU", "aff_campus_unique_index": "1", "aff_campus_unique": ";Stanford", "aff_country_unique_index": "0;0;0;0;1", "aff_country_unique": "United States;China" }, { "title": "Adaptive Regret for Bandits Made Possible: Two Queries Suffice", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19256", "id": "AY9KyTGcnk", "author_site": "Zhou Lu, Qiuyi (Richard) Zhang, Xinyi Chen, Fred Zhang, David Woodruff, Elad Hazan", "tldr": "", "abstract": "Fast changing states or volatile environments pose a significant challenge to online optimization, which needs to perform rapid adaptation under limited observation. In this paper, we give query and regret optimal bandit algorithms under the strict notion of strongly adaptive regret, which measures the maximum regret over any contiguous interval $I$. Due to its worst-case nature, there is an almost-linear $\\Omega(|I|^{1-\\epsilon})$ regret lower bound, when only one query per round is allowed [Daniely el al, ICML 2015]. Surprisingly, with just two queries per round, we give Strongly Adaptive Bandit Learner (StABL) that achieves $\\widetilde{O}(\\sqrt{n|I|})$ adaptive regret for multi-armed bandits with $n$ arms. The bound is tight and cannot be improved in general. Our algorithm leverages a multiplicative update scheme of varying stepsizes and a carefully chosen observation distribution to control the variance. Furthermore, we extend our results and provide optimal algorithms in the bandit convex optimization setting. 
Finally, we empirically demonstrate the superior performance of our algorithms under volatile environments and for downstream tasks, such as algorithm selection for hyperparameter optimization.", "keywords": "adaptive regret;multi arm bandit", "primary_area": "learning theory", "supplementary_material": "/attachment/3056c93ece1d7c6cad8ccff9309bc32f2935e068.pdf", "author": "Zhou Lu;Qiuyi Zhang;Xinyi Chen;Fred Zhang;David Woodruff;Elad Hazan", "authorids": "~Zhou_Lu1;~Qiuyi_Zhang1;~Xinyi_Chen1;~Fred_Zhang1;~David_Woodruff1;~Elad_Hazan1", "gender": ";M;F;M;M;M", "homepage": "https://leozoroaster.github.io/;https://qiuyiz.github.io;;http://fredzhang.me/;http://www.cs.cmu.edu/~dwoodruf/;https://www.ehazan.com", "dblp": "68/11524;133/8559;84/6214;232/9071;w/DPWoodruff;72/739", "google_scholar": "17_nX_kAAAAJ;mE11hO8AAAAJ;;guJ_kBQAAAAJ;https://scholar.google.com.tw/citations?user=0G2t-6sAAAAJ;LnhCGNMAAAAJ", "orcid": ";;;;;", "linkedin": ";;;fred-zhang-0/;;", "or_profile": "~Zhou_Lu1;~Qiuyi_Zhang1;~Xinyi_Chen1;~Fred_Zhang1;~David_Woodruff1;~Elad_Hazan1", "aff": ";Google;Google DeepMind;University of California, Berkeley;Carnegie Mellon University;Princeton University", "aff_domain": ";google.com;google.com;berkeley.edu;cmu.edu;princeton.edu", "position": ";Researcher;Researcher;PhD student;Full Professor;Full Professor", "bibtex": "@inproceedings{\nlu2024adaptive,\ntitle={Adaptive Regret for Bandits Made Possible: Two Queries Suffice},\nauthor={Zhou Lu and Qiuyi Zhang and Xinyi Chen and Fred Zhang and David Woodruff and Elad Hazan},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=AY9KyTGcnk}\n}", "github": "", "project": "", "reviewers": "gNKg;EXm4;kZqs;wKMs", "pdf_size": 723821, "rating": "5;8;8;8", "confidence": "5;4;3;3", "soundness": "3;3;3;3", "contribution": "2;3;3;3", "presentation": "3;2;4;3", "wc_summary": "91;143;73;357", "wc_strengths": "90;173;24;180", "wc_weaknesses": "172;339;229;103", "wc_questions": "63;1;2;139", "wc_review": "416;656;328;779", "wc_reply_reviewers": "11;0;4;0", "wc_reply_authors": "406;38;376;233", "reply_reviewers": "1;0;1;0", "reply_authors": "1;1;1;2", "rating_avg": [ 7.25, 1.299038105676658 ], "confidence_avg": [ 3.75, 0.82915619758885 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 166.0, 113.22985472038724 ], "wc_strengths_avg": [ 116.75, 64.19258134706845 ], "wc_weaknesses_avg": [ 210.75, 86.447599735331 ], "wc_questions_avg": [ 51.25, 56.543677807514435 ], "wc_review_avg": [ 544.75, 180.83607908821736 ], "wc_reply_reviewers_avg": [ 3.75, 4.493050188902857 ], "wc_reply_authors_avg": [ 263.25, 145.55304016062323 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.8703882797784892, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:qF043ycUjHEJ:scholar.google.com/&scioq=Adaptive+Regret+for+Bandits+Made+Possible:+Two+Queries+Suffice&hl=en&as_sdt=0,33", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=AY9KyTGcnk", "pdf": "https://openreview.net/pdf?id=AY9KyTGcnk", "email": ";google.com;google.com;berkeley.edu;cmu.edu;princeton.edu", "author_num": 6, "aff_unique_index": "0;0;1;2;3", "aff_unique_norm": "Google;University of California, Berkeley;Carnegie Mellon University;Princeton University", 
"aff_unique_dep": "Google;;;", "aff_unique_url": "https://www.google.com;https://www.berkeley.edu;https://www.cmu.edu;https://www.princeton.edu", "aff_unique_abbr": "Google;UC Berkeley;CMU;Princeton", "aff_campus_unique_index": "0;2", "aff_campus_unique": "Mountain View;;Berkeley", "aff_country_unique_index": "0;1;0;0;0", "aff_country_unique": "United States;United Kingdom" }, { "title": "Towards Cross Domain Generalization of Hamiltonian Representation via Meta Learning", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19255", "id": "AZGIwqCyYY", "author_site": "Yeongwoo Song, Hawoong Jeong", "tldr": "", "abstract": "Recent advances in deep learning for physics have focused on discovering shared representations of target systems by incorporating physics priors or inductive biases into neural networks. While effective, these methods are limited to the system domain, where the type of system remains consistent and thus cannot ensure the adaptation to new, or unseen physical systems governed by different laws. For instance, a neural network trained on a mass-spring system cannot guarantee accurate predictions for the behavior of a two-body system or any other system with different physical laws.\nIn this work, we take a significant leap forward by targeting cross domain generalization within the field of Hamiltonian dynamics. \nWe model our system with a graph neural network (GNN) and employ a meta learning algorithm to enable the model to gain experience over a distribution of systems and make it adapt to new physics. Our approach aims to learn a unified Hamiltonian representation that is generalizable across multiple system domains, thereby overcoming the limitations of system-specific models. \nWe demonstrate that the meta-trained model captures the generalized Hamiltonian representation that is consistent across different physical domains.\nOverall, through the use of meta learning, we offer a framework that achieves cross domain generalization, providing a step towards a unified model for understanding a wide array of dynamical systems via deep learning.", "keywords": "hamiltonian dynamics;cross domain generalization;learning physics;meta learning", "primary_area": "applications to physical sciences (physics, chemistry, biology, etc.)", "supplementary_material": "/attachment/13c5178c183aa265ef6bcfdad34ad2fea13afaa0.zip", "author": "Yeongwoo Song;Hawoong Jeong", "authorids": "~Yeongwoo_Song1;~Hawoong_Jeong1", "gender": "M;M", "homepage": "https://ywssng.github.io/;", "dblp": "335/1745;07/3681", "google_scholar": "https://scholar.google.com/citations?hl=ko;", "orcid": ";", "linkedin": ";", "or_profile": "~Yeongwoo_Song1;~Hawoong_Jeong1", "aff": "Korea Advanced Institute of Science & Technology;Korea Advanced Institute of Science & Technology", "aff_domain": "kaist.edu;kaist.edu", "position": "PhD student;Full Professor", "bibtex": "@inproceedings{\nsong2024towards,\ntitle={Towards Cross Domain Generalization of Hamiltonian Representation via Meta Learning},\nauthor={Yeongwoo Song and Hawoong Jeong},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=AZGIwqCyYY}\n}", "github": "", "project": "", "reviewers": "GtBu;xLig;jozM;hDu2", "pdf_size": 6274027, "rating": "5;6;6;6", "confidence": "3;2;3;4", "soundness": "2;3;2;3", "contribution": "2;3;3;3", "presentation": "3;3;3;3", "wc_summary": "68;71;71;70", "wc_strengths": "118;61;34;70", "wc_weaknesses": "246;31;174;140", 
"wc_questions": "85;33;35;5", "wc_review": "517;196;314;285", "wc_reply_reviewers": "41;15;30;349", "wc_reply_authors": "725;368;414;1218", "reply_reviewers": "1;1;1;2", "reply_authors": "3;2;2;3", "rating_avg": [ 5.75, 0.4330127018922193 ], "confidence_avg": [ 3.0, 0.7071067811865476 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 70.0, 1.224744871391589 ], "wc_strengths_avg": [ 70.75, 30.326349928733592 ], "wc_weaknesses_avg": [ 147.75, 77.51249899209805 ], "wc_questions_avg": [ 39.5, 28.822734082664677 ], "wc_review_avg": [ 328.0, 117.4627600561131 ], "wc_reply_reviewers_avg": [ 108.75, 139.01506213356882 ], "wc_reply_authors_avg": [ 681.25, 338.9552883493633 ], "reply_reviewers_avg": [ 1.25, 0.4330127018922193 ], "reply_authors_avg": [ 2.5, 0.5 ], "replies_avg": [ 24, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11513760535408203006&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=AZGIwqCyYY", "pdf": "https://openreview.net/pdf?id=AZGIwqCyYY", "email": "kaist.edu;kaist.edu", "author_num": 2, "aff_unique_index": "0;0", "aff_unique_norm": "Korea Advanced Institute of Science and Technology", "aff_unique_dep": "", "aff_unique_url": "https://www.kaist.ac.kr", "aff_unique_abbr": "KAIST", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "South Korea" }, { "id": "AZVmYg3LvS", "title": "Improved Function Space Variational Inference with Informative Priors", "track": "main", "status": "Reject", "tldr": "", "abstract": "Function space variational inference allows Bayesian neural network (BNN) to introduce the prior distribution on the function space directly. Moreover, Recent linear approximation scheme for KL divergence between two random functions, has presented the tractable training objective and thus facilitates imposing the function space prior on BNNs. On the other hand, despite of its tractability, the existing inference suffers from the interpretability issue because the this function space prior is obtained by mapping the pre-defined weight-space prior to the function output via the complex neural network, and thus seems to be less interpretable. Alternatively, thought the uniform function space prior, that imposes a zero mean prior on the function space to encourage the model to be uncertain for out-of-training set, has been considered, this prior can introduce unnecessary uncertainty into the function outputs of the training datasets. Thus, this can cause the trade-off between the uncertainty estimation performances on the in-training and out-of-training sets.\n\n\nIn this work, we aim at refining the function space variational inference to handle the mentioned issue. To this end, we first reconsider the role of the function space prior in view of Bayesian Model prediction, and then build the function space prior to help improve the uncertainty estimation of the BNNs. 
Additionally, we propose a refined variational distribution on function space to encourage the useful predictive functions in sense of Bayesian model averaging, to be sampled, and thus improving the prediction of the BNNs.", "keywords": "Bayesian Neural Network;Function space variational inference", "primary_area": "probabilistic methods (Bayesian methods, variational inference, sampling, UQ, etc.)", "supplementary_material": "", "author": "Yohan Jung;Juho Lee", "authorids": "~Yohan_Jung1;~Juho_Lee2", "gender": "M;M", "homepage": "https://e2ee22.github.io/;https://juho.lee.github.io", "dblp": "256/1530;55/3410-1", "google_scholar": "https://scholar.google.co.kr/citations?user=DwAJS14AAAAJ;Py4URJUAAAAJ", "orcid": ";", "linkedin": ";", "or_profile": "~Yohan_Jung1;~Juho_Lee2", "aff": "Korea Advanced Institute of Science & Technology;Korea Advanced Institute of Science & Technology", "aff_domain": "kaist.ac.kr;kaist.ac.kr", "position": "Postdoc;Associate Professor", "bibtex": "@misc{\njung2024improved,\ntitle={Improved Function Space Variational Inference with Informative Priors},\nauthor={Yohan Jung and Juho Lee},\nyear={2024},\nurl={https://openreview.net/forum?id=AZVmYg3LvS}\n}", "github": "", "project": "", "reviewers": "hyeW;3j4p;QnS6;1KC1", "site": "https://openreview.net/forum?id=AZVmYg3LvS", "pdf_size": 1307371, "rating": "3;3;6;6", "confidence": "4;3;3;3", "soundness": "1;1;3;3", "contribution": "1;2;3;2", "presentation": "1;2;3;2", "wc_summary": "29;146;67;105", "wc_strengths": "32;73;23;117", "wc_weaknesses": "419;279;116;290", "wc_questions": "12;98;4;492", "wc_review": "492;596;210;1004", "wc_reply_reviewers": "0;38;100;269", "wc_reply_authors": "702;843;421;639", "reply_reviewers": "0;1;1;1", "reply_authors": "2;3;2;2", "rating_avg": [ 4.5, 1.5 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 2.0, 1.0 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 2.0, 0.7071067811865476 ], "wc_summary_avg": [ 86.75, 43.49928160326329 ], "wc_strengths_avg": [ 61.25, 37.298625980054545 ], "wc_weaknesses_avg": [ 276.0, 107.53371564304844 ], "wc_questions_avg": [ 151.5, 200.01187464748187 ], "wc_review_avg": [ 575.5, 284.8661966608183 ], "wc_reply_reviewers_avg": [ 101.75, 102.94749875543359 ], "wc_reply_authors_avg": [ 651.25, 152.07625554306628 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 2.25, 0.4330127018922193 ], "replies_avg": [ 25, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.5773502691896258, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:LrZndIaURf0J:scholar.google.com/&scioq=Improved+Function+Space+Variational+Inference+with+Informative+Priors&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "Korea Advanced Institute of Science and Technology", "aff_unique_dep": "", "aff_unique_url": "https://www.kaist.ac.kr", "aff_unique_abbr": "KAIST", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "South Korea" }, { "title": "Enhancing Instance-Level Image Classification with Set-Level Labels", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19254", "id": "AZW3qlCGTe", "author_site": "Renyu Zhang, Aly Khan, Yuxin Chen, Robert Grossman", "tldr": "", "abstract": "Instance-level image classification tasks have traditionally relied on single-instance labels to train models, e.g., few-shot learning and transfer learning. 
However, set-level coarse-grained labels that capture relationships among instances can provide richer information in real-world scenarios. In this paper, we present a novel approach to enhance instance-level image classification by leveraging set-level labels. We provide a theoretical analysis of the proposed method, including recognition conditions for fast excess risk rate, shedding light on the theoretical foundations of our approach. We conducted experiments on two distinct categories of datasets: natural image datasets and histopathology image datasets. Our experimental results demonstrate the effectiveness of our approach, showcasing improved classification performance compared to traditional single-instance label-based methods. Notably, our algorithm achieves 13\\% improvement in classification accuracy compared to the strongest baseline on the histopathology image classification benchmarks. Importantly, our experimental findings align with the theoretical analysis, reinforcing the robustness and reliability of our proposed method. This work bridges the gap between instance-level and set-level image classification, offering a promising avenue for advancing the capabilities of image classification models with set-level coarse-grained labels.", "keywords": "set-level labels;fast excess risk rate;representation learning;few-shot learning", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/6da5ddfffa12a56a47e07353ad6df009d1936ab5.pdf", "author": "Renyu Zhang;Aly A Khan;Yuxin Chen;Robert L. Grossman", "authorids": "~Renyu_Zhang2;~Aly_A_Khan1;~Yuxin_Chen1;~Robert_L._Grossman2", "gender": "M;;;M", "homepage": "https://zhangrenyuuchicago.github.io/;http://ttic.uchicago.edu/~aakhan/;http://yuxinchen.org/;https://rgrossman.com", "dblp": "152/4749;46/2390;11/5123-1;g/RobertLGrossman.html", "google_scholar": "-4Hr3l0AAAAJ;xIVBCnEAAAAJ;-k1N7HAAAAAJ;3KG8arsAAAAJ", "orcid": ";0000-0003-3933-8538;;0000-0003-3741-5739", "linkedin": ";;;robertgrossman/", "or_profile": "~Renyu_Zhang2;~Aly_A_Khan1;~Yuxin_Chen1;~Robert_L._Grossman2", "aff": "Department of Computer Science, University of Chicago;Toyota Technological Institute at Chicago;University of Chicago;University of Chicago", "aff_domain": "cs.uchicago.edu;ttic.edu;uchicago.edu;uchicago.edu", "position": "PhD student;Courtesy Faculty;Assistant Professor;Full Professor", "bibtex": "@inproceedings{\nzhang2024enhancing,\ntitle={Enhancing Instance-Level Image Classification with Set-Level Labels},\nauthor={Renyu Zhang and Aly A Khan and Yuxin Chen and Robert L. 
Grossman},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=AZW3qlCGTe}\n}", "github": "", "project": "", "reviewers": "jPxq;xN2u;4JEd", "pdf_size": 41441022, "rating": "5;6;6", "confidence": "4;3;3", "soundness": "3;3;3", "contribution": "2;3;3", "presentation": "3;2;2", "wc_summary": "87;70;76", "wc_strengths": "138;21;24", "wc_weaknesses": "223;92;49", "wc_questions": "69;35;154", "wc_review": "517;218;303", "wc_reply_reviewers": "0;77;0", "wc_reply_authors": "2347;1010;1979", "reply_reviewers": "0;1;0", "reply_authors": "5;3;4", "rating_avg": [ 5.666666666666667, 0.4714045207910317 ], "confidence_avg": [ 3.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 77.66666666666667, 7.039570693980959 ], "wc_strengths_avg": [ 61.0, 54.46099521676041 ], "wc_weaknesses_avg": [ 121.33333333333333, 74.00150148626865 ], "wc_questions_avg": [ 86.0, 50.04664490919113 ], "wc_review_avg": [ 346.0, 125.79613136605857 ], "wc_reply_reviewers_avg": [ 25.666666666666668, 36.29814810090944 ], "wc_reply_authors_avg": [ 1778.6666666666667, 563.910355365894 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 4.0, 0.816496580927726 ], "replies_avg": [ 22, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.9999999999999997, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:JmCxTlZUXiUJ:scholar.google.com/&scioq=Enhancing+Instance-Level+Image+Classification+with+Set-Level+Labels&hl=en&as_sdt=0,33", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=AZW3qlCGTe", "pdf": "https://openreview.net/pdf?id=AZW3qlCGTe", "email": "cs.uchicago.edu;ttic.edu;uchicago.edu;uchicago.edu", "author_num": 4, "aff_unique_index": "0;1;0;0", "aff_unique_norm": "University of Chicago;Toyota Technological Institute at Chicago", "aff_unique_dep": "Department of Computer Science;", "aff_unique_url": "https://www.uchicago.edu;https://www.tti-chicago.org", "aff_unique_abbr": "UChicago;TTI Chicago", "aff_campus_unique_index": "1", "aff_campus_unique": ";Chicago", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "id": "Aarj9MrG8Y", "title": "Towards the Universal Learning Principle for Graph Neural Networks", "track": "main", "status": "Reject", "tldr": "", "abstract": "Graph neural networks (GNNs) are currently highly regarded in graph representation learning tasks due to their significant performance. Although various propagation mechanisms and graph filters were proposed, few works have considered the convergence and stability of graph filters under infinite-depth scenarios. To address this problem, we elucidate the criterion for the graph filter formed by power series and further establish a scalable regularized learning principle, which can guide us on how to design infinite deep GNN. Following the framework, we develop Adaptive Power GNN (APGNN), a deep GNN that employs exponentially decaying weights to aggregate graph information of different orders so as to mine the deeper neighbor information. Different from existing GNNs, APGNN can be seamlessly extended to an infinite-depth network. Moreover, we analyze the generalization of the proposed learning framework via uniform convergence and present its upper bound in theory. 
Experimental results show that APGNN obtains superior performance against the state-of-the-art GNNs.", "keywords": "Graph Neural Network;Graph Filter;Learning Principle", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/024f072f7b6145a4bf4484f38b3e1a1ec9dac4aa.zip", "author": "Foping Chen;Junhong Zhang;Guangfei Liang;Richard Yi Da Xu;Zhihui Lai", "authorids": "~Foping_Chen1;~Junhong_Zhang1;~Guangfei_Liang1;~Richard_Yi_Da_Xu1;~Zhihui_Lai1", "gender": "M;M;M;M;M", "homepage": ";;;https://www.math.hkbu.edu.hk/people/xu-yi-da/;https://www.scholat.com/laizhihui.cn", "dblp": "https://dblp.org/;;368/5290;38/3064;61/7577-1", "google_scholar": ";ribcEAIAAAAJ;0Tz_-WQAAAAJ;ykOUWa4AAAAJ;CkK6ULsAAAAJ", "orcid": ";;0000-0002-5515-7414;0000-0003-2080-4762;0000-0002-4388-3080", "linkedin": ";;;richard-xu-0221a943/;", "or_profile": "~Foping_Chen1;~Junhong_Zhang1;~Guangfei_Liang1;~Richard_Yi_Da_Xu1;~Zhihui_Lai1", "aff": "Shenzhen University;Shenzhen University;Shenzhen University;Hong Kong Baptist University;Shenzhen University", "aff_domain": "szu.edu.cn;szu.edu.cn;szu.edu.cn;hkbu.edu.hk;szu.edu.cn", "position": "MS student;PhD student;MS student;Full Professor;Full Professor", "bibtex": "@misc{\nchen2024towards,\ntitle={Towards the Universal Learning Principle for Graph Neural Networks},\nauthor={Foping Chen and Junhong Zhang and Guangfei Liang and Richard Yi Da Xu and Zhihui Lai},\nyear={2024},\nurl={https://openreview.net/forum?id=Aarj9MrG8Y}\n}", "github": "", "project": "", "reviewers": "W4db;2jyF;X3Vf", "site": "https://openreview.net/forum?id=Aarj9MrG8Y", "pdf_size": 678064, "rating": "3;3;3", "confidence": "3;3;4", "soundness": "2;3;3", "contribution": "1;2;2", "presentation": "1;3;3", "wc_summary": "75;94;32", "wc_strengths": "44;51;53", "wc_weaknesses": "177;175;362", "wc_questions": "102;110;5", "wc_review": "398;430;452", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 3.0, 0.0 ], "confidence_avg": [ 3.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 1.6666666666666667, 0.4714045207910317 ], "presentation_avg": [ 2.3333333333333335, 0.9428090415820634 ], "wc_summary_avg": [ 67.0, 25.93581821856921 ], "wc_strengths_avg": [ 49.333333333333336, 3.8586123009300755 ], "wc_weaknesses_avg": [ 238.0, 87.68504243408147 ], "wc_questions_avg": [ 72.33333333333333, 47.72374205314956 ], "wc_review_avg": [ 426.6666666666667, 22.17105219775452 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:VevL8YYxxNoJ:scholar.google.com/&scioq=Towards+the+Universal+Learning+Principle+for+Graph+Neural+Networks&hl=en&as_sdt=0,33", "gs_version_total": 2, "aff_unique_index": "0;0;0;1;0", "aff_unique_norm": "Shenzhen University;Hong Kong Baptist University", "aff_unique_dep": ";", "aff_unique_url": "https://www.szu.edu.cn;https://www.hkbu.edu.hk", "aff_unique_abbr": "SZU;HKBU", "aff_campus_unique_index": "1", "aff_campus_unique": ";Hong Kong SAR", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "China" }, { "title": "Implicit regularization of deep residual networks towards neural ODEs", "status": "Spotlight", 
"track": "main", "site": "https://iclr.cc/virtual/2024/poster/19253", "id": "AbXGwqb5Ht", "author_site": "Pierre Marion, Yu-Han Wu, Michael Sander, G\u00e9rard Biau", "tldr": "", "abstract": "Residual neural networks are state-of-the-art deep learning models. Their continuous-depth analog, neural ordinary differential equations (ODEs), are also widely used. Despite their success, the link between the discrete and continuous models still lacks a solid mathematical foundation. In this article, we take a step in this direction by establishing an implicit regularization of deep residual networks towards neural ODEs, for nonlinear networks trained with gradient flow. We prove that if the network is initialized as a discretization of a neural ODE, then such a discretization holds throughout training. Our results are valid for a finite training time, and also as the training time tends to infinity provided that the network satisfies a Polyak-\u0141ojasiewicz condition. Importantly, this condition holds for a family of residual networks where the residuals are two-layer perceptrons with an overparameterization in width that is only linear, and implies the convergence of gradient flow to a global minimum. Numerical experiments illustrate our results.", "keywords": "deep learning theory;residual networks;neural ODEs;optimization;implicit regularization;gradient flow", "primary_area": "learning theory", "supplementary_material": "/attachment/3420e969258ff49b5456cd02f8a157685dcbeb41.zip", "author": "Pierre Marion;Yu-Han Wu;Michael Eli Sander;G\u00e9rard Biau", "authorids": "~Pierre_Marion1;~Yu-Han_Wu1;~Michael_Eli_Sander1;~G\u00e9rard_Biau1", "gender": "M;M;M;M", "homepage": "https://pierremarion23.github.io/;https://github.com/pojoowu;https://michaelsdr.github.io/;https://perso.lpsm.paris/~biau", "dblp": "250/2318;;285/5131;", "google_scholar": "https://scholar.google.fr/citations?user=Q8H5LgIAAAAJ;;COqAqcMAAAAJ;WiW_7VkAAAAJ", "orcid": ";;;", "linkedin": "pierre-marion-816474130/;yu-han-wu-716a9715b/;;", "or_profile": "~Pierre_Marion1;~Yu-Han_Wu1;~Michael_Eli_Sander1;~G\u00e9rard_Biau1", "aff": "EPFL - EPF Lausanne;Ecole Normale Superieure Paris;Ecole Normale Sup\u00e9rieure de Paris;Sorbonne University", "aff_domain": "epfl.ch;ens.psl.eu;ens.fr;sorbonne-universite.fr", "position": "Postdoc;MS student;PhD student;Full Professor", "bibtex": "@inproceedings{\nmarion2024implicit,\ntitle={Implicit regularization of deep residual networks towards neural {ODE}s},\nauthor={Pierre Marion and Yu-Han Wu and Michael Eli Sander and G{\\'e}rard Biau},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=AbXGwqb5Ht}\n}", "github": "", "project": "", "reviewers": "Hmrt;NuSB;Htsq;6832", "pdf_size": 2284080, "rating": "6;6;8;8", "confidence": "2;2;4;4", "soundness": "3;3;4;4", "contribution": "3;3;4;3", "presentation": "3;3;4;4", "wc_summary": "67;67;28;155", "wc_strengths": "26;90;158;142", "wc_weaknesses": "23;94;27;54", "wc_questions": "1;17;212;43", "wc_review": "117;268;425;394", "wc_reply_reviewers": "0;0;33;0", "wc_reply_authors": "39;602;562;409", "reply_reviewers": "0;0;1;0", "reply_authors": "1;1;1;2", "rating_avg": [ 7.0, 1.0 ], "confidence_avg": [ 3.0, 1.0 ], "soundness_avg": [ 3.5, 0.5 ], "contribution_avg": [ 3.25, 0.4330127018922193 ], "presentation_avg": [ 3.5, 0.5 ], "wc_summary_avg": [ 79.25, 46.54231945230061 ], "wc_strengths_avg": [ 104.0, 51.57518783291051 ], "wc_weaknesses_avg": [ 49.5, 28.324018076537094 ], 
"wc_questions_avg": [ 68.25, 84.3367505895265 ], "wc_review_avg": [ 301.0, 121.41869707750945 ], "wc_reply_reviewers_avg": [ 8.25, 14.289419162443238 ], "wc_reply_authors_avg": [ 403.0, 222.15647638545224 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 1.0, "gs_citation": 20, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=2815881658153338920&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 7, "openreview": "https://openreview.net/forum?id=AbXGwqb5Ht", "pdf": "https://openreview.net/pdf?id=AbXGwqb5Ht", "email": "epfl.ch;ens.psl.eu;ens.fr;sorbonne-universite.fr", "author_num": 4, "aff_unique_index": "0;1;2;3", "aff_unique_norm": "EPFL;Ecole Normale Superieure;Ecole Normale Sup\u00e9rieure de Paris;Sorbonne University", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.epfl.ch;https://www.ens.fr;https://www.ens.fr;https://www.sorbonne.universite.fr", "aff_unique_abbr": "EPFL;ENS;ENS Paris;Sorbonne", "aff_campus_unique_index": "0;1;1", "aff_campus_unique": "Lausanne;Paris;", "aff_country_unique_index": "0;1;1;1", "aff_country_unique": "Switzerland;France" }, { "title": "Forward Learning of Graph Neural Networks", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19252", "id": "Abr7dU98ME", "author_site": "Namyong Park, Xing Wang, Antoine Simoulin, Shuai Yang, Grey Yang, Ryan Rossi, Puja Trivedi, Nesreen Ahmed", "tldr": "", "abstract": "Graph neural networks (GNNs) have achieved remarkable success across a wide range of applications, such as recommendation, drug discovery, and question answering. Behind the success of GNNs lies the backpropagation (BP) algorithm, which is the de facto standard for training deep neural networks (NNs). However, despite its effectiveness, BP imposes several constraints, which are not only biologically implausible, but also limit the scalability, parallelism, and flexibility in learning NNs. Examples of such constraints include storage of neural activities computed in the forward pass for use in the subsequent backward pass, and the dependence of parameter updates on non-local signals. To address these limitations, the forward-forward algorithm (FF) was recently proposed as an alternative to BP in the image classification domain, which trains NNs by performing two forward passes over positive and negative data. Inspired by this advance, we propose ForwardGNN in this work, a new forward learning procedure for GNNs, which avoids the constraints imposed by BP via an effective layer-wise local forward training. ForwardGNN extends the original FF to deal with graph data and GNNs, and makes it possible to operate without generating negative inputs (hence no longer forward-forward). Further, ForwardGNN enables each layer to learn from both the bottom-up and top-down signals without relying on the backpropagation of errors. Extensive experiments on real-world datasets show the effectiveness and generality of the proposed forward graph learning framework. We release our code at https://github.com/facebookresearch/forwardgnn.", "keywords": "graph neural networks;forward learning;forward-forward algorithm", "primary_area": "learning on graphs and other geometries & topologies", "supplementary_material": "", "author": "Namyong Park;Xing Wang;Antoine Simoulin;Shuai Yang;Grey Yang;Ryan A. Rossi;Puja Trivedi;Nesreen K. 
Ahmed", "authorids": "~Namyong_Park1;~Xing_Wang8;~Antoine_Simoulin1;~Shuai_Yang9;~Grey_Yang1;~Ryan_A._Rossi2;~Puja_Trivedi1;~Nesreen_K._Ahmed2", "gender": ";M;M;;M;F;F;M", "homepage": "https://namyongpark.github.io/;https://scholar.google.com/citations?user=_nDiQQ0AAAAJ&hl=en;http://www.llf.cnrs.fr/fr/Gens/Simoulin;;;https://pujacomputes.github.io/;http://nesreenahmed.com;http://ryanrossi.com", "dblp": "116/9404;;211/7662;72/7503;;274/2080;33/11518;17/5085", "google_scholar": "YBTXGb8AAAAJ;;https://scholar.google.fr/citations?hl=en;ef7yzckAAAAJ;B11lRXUAAAAJ;1y9cR50AAAAJ;AFV0nLcAAAAJ;_Dc6lbQAAAAJ", "orcid": ";;0000-0001-8433-7919;;;0000-0003-1874-8992;;0000-0001-9758-0635", "linkedin": ";;antoine-simoulin;;;;nkahmed/;", "or_profile": "~Namyong_Park1;~Xing_Wang8;~Antoine_Simoulin1;~Shuai_Yang9;~Grey_Yang1;~Puja_Trivedi1;~Nesreen_Ahmed1;~Ryan_Rossi1", "aff": "Meta AI;;Meta AI;Meta;Meta Platforms, Inc;University of Michigan;Intel AI Research;Adobe Research", "aff_domain": "meta.com;;meta.com;meta.com;meta.com;umich.edu;intel.com;adobe.com", "position": "Researcher;;Researcher;Researcher;Researcher;PhD student;Principal Researcher;Senior Research Scientist", "bibtex": "@inproceedings{\npark2024forward,\ntitle={Forward Learning of Graph Neural Networks},\nauthor={Namyong Park and Xing Wang and Antoine Simoulin and Shuai Yang and Grey Yang and Ryan A. Rossi and Puja Trivedi and Nesreen K. Ahmed},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=Abr7dU98ME}\n}", "github": "", "project": "", "reviewers": "TBYv;BuBQ;ztUM;yhLp", "pdf_size": 792820, "rating": "6;6;6;8", "confidence": "3;4;2;4", "soundness": "4;3;3;3", "contribution": "3;2;3;3", "presentation": "2;2;3;3", "wc_summary": "118;91;120;74", "wc_strengths": "61;58;45;37", "wc_weaknesses": "85;426;79;12", "wc_questions": "280;190;15;168", "wc_review": "544;765;259;291", "wc_reply_reviewers": "0;0;0;9", "wc_reply_authors": "1685;1346;730;868", "reply_reviewers": "0;0;0;1", "reply_authors": "3;2;1;2", "rating_avg": [ 6.5, 0.8660254037844386 ], "confidence_avg": [ 3.25, 0.82915619758885 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 100.75, 19.22725929507375 ], "wc_strengths_avg": [ 50.25, 9.730750228014282 ], "wc_weaknesses_avg": [ 150.5, 161.62069793191714 ], "wc_questions_avg": [ 163.25, 95.32411814436051 ], "wc_review_avg": [ 464.75, 205.51931174466307 ], "wc_reply_reviewers_avg": [ 2.25, 3.897114317029974 ], "wc_reply_authors_avg": [ 1157.25, 380.9050898846063 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 2.0, 0.7071067811865476 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": 0.5222329678670935, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=16316806855315001275&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=Abr7dU98ME", "pdf": "https://openreview.net/pdf?id=Abr7dU98ME", "email": "meta.com;;meta.com;meta.com;meta.com;umich.edu;intel.com;adobe.com", "author_num": 8, "aff_unique_index": "0;0;0;0;1;2;3", "aff_unique_norm": "Meta;University of Michigan;Intel;Adobe", "aff_unique_dep": "Meta AI;;Intel AI Research;Adobe Research", "aff_unique_url": "https://meta.com;https://www.umich.edu;https://www.intel.com/research;https://research.adobe.com", "aff_unique_abbr": "Meta;UM;Intel AI;Adobe", 
"aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "Abt6oSKkb4", "title": "Model2Scene: Learning 3D Scene Representation via Contrastive Language-CAD Models Pre-training", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Current successful methods of 3D scene perception rely on the large-scale annotated point cloud, which is tedious and expensive to acquire. In this paper, we propose Model2Scene, a novel paradigm that learns free 3D scene representation from Computer-Aided Design (CAD) models and languages. The main challenges are the domain gaps between the CAD models and the real scene's objects, including model-to-scene (from a single model to the scene) and synthetic-to-real (from synthetic model to real scene's object). To handle the above challenges, Model2Scene first simulates a crowded scene by mixing data-augmented CAD models. Next, we propose a novel feature regularization operation, termed Deep Convex-hull Regularization (DCR), to project point features into a unified convex hull space, reducing the domain gap. Ultimately, we impose contrastive loss on language embedding and the point features of CAD models to pre-train the 3D network. Extensive experiments verify the learned 3D scene representation is beneficial for various downstream tasks, including label-free 3D object salient detection, label-efficient 3D scene perception and zero-shot 3D semantic segmentation. Notably, Model2Scene yields impressive label-free 3D object salient detection with an average mAP of 46.08\\% and 55.49\\% on the ScanNet and S3DIS datasets, respectively. The code will be publicly available.", "keywords": "3D representation learning;segmentation", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/c4871e35d8266ca3a10d5e3e5e3f9ca02bb243c0.zip", "author": "Runnan Chen;Xinge ZHU;Nenglun Chen;Dawei Wang;Wei Li;Yuexin Ma;Ruigang Yang;Tongliang Liu;Wenping Wang", "authorids": "~Runnan_Chen1;~Xinge_ZHU2;~Nenglun_Chen1;~Dawei_Wang3;~Wei_Li28;~Yuexin_Ma2;~Ruigang_Yang1;~Tongliang_Liu1;~Wenping_Wang1", "gender": "M;M;M;M;F;M;M;M;M", "homepage": "https://scholar.google.com.hk/citations?hl=en&user=Uq2DuzkAAAAJ&view_op=list_works&sortby=pubdate;https://scholar.google.com/citations?user=UhjTC7AAAAAJ;https://dawei.site;;http://yuexinma.me/aboutme.html;https://www.engr.uky.edu/directory/yang-ruigang;https://tongliang-liu.github.io/;https://engineering.tamu.edu/cse/profiles/Wang-Wenping.html;https://xingezhu.me/aboutme.html", "dblp": "232/1849;230/7699.html;39/2537-6;64/6025-111;209/5925;08/5690;150/6667;;204/3002", "google_scholar": "https://scholar.google.com.hk/citations?hl=en;UhjTC7AAAAAJ;DsmzUgsAAAAJ;i8jP6q8AAAAJ;;https://scholar.google.com.tw/citations?user=yveq40QAAAAJ;https://scholar.google.com.au/citations?user=EiLdZ_YAAAAJ;28shvv0AAAAJ;https://scholar.google.com.hk/citations?user=yHAcRooAAAAJ", "orcid": ";;0000-0003-2440-220X;0000-0002-0059-3745;;;;0000-0002-2284-3952;", "linkedin": ";;;;;;;;", "or_profile": "~Runnan_Chen1;~Nenglun_Chen1;~Dawei_Wang3;~Wei_Li28;~Yuexin_Ma2;~Ruigang_Yang1;~Tongliang_Liu1;~Wenping_Wang1;~Xinge_Zhu3", "aff": "the University of Hong Kong, University of Hong Kong;Nanjing University of Information Science and Technology;University of Hong Kong;Inceptio;ShanghaiTech University;Inceptio ;Mohamed bin Zayed University of Artificial Intelligence;Texas A&M University - College 
Station;The Chinese University of Hong Kong", "aff_domain": "cs.hku.hk;nuist.edu.cn;hku.hk;inceptio.ai;shanghaitech.edu.cn;inceptio.ai;mbzuai.ac.ae;tamu.edu;cuhk.edu.hk", "position": "Postdoc;Lecturer;Postdoc;Researcher;Assistant Professor;Instructor;Affiliated Associate Professor;Full Professor;PhD student", "bibtex": "@misc{\nchen2024modelscene,\ntitle={Model2Scene: Learning 3D Scene Representation via Contrastive Language-{CAD} Models Pre-training},\nauthor={Runnan Chen and Xinge ZHU and Nenglun Chen and Dawei Wang and Wei Li and Yuexin Ma and Ruigang Yang and Tongliang Liu and Wenping Wang},\nyear={2024},\nurl={https://openreview.net/forum?id=Abt6oSKkb4}\n}", "github": "", "project": "", "reviewers": "xgfx;gV7n;yhuq;U8AX", "site": "https://openreview.net/forum?id=Abt6oSKkb4", "pdf_size": 4517451, "rating": "3;3;5;6", "confidence": "4;3;3;3", "soundness": "2;2;2;3", "contribution": "1;2;2;3", "presentation": "1;2;2;2", "wc_summary": "357;47;77;57", "wc_strengths": "22;25;23;53", "wc_weaknesses": "445;111;95;169", "wc_questions": "233;78;2;53", "wc_review": "1057;261;197;332", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.25, 1.299038105676658 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 1.75, 0.4330127018922193 ], "wc_summary_avg": [ 134.5, 128.91373084353737 ], "wc_strengths_avg": [ 30.75, 12.891373084353738 ], "wc_weaknesses_avg": [ 205.0, 141.27278577277366 ], "wc_questions_avg": [ 91.5, 86.16408764676848 ], "wc_review_avg": [ 461.75, 346.96928898679204 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 9, 0 ], "corr_rating_confidence": -0.5555555555555555, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=16656736670335244446&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "aff_unique_index": "0;1;0;2;3;2;4;5;6", "aff_unique_norm": "University of Hong Kong;Nanjing University of Information Science and Technology;Inceptio;ShanghaiTech University;Mohamed bin Zayed University of Artificial Intelligence;Texas A&M University;Chinese University of Hong Kong", "aff_unique_dep": ";;;;;;", "aff_unique_url": "https://www.hku.hk;http://www.nuist.edu.cn;;https://www.shanghaitech.edu.cn;https://mbzuai.ac.ae;https://www.tamu.edu;https://www.cuhk.edu.hk", "aff_unique_abbr": "HKU;;;ShanghaiTech;MBZUAI;TAMU;CUHK", "aff_campus_unique_index": "0;0;2;0", "aff_campus_unique": "Hong Kong SAR;;College Station", "aff_country_unique_index": "0;0;0;0;2;3;0", "aff_country_unique": "China;;United Arab Emirates;United States" }, { "id": "Ac7f7xL4bU", "title": "Universal Clustering Bounds", "track": "main", "status": "Reject", "tldr": "", "abstract": "This paper seamlessly integrates several fundamental learning tasks under the umbrella of subspace clustering, namely orthogonal nonnegative matrix factorization, and K-means clustering. Within this framework, we unveil a unified, closed-form solution that elegantly addresses these tasks. Our main theoretical contribution establishes that our deterministic solution achieves perfect accuracy when the data exhibits sufficiently well-defined clusters. 
Furthermore, the immediate relaxation of our solution yields practical algorithms that not only rival but also surpass the current state-of-the-art in these complex problem domains. This achievement is corroborated by a comprehensive array of experiments conducted on synthetic datasets, as well as on a diverse set of five real-world datasets.", "keywords": "nonnegative matrix factorization;orthogonal;subspace;k-means;clustering", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/44e8c82e13d461285eac62500ab46c6906917dc6.zip", "author": "Daniel L. Pimentel-Alarc\u00f3n", "authorids": "~Daniel_L._Pimentel-Alarc\u00f3n1", "gender": "", "homepage": "https://danielpimentel.github.io/", "dblp": "150/6256", "google_scholar": "", "orcid": "", "linkedin": "", "or_profile": "~Daniel_L._Pimentel-Alarc\u00f3n1", "aff": "University of Wisconsin, Madison", "aff_domain": "wisc.edu", "position": "Assistant Professor", "bibtex": "@misc{\npimentel-alarc{\\'o}n2024universal,\ntitle={Universal Clustering Bounds},\nauthor={Daniel L. Pimentel-Alarc{\\'o}n},\nyear={2024},\nurl={https://openreview.net/forum?id=Ac7f7xL4bU}\n}", "github": "", "project": "", "reviewers": "B34v;Eiut;Wvoi;qhZS", "site": "https://openreview.net/forum?id=Ac7f7xL4bU", "pdf_size": 1217525, "rating": "3;3;3;5", "confidence": "3;4;4;4", "soundness": "2;3;2;3", "contribution": "2;1;1;2", "presentation": "2;1;3;2", "wc_summary": "98;99;84;116", "wc_strengths": "19;6;113;70", "wc_weaknesses": "231;172;736;150", "wc_questions": "47;10;41;186", "wc_review": "395;287;974;522", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 3.5, 0.8660254037844386 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 1.5, 0.5 ], "presentation_avg": [ 2.0, 0.7071067811865476 ], "wc_summary_avg": [ 99.25, 11.344051304538427 ], "wc_strengths_avg": [ 52.0, 42.573465914816005 ], "wc_weaknesses_avg": [ 322.25, 240.70768060034976 ], "wc_questions_avg": [ 71.0, 67.8638342565464 ], "wc_review_avg": [ 544.5, 261.54970846858157 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 6, 0 ], "authors#_avg": [ 1, 0 ], "corr_rating_confidence": 0.3333333333333333, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:NVg3jXFFhTQJ:scholar.google.com/&scioq=Universal+Clustering+Bounds&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0", "aff_unique_norm": "University of Wisconsin", "aff_unique_dep": "", "aff_unique_url": "https://www.wisc.edu", "aff_unique_abbr": "UW", "aff_campus_unique_index": "0", "aff_campus_unique": "Madison", "aff_country_unique_index": "0", "aff_country_unique": "United States" }, { "id": "AcGUW5655J", "title": "Constraining Non-Negative Matrix Factorization to Improve Signature Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "Collaborative filtering approaches are fundamental for learning meaningful low-dimensional representations when only association data is available. Among these methods, Non-negative Matrix Factorization (NMF) has gained prominence due to its capability to yield interpretable and meaningful low-dimensional representations. 
However, one significant challenge for NMF is the vast number of solutions for the same problem instance, making the selection of high-quality signatures a complex task. In response to this challenge, our work introduces a novel approach, Self-Matrix Factorization (SMF), which leverages NMF by incorporating constraints that preserve the relationships inherent in the original data. This is achieved by drawing inspiration from a distinct family of matrix decomposition methods, known as Self-Expressive Models (SEM).\nIn our experimental analyses, conducted on two diverse benchmark datasets, our findings present a compelling narrative. SMF consistently delivers competitive or even superior performance when compared to NMF in predictive tasks. However, what truly sets SMF apart, as validated by our empirical results, is its remarkable ability to consistently generate significantly more meaningful object representations.", "keywords": "Representation Learning;Colaborative Filtering (CF);Recommender Systems;Link Prediction", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/de9467f65ce858889ef8f7d3c372978f31a907e9.zip", "author": "Aldo Galeano;Suzana Santos;Ruben Jimenez;Alberto Paccanaro", "authorids": "~Aldo_Galeano1;suzana.santos@fgv.br;ruben.franco@fgv.br;~Alberto_Paccanaro1", "gender": "M;;;M", "homepage": ";;;https://paccanarolab.org/", "dblp": ";;;94/3076", "google_scholar": ";;;https://scholar.google.com/citations?hl=en", "orcid": ";;;0000-0001-8059-1346", "linkedin": "aldogaleanoalfonso18;;;", "or_profile": "~Aldo_Galeano1;suzana.santos@fgv.br;ruben.franco@fgv.br;~Alberto_Paccanaro1", "aff": "Funda\u00e7\u00e3o Getulio Vargas;;;Royal Holloway, University of London", "aff_domain": "fgv.br;;;rhul.ac.uk", "position": "PhD student;;;Full Professor", "bibtex": "@misc{\ngaleano2024constraining,\ntitle={Constraining Non-Negative Matrix Factorization to Improve Signature Learning},\nauthor={Aldo Galeano and Suzana Santos and Ruben Jimenez and Alberto Paccanaro},\nyear={2024},\nurl={https://openreview.net/forum?id=AcGUW5655J}\n}", "github": "", "project": "", "reviewers": "G6Gq;oagP;NTRu", "site": "https://openreview.net/forum?id=AcGUW5655J", "pdf_size": 856512, "rating": "3;3;6", "confidence": "5;4;3", "soundness": "2;2;2", "contribution": "2;1;2", "presentation": "2;3;2", "wc_summary": "38;30;105", "wc_strengths": "5;14;55", "wc_weaknesses": "97;134;30", "wc_questions": "4;9;61", "wc_review": "144;187;251", "wc_reply_reviewers": "0;0;12", "wc_reply_authors": "485;825;750", "reply_reviewers": "0;0;1", "reply_authors": "1;2;2", "rating_avg": [ 4.0, 1.4142135623730951 ], "confidence_avg": [ 4.0, 0.816496580927726 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 1.6666666666666667, 0.4714045207910317 ], "presentation_avg": [ 2.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 57.666666666666664, 33.62869145371091 ], "wc_strengths_avg": [ 24.666666666666668, 21.761331658599286 ], "wc_weaknesses_avg": [ 87.0, 43.04261454264444 ], "wc_questions_avg": [ 24.666666666666668, 25.772509040103607 ], "wc_review_avg": [ 194.0, 43.96210489349511 ], "wc_reply_reviewers_avg": [ 4.0, 5.656854249492381 ], "wc_reply_authors_avg": [ 686.6666666666666, 145.84999904772786 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 1.6666666666666667, 0.4714045207910317 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.8660254037844387, 
"gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:HiH0204EvqEJ:scholar.google.com/&scioq=Constraining+Non-Negative+Matrix+Factorization+to+Improve+Signature+Learning&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;1", "aff_unique_norm": "Funda\u00e7\u00e3o Getulio Vargas;University of London", "aff_unique_dep": ";", "aff_unique_url": "https://www.fgv.br;https://www.royalholloway.ac.uk", "aff_unique_abbr": "FGV;RHUL", "aff_campus_unique_index": "1", "aff_campus_unique": ";Royal Holloway", "aff_country_unique_index": "0;1", "aff_country_unique": "Brazil;United Kingdom" }, { "title": "Rethinking Model Ensemble in Transfer-based Adversarial Attacks", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19251", "id": "AcJrSoArlh", "author_site": "Huanran Chen, Yichi Zhang, Yinpeng Dong, Xiao Yang, Hang Su, Jun Zhu", "tldr": "", "abstract": "It is widely recognized that deep learning models lack robustness to adversarial examples. An intriguing property of adversarial examples is that they can transfer across different models, which enables black-box attacks without any knowledge of the victim model. An effective strategy to improve the transferability is attacking an ensemble of models. However, previous works simply average the outputs of different models, lacking an in-depth analysis on how and why model ensemble methods can strongly improve the transferability. In this paper, we rethink the ensemble in adversarial attacks and define the common weakness of model ensemble with two properties: 1) the flatness of loss landscape; and 2) the closeness to the local optimum of each model. We empirically and theoretically show that both properties are strongly correlated with the transferability and propose a Common Weakness Attack (CWA) to generate more transferable adversarial examples by promoting these two properties. Experimental results on both image classification and object detection tasks validate the effectiveness of our approach to improving the adversarial transferability, especially when attacking adversarially trained models. We also successfully apply our method to attack a black-box large vision-language model -- Google's Bard, showing the practical effectiveness. 
Code is available at \\url{https://github.com/huanranchen/AdversarialAttacks}.", "keywords": "Adversarial attack;transferability;ensemble attack;robustness", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "Huanran Chen;Yichi Zhang;Yinpeng Dong;Xiao Yang;Hang Su;Jun Zhu", "authorids": "~Huanran_Chen1;~Yichi_Zhang4;~Yinpeng_Dong2;~Xiao_Yang4;~Hang_Su3;~Jun_Zhu2", "gender": "M;M;M;M;M;M", "homepage": "https://huanranchen.github.io/;https://zycheiheihei.github.io;https://dongyp13.github.io;https://ml.cs.tsinghua.edu.cn/~xiaoyang/;http://ml.cs.tsinghua.edu.cn/~jun;", "dblp": "329/6558;;183/0980;57/33851;50/2644-1;26/5371-6", "google_scholar": "https://scholar.google.co.jp/citations?user=QYsKXccAAAAJ;HzgDakoAAAAJ;6_4ad84AAAAJ;bwkwp0MAAAAJ;axsP38wAAAAJ;dxN1_X0AAAAJ", "orcid": ";0000-0002-1894-3977;;0000-0001-9502-9962;;", "linkedin": ";;;;;", "or_profile": "~Huanran_Chen1;~Yichi_Zhang4;~Yinpeng_Dong2;~Xiao_Yang4;~Jun_Zhu2;~Hang_Su2", "aff": ";Tsinghua University;Tsinghua University;Tsinghua University;Tsinghua University;Tsinghua University", "aff_domain": ";tsinghua.edu.cn;tsinghua.edu.cn;mail.tsinghua.edu.cn;mail.tsinghua.edu.cn;tsinghua.edu.cn", "position": ";PhD student;Postdoc;Postdoc;Professor;Associate Professor", "bibtex": "@inproceedings{\nchen2024rethinking,\ntitle={Rethinking Model Ensemble in Transfer-based Adversarial Attacks},\nauthor={Huanran Chen and Yichi Zhang and Yinpeng Dong and Xiao Yang and Hang Su and Jun Zhu},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=AcJrSoArlh}\n}", "github": "", "project": "", "reviewers": "GTKq;JLTP;9Y8Q;s2Ct", "pdf_size": 2167419, "rating": "6;6;8;8", "confidence": "4;3;3;2", "soundness": "3;3;4;3", "contribution": "3;3;3;3", "presentation": "3;2;3;4", "wc_summary": "62;120;61;53", "wc_strengths": "42;84;74;42", "wc_weaknesses": "76;149;87;78", "wc_questions": "24;178;4;50", "wc_review": "204;531;226;223", "wc_reply_reviewers": "67;0;39;12", "wc_reply_authors": "1286;799;361;653", "reply_reviewers": "3;0;1;1", "reply_authors": "5;2;2;2", "rating_avg": [ 7.0, 1.0 ], "confidence_avg": [ 3.0, 0.7071067811865476 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 74.0, 26.78619047195775 ], "wc_strengths_avg": [ 60.5, 18.83480820183736 ], "wc_weaknesses_avg": [ 97.5, 30.02082610455615 ], "wc_questions_avg": [ 64.0, 67.80855403265875 ], "wc_review_avg": [ 296.0, 135.93932470039712 ], "wc_reply_reviewers_avg": [ 29.5, 25.85053190942113 ], "wc_reply_authors_avg": [ 774.75, 334.65532641809244 ], "reply_reviewers_avg": [ 1.25, 1.0897247358851685 ], "reply_authors_avg": [ 2.75, 1.299038105676658 ], "replies_avg": [ 22, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.7071067811865475, "gs_citation": 58, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=9671466880746340903&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=AcJrSoArlh", "pdf": "https://openreview.net/pdf?id=AcJrSoArlh", "email": ";tsinghua.edu.cn;tsinghua.edu.cn;mail.tsinghua.edu.cn;mail.tsinghua.edu.cn;tsinghua.edu.cn", "author_num": 6, "aff_unique_index": "0;0;0;0;0", "aff_unique_norm": "Tsinghua University", "aff_unique_dep": "", "aff_unique_url": "https://www.tsinghua.edu.cn", "aff_unique_abbr": "THU", "aff_campus_unique_index": "", "aff_campus_unique": "", 
"aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "China" }, { "title": "Out-of-Distribution Detection by Leveraging Between-Layer Transformation Smoothness", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19250", "id": "AcRfzLS6se", "author_site": "Fran Jeleni\u0107, Josip Juki\u0107, Martin Tutek, Mate Puljiz, Jan Snajder", "tldr": "", "abstract": "Effective out-of-distribution (OOD) detection is crucial for reliable machine learning models, yet most current methods are limited in practical use due to requirements like access to training data or intervention in training. We present a novel method for detecting OOD data in Transformers based on transformation smoothness between intermediate layers of a network (BLOOD), which is applicable to pre-trained models without access to training data. BLOOD utilizes the tendency of between-layer representation transformations of in-distribution (ID) data to be smoother than the corresponding transformations of OOD data, a property that we also demonstrate empirically. We evaluate BLOOD on several text classification tasks with Transformer networks and demonstrate that it outperforms methods with comparable resource requirements. Our analysis also suggests that when learning simpler tasks, OOD data transformations maintain their original sharpness, whereas sharpness increases with more complex tasks.", "keywords": "out-of-distribution detection;deep neural networks;transformers;representation analysis;uncertainty quantification;text classification", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/9c4c6570df8fcd5ab6e2335f73d107f295739f7c.zip", "author": "Fran Jeleni\u0107;Josip Juki\u0107;Martin Tutek;Mate Puljiz;Jan Snajder", "authorids": "~Fran_Jeleni\u01071;~Josip_Juki\u01071;~Martin_Tutek1;~Mate_Puljiz1;~Jan_Snajder1", "gender": ";;M;M;M", "homepage": ";;;https://my-web-bbeba.firebaseapp.com/;http://www.zemris.fer.hr/~jan/", "dblp": "333/1019;333/0711;186/7079;198/6470.html;34/5404", "google_scholar": "6zH9ZZcAAAAJ;0NzyWBoAAAAJ;https://scholar.google.hr/citations?user=3MK-3e0AAAAJ;https://scholar.google.hr/citations?user=U5cL9tYAAAAJ;https://scholar.google.hr/citations?user=7h0lKgIAAAAJ", "orcid": ";;;0000-0003-0912-8345;", "linkedin": ";;mtutek/;;", "or_profile": "~Fran_Jeleni\u01071;~Josip_Juki\u01071;~Martin_Tutek1;~Mate_Puljiz1;~Jan_Snajder1", "aff": "University of Zagreb;Faculty of Electrical Engineering and Computing, University of Zagreb;Technion - Israel Institute of Technology, Technion;;UniZg-FER, University of Zagreb", "aff_domain": "fer.hr;fer.hr;technion.ac.il;;fer.unizg.hr", "position": "Researcher;PhD student;Postdoc;;Full Professor", "bibtex": "@inproceedings{\njeleni{\\'c}2024outofdistribution,\ntitle={Out-of-Distribution Detection by Leveraging Between-Layer Transformation Smoothness},\nauthor={Fran Jeleni{\\'c} and Josip Juki{\\'c} and Martin Tutek and Mate Puljiz and Jan Snajder},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=AcRfzLS6se}\n}", "github": "", "project": "", "reviewers": "Bnog;Txyj;ELpL;woCv", "pdf_size": 1559264, "rating": "5;5;6;6", "confidence": "4;3;2;4", "soundness": "2;3;3;2", "contribution": "2;3;3;3", "presentation": "3;3;3;3", "wc_summary": "42;79;93;66", "wc_strengths": "57;67;51;68", "wc_weaknesses": "131;111;158;79", "wc_questions": "34;14;19;109", "wc_review": "264;271;321;322", "wc_reply_reviewers": 
"0;0;59;0", "wc_reply_authors": "273;352;314;902", "reply_reviewers": "0;0;1;0", "reply_authors": "1;1;1;2", "rating_avg": [ 5.5, 0.5 ], "confidence_avg": [ 3.25, 0.82915619758885 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 70.0, 18.774983355518586 ], "wc_strengths_avg": [ 60.75, 7.084313657652377 ], "wc_weaknesses_avg": [ 119.75, 28.838992700855556 ], "wc_questions_avg": [ 44.0, 38.242646351945886 ], "wc_review_avg": [ 294.5, 27.115493725912497 ], "wc_reply_reviewers_avg": [ 14.75, 25.54774941164094 ], "wc_reply_authors_avg": [ 460.25, 256.5700440425577 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.30151134457776363, "gs_citation": 5, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=2061125423693659380&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=AcRfzLS6se", "pdf": "https://openreview.net/pdf?id=AcRfzLS6se", "email": "fer.hr;fer.hr;technion.ac.il;;fer.unizg.hr", "author_num": 5, "aff_unique_index": "0;0;1;0", "aff_unique_norm": "University of Zagreb;Technion - Israel Institute of Technology", "aff_unique_dep": ";", "aff_unique_url": "https://www.unizg.hr;https://www.technion.ac.il", "aff_unique_abbr": "UNIZG;Technion", "aff_campus_unique_index": "1", "aff_campus_unique": ";Zagreb", "aff_country_unique_index": "0;0;1;0", "aff_country_unique": "Croatia;Israel" }, { "title": "Distinguished In Uniform: Self-Attention Vs. Virtual Nodes", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19249", "id": "AcSChDWL6V", "author_site": "Eran Rosenbluth, Jan T\u00f6nshoff, Martin Ritzert, Berke Kisin, Martin Grohe", "tldr": "", "abstract": "Graph Transformers (GTs) such as SAN and GPS are graph processing models that combine Message-Passing GNNs (MPGNNs) with global Self-Attention. They were shown to be universal function approximators, with two reservations: 1. The initial node features must be augmented with certain positional encodings. 2. The approximation is non-uniform: Graphs of different sizes may require a different approximating network.\n\nWe first clarify that this form of universality is not unique to GTs: Using the same positional encodings, also pure MPGNNs and even 2-layer MLPs are non-uniform universal approximators. We then consider uniform expressivity: The target function is to be approximated by a single network for graphs of all sizes. There, we compare GTs to the more efficient MPGNN + Virtual Node architecture. The essential difference between the two model definitions is in their global computation method: Self-Attention Vs Virtual Node. We prove that none of the models is a uniform-universal approximator, before proving our main result: Neither model\u2019s uniform expressivity subsumes the other\u2019s. We demonstrate the theory with experiments on synthetic data. 
We further augment our study with real-world datasets, observing mixed results which indicate no clear ranking in practice as well.", "keywords": "Graph Neural Networks;Message Passing;Graph Transformers;Virtual Nodes;Expressivity;Uniform Expressivity", "primary_area": "learning theory", "supplementary_material": "/attachment/115096b1e19ffa39a7d9ee9fd3e4a1dac92a30a1.zip", "author": "Eran Rosenbluth;Jan T\u00f6nshoff;Martin Ritzert;Berke Kisin;Martin Grohe", "authorids": "~Eran_Rosenbluth1;~Jan_T\u00f6nshoff1;~Martin_Ritzert1;~Berke_Kisin1;~Martin_Grohe1", "gender": ";M;M;;M", "homepage": ";https://www.lics.rwth-aachen.de/;;;http://www.lics.rwth-aachen.de/~grohe", "dblp": ";;194/2447;;g/MGrohe", "google_scholar": ";;https://scholar.google.de/citations?user=ZNioUNgAAAAJ;xqVvCc4AAAAJ;https://scholar.google.com.tw/citations?user=Sou5ih0AAAAJ", "orcid": ";;0000-0002-5322-3684;;0000-0002-0292-9142", "linkedin": ";;martin-ritzert/;;", "or_profile": "~Eran_Rosenbluth1;~Jan_T\u00f6nshoff1;~Martin_Ritzert1;~Berke_Kisin1;~Martin_Grohe1", "aff": ";RWTH Aachen University;Georg-August Universit\u00e4t G\u00f6ttingen;Rheinisch Westf\u00e4lische Technische Hochschule Aachen;RWTH Aachen University", "aff_domain": ";rwth-aachen.de;uni-goettingen.de;rwth-aachen.de;rwth-aachen.de", "position": ";PhD student;Postdoc;MS student;Full Professor", "bibtex": "@inproceedings{\nrosenbluth2024distinguished,\ntitle={Distinguished In Uniform: Self-Attention Vs. Virtual Nodes},\nauthor={Eran Rosenbluth and Jan T{\\\"o}nshoff and Martin Ritzert and Berke Kisin and Martin Grohe},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=AcSChDWL6V}\n}", "github": "", "project": "", "reviewers": "MBi3;BMpU;Uru7;EnRw", "pdf_size": 445579, "rating": "6;6;6;8", "confidence": "2;3;3;4", "soundness": "3;2;3;3", "contribution": "3;3;3;3", "presentation": "4;2;3;3", "wc_summary": "178;241;92;157", "wc_strengths": "92;87;129;130", "wc_weaknesses": "79;300;274;63", "wc_questions": "106;1;50;4", "wc_review": "455;629;545;354", "wc_reply_reviewers": "11;192;0;0", "wc_reply_authors": "523;1267;276;342", "reply_reviewers": "1;1;0;0", "reply_authors": "2;2;1;1", "rating_avg": [ 6.5, 0.8660254037844386 ], "confidence_avg": [ 3.0, 0.7071067811865476 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 167.0, 53.2024435529046 ], "wc_strengths_avg": [ 109.5, 20.081085628023203 ], "wc_weaknesses_avg": [ 179.0, 108.53801177467736 ], "wc_questions_avg": [ 40.25, 42.6402098962939 ], "wc_review_avg": [ 495.75, 102.38987987101069 ], "wc_reply_reviewers_avg": [ 50.75, 81.67427685630281 ], "wc_reply_authors_avg": [ 602.0, 394.44327855852737 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.816496580927726, "gs_citation": 15, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12750433681330117626&as_sdt=5,30&sciodt=0,30&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=AcSChDWL6V", "pdf": "https://openreview.net/pdf?id=AcSChDWL6V", "email": ";rwth-aachen.de;uni-goettingen.de;rwth-aachen.de;rwth-aachen.de", "author_num": 5, "aff_unique_index": "0;1;0;0", "aff_unique_norm": "RWTH Aachen University;Georg-August Universit\u00e4t G\u00f6ttingen", "aff_unique_dep": ";", "aff_unique_url": 
"https://www.rwth-aachen.de;https://www.uni-goettingen.de", "aff_unique_abbr": "RWTH;GAU", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Aachen;", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "Germany" }, { "title": "Risk Bounds of Accelerated SGD for Overparameterized Linear Regression", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19248", "id": "AcoXPIPh4A", "author_site": "Xuheng Li, Yihe Deng, Jingfeng Wu, Dongruo Zhou, Quanquan Gu", "tldr": "", "abstract": "Accelerated stochastic gradient descent (ASGD) is a workhorse in deep learning and often achieves better generalization performance than SGD. However, existing optimization theory can only explain the faster convergence of ASGD, but cannot explain its better generalization. In this paper, we study the generalization of ASGD for overparameterized linear regression, which is possibly the simplest setting of learning with overparameterization. We establish an instance-dependent excess risk bound for ASGD within each eigen-subspace of the data covariance matrix. Our analysis shows that (i) ASGD outperforms SGD in the subspace of small eigenvalues, exhibiting a faster rate of exponential decay for bias error, while in the subspace of large eigenvalues, its bias error decays slower than SGD; and (ii) the variance error of ASGD is always larger than that of SGD. Our result suggests that ASGD can outperform SGD when the difference between the initialization and the true weight vector is mostly confined to the subspace of small eigenvalues. Additionally, when our analysis is specialized to linear regression in the strongly convex setting, it yields a tighter bound for bias error than the best-known result.", "keywords": "Accelerated stochastic gradient descent;excess risk;linear regression;overparameterization", "primary_area": "learning theory", "supplementary_material": "/attachment/81ed44f42960f9d6a83ba25e890d44117641bc92.pdf", "author": "Xuheng Li;Yihe Deng;Jingfeng Wu;Dongruo Zhou;Quanquan Gu", "authorids": "~Xuheng_Li1;~Yihe_Deng1;~Jingfeng_Wu1;~Dongruo_Zhou1;~Quanquan_Gu1", "gender": "M;F;M;M;M", "homepage": "http://www.pku.edu.cn;;https://uuujf.github.io;;http://web.cs.ucla.edu/~qgu/", "dblp": "330/7681;230/8011;;215/3401;50/4597", "google_scholar": ";7Lix1poAAAAJ;z-KILD8AAAAJ;1780wr0AAAAJ;GU9HgNAAAAAJ", "orcid": ";;0009-0009-3414-4487;;", "linkedin": ";;jingfeng-wu-79205b184/;;", "or_profile": "~Xuheng_Li1;~Yihe_Deng1;~Jingfeng_Wu1;~Dongruo_Zhou1;~Quanquan_Gu1", "aff": "ByteDance Inc.;University of California, Los Angeles;University of California, Berkeley;Indiana University;University of California, Los Angeles", "aff_domain": "bytedance.com;ucla.edu;berkeley.edu;iu.edu;cs.ucla.edu", "position": "Intern;PhD student;Postdoc;Assistant Professor;Associate Professor", "bibtex": "@inproceedings{\nli2024risk,\ntitle={Risk Bounds of Accelerated {SGD} for Overparameterized Linear Regression},\nauthor={Xuheng Li and Yihe Deng and Jingfeng Wu and Dongruo Zhou and Quanquan Gu},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=AcoXPIPh4A}\n}", "github": "", "project": "", "reviewers": "MrsP;BSyC;hi74", "pdf_size": 1086933, "rating": "6;6;6", "confidence": "3;4;3", "soundness": "3;4;3", "contribution": "3;2;3", "presentation": "3;3;3", "wc_summary": "130;68;146", "wc_strengths": "15;61;106", "wc_weaknesses": "15;170;1", "wc_questions": "75;40;1", "wc_review": "235;339;254", "wc_reply_reviewers": 
"0;103;0", "wc_reply_authors": "633;793;8", "reply_reviewers": "0;1;0", "reply_authors": "1;3;1", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 3.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 3.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 114.66666666666667, 33.6386021641143 ], "wc_strengths_avg": [ 60.666666666666664, 37.15134213217905 ], "wc_weaknesses_avg": [ 62.0, 76.58111168340838 ], "wc_questions_avg": [ 38.666666666666664, 30.225081564084416 ], "wc_review_avg": [ 276.0, 45.217990519998416 ], "wc_reply_reviewers_avg": [ 34.333333333333336, 48.554665641476255 ], "wc_reply_authors_avg": [ 478.0, 338.6984893185481 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 1.6666666666666667, 0.9428090415820634 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5460095850641278501&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 9, "openreview": "https://openreview.net/forum?id=AcoXPIPh4A", "pdf": "https://openreview.net/pdf?id=AcoXPIPh4A", "email": "bytedance.com;ucla.edu;berkeley.edu;iu.edu;cs.ucla.edu", "author_num": 5, "aff_unique_index": "0;1;2;3;1", "aff_unique_norm": "ByteDance;University of California, Los Angeles;University of California, Berkeley;Indiana University", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.bytedance.com;https://www.ucla.edu;https://www.berkeley.edu;https://www.indiana.edu", "aff_unique_abbr": "ByteDance;UCLA;UC Berkeley;IU", "aff_campus_unique_index": "1;2;1", "aff_campus_unique": ";Los Angeles;Berkeley", "aff_country_unique_index": "0;1;1;1;1", "aff_country_unique": "China;United States" }, { "title": "Rotation Has Two Sides: Evaluating Data Augmentation for Deep One-class Classification", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19247", "id": "Ad81awoBVS", "author_site": "Guodong Wang, Yunhong Wang, Xiuguo Bao, Di Huang", "tldr": "", "abstract": "One-class classification (OCC) involves predicting whether a new data is normal or anomalous based solely on the data from a single class during training. Various attempts have been made to learn suitable representations for OCC within a self-supervised framework. Notably, discriminative methods that use geometric visual transformations, such as rotation, to generate pseudo-anomaly samples have exhibited impressive detection performance. Although rotation is commonly viewed as a distribution-shifting transformation and is widely used in the literature, the cause of its effectiveness remains a mystery. In this study, we are the first to make a surprising observation: there exists a strong linear relationship (Pearson's Correlation, $r > 0.9$) between the accuracy of rotation prediction and the performance of OCC. This suggests that a classifier that effectively distinguishes different rotations is more likely to excel in OCC, and vice versa. The root cause of this phenomenon can be attributed to the transformation bias in the dataset, where representations learned from transformations already present in the dataset tend to be less effective, making it essential to accurately estimate the transformation distribution before utilizing pretext tasks involving these transformations for reliable self-supervised representation learning. 
To this end, we propose a novel two-stage method to estimate the transformation distribution within the dataset. In the first stage, we learn general representations through standard contrastive pre-training. In the second stage, we select potentially semantics-preserving samples from the entire augmented dataset, which includes all rotations, by employing density matching with the provided reference distribution. By sorting samples based on semantics-preserving versus shifting transformations, we achieve improved performance on OCC benchmarks.", "keywords": "self-supervised learning;deep one-class classification", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Guodong Wang;Yunhong Wang;Xiuguo Bao;Di Huang", "authorids": "~Guodong_Wang3;~Yunhong_Wang1;~Xiuguo_Bao3;~Di_Huang4", "gender": "M;;M;M", "homepage": "https://gdwang08.github.io/;;https://dblp.org/rec/conf/ijcai/LiCZB022;http://irip.buaa.edu.cn/dihuang/index.html", "dblp": ";;;45/780-1", "google_scholar": "9xCdnoQAAAAJ;;;https://scholar.google.com/citations?hl=en", "orcid": ";;;0000-0002-2412-9330", "linkedin": ";;;", "or_profile": "~Guodong_Wang3;~Yunhong_Wang1;~Xiuguo_Bao3;~Di_Huang4", "aff": "Beihang University;;;Beihang University", "aff_domain": "buaa.edu.cn;;;buaa.edu.cn", "position": "PhD student;;;Full Professor", "bibtex": "@inproceedings{\nwang2024rotation,\ntitle={Rotation Has Two Sides: Evaluating Data Augmentation for Deep One-class Classification},\nauthor={Guodong Wang and Yunhong Wang and Xiuguo Bao and Di Huang},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=Ad81awoBVS}\n}", "github": "", "project": "", "reviewers": "Yjs1;jwSM;vKuc;Soam;h8uB", "pdf_size": 878803, "rating": "3;6;6;6;6", "confidence": "4;5;4;3;2", "soundness": "2;3;3;2;3", "contribution": "1;3;3;3;3", "presentation": "2;3;3;3;2", "wc_summary": "64;50;222;70;56", "wc_strengths": "31;21;97;129;93", "wc_weaknesses": "181;61;173;102;149", "wc_questions": "3;101;104;61;31", "wc_review": "279;233;596;362;329", "wc_reply_reviewers": "0;0;0;0;0", "wc_reply_authors": "555;887;635;537;212", "reply_reviewers": "0;0;0;0;0", "reply_authors": "1;2;1;1;1", "rating_avg": [ 5.4, 1.2 ], "confidence_avg": [ 3.6, 1.019803902718557 ], "soundness_avg": [ 2.6, 0.4898979485566356 ], "contribution_avg": [ 2.6, 0.8000000000000002 ], "presentation_avg": [ 2.6, 0.4898979485566356 ], "wc_summary_avg": [ 92.4, 65.15704106234413 ], "wc_strengths_avg": [ 74.2, 41.40724574274411 ], "wc_weaknesses_avg": [ 133.2, 45.397797303393475 ], "wc_questions_avg": [ 60.0, 39.2632143360678 ], "wc_review_avg": [ 359.8, 125.97682326523399 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 565.2, 216.3685744279885 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.2, 0.4000000000000001 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.19611613513818404, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=8500072982366343769&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 2, "openreview": "https://openreview.net/forum?id=Ad81awoBVS", "pdf": "https://openreview.net/pdf?id=Ad81awoBVS", "email": "buaa.edu.cn;;;buaa.edu.cn", "author_num": 4, "aff_unique_index": "0;0", "aff_unique_norm": "Beihang University", "aff_unique_dep": "", "aff_unique_url": "http://www.buaa.edu.cn/", "aff_unique_abbr": "BUAA", "aff_campus_unique_index": "",
"aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "China" }, { "title": "Ghost on the Shell: An Expressive Representation of General 3D Shapes", "status": "Oral", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19246", "id": "Ad87VjRqUw", "author_site": "Zhen Liu, Yao Feng, Yuliang Xiu, Weiyang Liu, Liam Paull, Michael J Black, Bernhard Schoelkopf", "tldr": "", "abstract": "The creation of photorealistic virtual worlds requires the accurate modeling of 3D surface geometry for a wide range of objects. For this, meshes are appealing since they enable 1) fast physics-based rendering with realistic material and lighting, 2) physical simulation, and 3) are memory-efficient for modern graphics pipelines. Recent work on reconstructing and statistically modeling 3D shape, however, has critiqued meshes as being topologically inflexible. To capture a wide range of object shapes, any 3D representation must be able to model solid, watertight, shapes as well as thin, open, surfaces. Recent work has focused on the former, and methods for reconstructing open surfaces do not support fast reconstruction with material and lighting or unconditional generative modelling. Inspired by the observation that open surfaces can be seen as islands floating on watertight surfaces, we parametrize open surfaces by defining a manifold signed distance field on watertight templates. With this parametrization, we further develop a grid-based and differentiable representation that parametrizes both watertight and non-watertight meshes of arbitrary topology. Our new representation, called Ghost-on-the-Shell (G-Shell), enables two important applications: differentiable rasterization-based reconstruction from multiview images and generative modelling of non-watertight meshes. We empirically demonstrate that G-Shell achieves state-of-the-art performance on non-watertight mesh reconstruction and generation tasks, while also performing effectively for watertight meshes.", "keywords": "Non-watertight mesh; generative model; 3D geometry; differentiable rendering", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Zhen Liu;Yao Feng;Yuliang Xiu;Weiyang Liu;Liam Paull;Michael J. Black;Bernhard Sch\u00f6lkopf", "authorids": "~Zhen_Liu6;~Yao_Feng3;~Yuliang_Xiu2;~Weiyang_Liu1;~Liam_Paull1;~Michael_J._Black1;~Bernhard_Sch\u00f6lkopf1", "gender": "M;F;M;M;;;", "homepage": ";https://ps.is.tuebingen.mpg.de/person/yfeng;http://xiuyuliang.cn;http://wyliu.com/;;;", "dblp": "77/35-19;05/9861;215/3940;137/1532;;;", "google_scholar": "I1IiJCAAAAAJ;wNQQhSIAAAAJ;https://scholar.google.com.hk/citations?hl=zh-CN;DMjROf0AAAAJ;;;", "orcid": ";0000-0002-9481-9783;0000-0003-0165-5909;;;;", "linkedin": ";;yuliangxiu;;;;", "or_profile": "~Zhen_Liu6;~Yao_Feng3;~Yuliang_Xiu2;~Weiyang_Liu1;~Liam_Paull1;~Michael_J._Black1;~Bernhard_Sch\u00f6lkopf1", "aff": "University of Montreal;ETHZ - ETH Zurich;Max Planck Institute for Intelligent Systems, Max-Planck Institute;University of Cambridge;;;", "aff_domain": "umontreal.ca;ethz.ch;tuebingen.mpg.de;cam.ac.uk;;;", "position": "PhD student;PhD student;PhD student;Researcher;;;", "bibtex": "@inproceedings{\nliu2024ghost,\ntitle={Ghost on the Shell: An Expressive Representation of General 3D Shapes},\nauthor={Zhen Liu and Yao Feng and Yuliang Xiu and Weiyang Liu and Liam Paull and Michael J. 
Black and Bernhard Sch{\\\"o}lkopf},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=Ad87VjRqUw}\n}", "github": "", "project": "", "reviewers": "RYwJ;9iXa;dsfR;hJqu", "pdf_size": 14168139, "rating": "5;8;8;8", "confidence": "5;3;5;4", "soundness": "4;3;4;3", "contribution": "3;3;3;3", "presentation": "4;4;3;2", "wc_summary": "75;66;40;97", "wc_strengths": "47;215;24;45", "wc_weaknesses": "86;72;39;292", "wc_questions": "4;188;72;262", "wc_review": "212;541;175;696", "wc_reply_reviewers": "0;41;21;0", "wc_reply_authors": "520;817;535;2092", "reply_reviewers": "0;1;1;0", "reply_authors": "1;2;1;3", "rating_avg": [ 7.25, 1.299038105676658 ], "confidence_avg": [ 4.25, 0.82915619758885 ], "soundness_avg": [ 3.5, 0.5 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 3.25, 0.82915619758885 ], "wc_summary_avg": [ 69.5, 20.426698215815495 ], "wc_strengths_avg": [ 82.75, 76.88424741128705 ], "wc_weaknesses_avg": [ 122.25, 99.47958333246073 ], "wc_questions_avg": [ 131.5, 100.02374718035712 ], "wc_review_avg": [ 406.0, 219.8419887100733 ], "wc_reply_reviewers_avg": [ 15.5, 17.03672503740082 ], "wc_reply_authors_avg": [ 991.0, 646.5783015227158 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.75, 0.82915619758885 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.5222329678670935, "gs_citation": 15, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11053737743132381826&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=Ad87VjRqUw", "pdf": "https://openreview.net/pdf?id=Ad87VjRqUw", "email": "umontreal.ca;ethz.ch;tuebingen.mpg.de;cam.ac.uk;;;", "author_num": 7, "aff_unique_index": "0;1;2;3", "aff_unique_norm": "University of Montreal;ETH Zurich;Max Planck Institute for Intelligent Systems;University of Cambridge", "aff_unique_dep": ";;Intelligent Systems;", "aff_unique_url": "https://wwwumontreal.ca;https://www.ethz.ch;https://www.mpi-is.mpg.de;https://www.cam.ac.uk", "aff_unique_abbr": "UM;ETHZ;MPI-IS;Cambridge", "aff_campus_unique_index": "1", "aff_campus_unique": ";Cambridge", "aff_country_unique_index": "0;1;2;3", "aff_country_unique": "Canada;Switzerland;Germany;United Kingdom" }, { "id": "Aemqy6Hjdj", "title": "Enhancing Compositional Generalization via Compositional Feature Alignment", "track": "main", "status": "Reject", "tldr": "", "abstract": "Real-world applications of machine learning (ML) models often confront data distribution shifts, wherein discrepancies exist between the training and test data distributions. In the common multi-domain multi-class setup, as the number of classes and domains scales up, it becomes infeasible to gather training data for every domain-class combination. This challenge naturally leads the quest for models with Compositional Generalization (CG) ability, where models can generalize to unseen domain-class combinations. To delve into the CG challenge, we develop CG-Bench, a suite of CG benchmarks derived from existing real-world image datasets, and observe that the prevalent pretraining-finetuning paradigm on foundational models, such as CLIP and DINOv2, struggles with the challenge. 
To address this challenge, we propose Compositional Feature Alignment (CFA), a simple two-stage finetuning technique that i) learns two orthogonal linear heads on a pretrained encoder with respect to class and domain labels, and ii) fine-tunes the encoder with the newly learned head frozen. We theoretically and empirically justify that CFA encourages compositional feature learning of pretrained models. We further conduct extensive experiments on CG-Bench for CLIP and DINOv2, two powerful pretrained vision foundation models. Experiment results show that CFA outperforms common finetuning techniques in compositional generalization, corroborating CFA's efficacy in compositional feature learning.", "keywords": "OOD Generalization;Fine-tuning;Compositional Generalization", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "/attachment/4c14940f660ae48e6cb30c38a01c856ccbca7457.zip", "author": "Haoxiang Wang;Haozhe Si;Huajie Shao;Han Zhao", "authorids": "~Haoxiang_Wang1;~Haozhe_Si1;~Huajie_Shao1;~Han_Zhao1", "gender": "M;M;M;M", "homepage": "https://haoxiang-wang.github.io/;https://ehzoahis.github.io/;https://huajieshao.github.io/;https://hanzhaoml.github.io/", "dblp": ";;179/4173;03/3520-2", "google_scholar": "bcInPlwAAAAJ;DUcnRMMAAAAJ;5-D7ZLsAAAAJ;x942ipYAAAAJ", "orcid": ";;0000-0001-7627-5615;0000-0002-8579-1600", "linkedin": "haoxiang-wang-071414ab/;haozhesi-468811146/;huajie-shao-508465113/;", "or_profile": "~Haoxiang_Wang1;~Haozhe_Si1;~Huajie_Shao1;~Han_Zhao1", "aff": "University of Illinois, Urbana Champaign;University of Illinois Urbana-Champaign;College of William and Mary;University of Illinois, Urbana Champaign", "aff_domain": "illinois.edu;illunois.edu;wm.edu;illinois.edu", "position": "PhD student;PhD student;Assistant Professor;Assistant Professor", "bibtex": "@misc{\nwang2024enhancing,\ntitle={Enhancing Compositional Generalization via Compositional Feature Alignment},\nauthor={Haoxiang Wang and Haozhe Si and Huajie Shao and Han Zhao},\nyear={2024},\nurl={https://openreview.net/forum?id=Aemqy6Hjdj}\n}", "github": "", "project": "", "reviewers": "ZjmZ;d1KC;H15m", "site": "https://openreview.net/forum?id=Aemqy6Hjdj", "pdf_size": 5692695, "rating": "5;6;6", "confidence": "4;3;4", "soundness": "2;3;3", "contribution": "2;3;2", "presentation": "3;2;3", "wc_summary": "66;113;50", "wc_strengths": "74;85;49", "wc_weaknesses": "298;41;117", "wc_questions": "51;28;14", "wc_review": "489;267;230", "wc_reply_reviewers": "104;0;89", "wc_reply_authors": "1796;436;1300", "reply_reviewers": "1;0;1", "reply_authors": "4;1;3", "rating_avg": [ 5.666666666666667, 0.4714045207910317 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 76.33333333333333, 26.737406173540634 ], "wc_strengths_avg": [ 69.33333333333333, 15.062831370260005 ], "wc_weaknesses_avg": [ 152.0, 107.79919603905526 ], "wc_questions_avg": [ 31.0, 15.253414918196734 ], "wc_review_avg": [ 328.6666666666667, 114.37462811111368 ], "wc_reply_reviewers_avg": [ 64.33333333333333, 45.90085934804368 ], "wc_reply_authors_avg": [ 1177.3333333333333, 561.9521529651988 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 2.6666666666666665, 1.247219128924647 ], "replies_avg": [ 23, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 
-0.4999999999999999, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:FlompfGzqNAJ:scholar.google.com/&scioq=Enhancing+Compositional+Generalization+via+Compositional+Feature+Alignment&hl=en&as_sdt=0,33", "gs_version_total": 4, "aff_unique_index": "0;0;1;0", "aff_unique_norm": "University of Illinois Urbana-Champaign;College of William and Mary", "aff_unique_dep": ";", "aff_unique_url": "https://illinois.edu;https://www.wm.edu", "aff_unique_abbr": "UIUC;WM", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Urbana-Champaign;", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "id": "AfSpl24oUJ", "title": "A graph transformer for symbolic regression", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Inferring the underlying mathematical expressions from real-world observed data is a central challenge in scientific discovery. Symbolic regression (SR) techniques stand out as a primary method for addressing this challenge, as they explore a function space characterized by interpretable analytical expressions. Recently, transformer-based approaches have gained widespread popularity for solving symbolic regression problems. However, these existing transformer-based models rely on pre-order traversal of expressions as supervision, essentially compressing the information within a computation tree into a token sequence. This compression makes the derived formula highly sensitive to the order of decoded tokens. To address this sensitivity issue, we introduce a novel model architecture called the Graph Transformer (GT), which is purpose-built for directly predicting the tree structure of mathematical formulas. In empirical evaluations, our proposed method demonstrates significant improvements in terms of formula skeleton recovery rates and R-squared scores for data fitting when compared to state-of-the-art transformer-based approaches.", "keywords": "attention mechanism;graph transformer;symbolic regression", "primary_area": "generative models", "supplementary_material": "", "author": "Weiheng Zhong;Hadi Meidani", "authorids": "~Weiheng_Zhong1;~Hadi_Meidani1", "gender": "M;Not Specified", "homepage": ";https://uq.cee.illinois.edu", "dblp": ";", "google_scholar": "fgLb_DsAAAAJ;", "orcid": "0000-0002-7902-3568;", "linkedin": "weiheng-zhong-796481238/;", "or_profile": "~Weiheng_Zhong1;~Hadi_Meidani1", "aff": "University of Illinois Urbana Champaign;", "aff_domain": "illinois.edu;", "position": "PhD student;", "bibtex": "@misc{\nzhong2024a,\ntitle={A graph transformer for symbolic regression},\nauthor={Weiheng Zhong and Hadi Meidani},\nyear={2024},\nurl={https://openreview.net/forum?id=AfSpl24oUJ}\n}", "github": "", "project": "", "reviewers": "YZQC;mTB4;dKpQ;SCmX", "site": "https://openreview.net/forum?id=AfSpl24oUJ", "pdf_size": 806007, "rating": "3;3;5;5", "confidence": "4;4;4;4", "soundness": "3;2;3;3", "contribution": "2;2;2;3", "presentation": "1;2;2;2", "wc_summary": "113;56;26;73", "wc_strengths": "115;44;39;42", "wc_weaknesses": "773;265;184;35", "wc_questions": "247;100;185;162", "wc_review": "1248;465;434;312", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 1.75, 0.4330127018922193 ], "wc_summary_avg": [ 67.0, 31.44041984452498 ], "wc_strengths_avg": [ 
60.0, 31.804087787578503 ], "wc_weaknesses_avg": [ 314.25, 277.4088814367702 ], "wc_questions_avg": [ 173.5, 52.60465758846834 ], "wc_review_avg": [ 614.75, 370.0536278703399 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:cVyLaAYYqowJ:scholar.google.com/&scioq=A+graph+transformer+for+symbolic+regression&hl=en&as_sdt=0,48", "gs_version_total": 0, "aff_unique_index": "0", "aff_unique_norm": "University of Illinois Urbana-Champaign", "aff_unique_dep": "", "aff_unique_url": "https://illinois.edu", "aff_unique_abbr": "UIUC", "aff_campus_unique_index": "0", "aff_campus_unique": "Urbana-Champaign", "aff_country_unique_index": "0", "aff_country_unique": "United States" }, { "title": "General Stability Analysis for Zeroth-Order Optimization Algorithms", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19245", "id": "AfhNyr73Ma", "author_site": "Xinyue Liu, Hualin Zhang, Bin Gu, Hong Chen", "tldr": "", "abstract": "Zeroth-order optimization algorithms are widely used for black-box optimization problems, such as those in machine learning and prompt engineering, where the gradients are approximated using function evaluations. Recently, a generalization result was provided for zeroth-order stochastic gradient descent (SGD) algorithms through stability analysis. However, this result was limited to the vanilla 2-point zeroth-order estimate of Gaussian distribution used in SGD algorithms. To address these limitations, we propose a general proof framework for stability analysis that applies to convex, strongly convex, and non-convex conditions, and yields results for popular zeroth-order optimization algorithms, including SGD, GD, and SVRG, as well as various zeroth-order estimates, such as 1-point and 2-point with different distributions and coordinate estimates. 
Our general analysis shows that coordinate estimation can lead to tighter generalization bounds for SGD, GD, and SVRG versions of zeroth-order optimization algorithms, due to the smaller expansion brought by coordinate estimates to stability analysis.", "keywords": "Stability Analysis; Zeroth-Order Optimization; Black-Box Learning", "primary_area": "learning theory", "supplementary_material": "/attachment/ce5a38524d3d18e6062d950399c839cc2e0e1042.zip", "author": "Xinyue Liu;Hualin Zhang;Bin Gu;Hong Chen", "authorids": "~Xinyue_Liu3;~Hualin_Zhang1;~Bin_Gu1;~Hong_Chen1", "gender": "F;M;M;", "homepage": ";https://github.com/zhanghualin0;https://mbzuai.ac.ae/study/faculty/bin-gu/;https://chenhongml.github.io/", "dblp": ";303/7916;29/1758-1;https://dblp.uni-trier.de/pers/hd/c/Chen_0004:Hong", "google_scholar": ";;Vo8OgCgAAAAJ;", "orcid": "0009-0005-4885-1917;;0000-0001-6049-1815;", "linkedin": ";;;", "or_profile": "~Xinyue_Liu3;~Hualin_Zhang1;~Bin_Gu1;~Hong_Chen1", "aff": "Huazhong Agricultural University;Mohamed bin Zayed University of Artificial Intelligence;Mohamed bin Zayed University of Artificial Intelligence;Huazhong Agricultural University", "aff_domain": "hzau.edu.cn;mbzuai.ac.ae;mbzuai.ac.ae;hzau.edu.cn", "position": "Undergrad student;PhD student;Assistant Professor;Full Professor", "bibtex": "@inproceedings{\nliu2024general,\ntitle={General Stability Analysis for Zeroth-Order Optimization Algorithms},\nauthor={Xinyue Liu and Hualin Zhang and Bin Gu and Hong Chen},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=AfhNyr73Ma}\n}", "github": "", "project": "", "reviewers": "qUEd;PNwi;N2Y8;x656", "pdf_size": 1050024, "rating": "6;6;8;8", "confidence": "4;4;3;3", "soundness": "3;3;3;4", "contribution": "2;3;3;3", "presentation": "3;3;3;4", "wc_summary": "118;45;61;185", "wc_strengths": "63;34;63;49", "wc_weaknesses": "122;73;27;30", "wc_questions": "55;5;15;28", "wc_review": "358;157;166;292", "wc_reply_reviewers": "25;0;0;10", "wc_reply_authors": "1178;385;365;175", "reply_reviewers": "1;0;0;1", "reply_authors": "3;1;1;2", "rating_avg": [ 7.0, 1.0 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 102.25, 54.94258366695181 ], "wc_strengths_avg": [ 52.25, 11.986972094736853 ], "wc_weaknesses_avg": [ 63.0, 38.61994303465504 ], "wc_questions_avg": [ 25.75, 18.7533330370897 ], "wc_review_avg": [ 243.25, 85.07459961704198 ], "wc_reply_reviewers_avg": [ 8.75, 10.231690964840562 ], "wc_reply_authors_avg": [ 525.75, 385.39160278864404 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.75, 0.82915619758885 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -1.0, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10860145463877914785&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 2, "openreview": "https://openreview.net/forum?id=AfhNyr73Ma", "pdf": "https://openreview.net/pdf?id=AfhNyr73Ma", "email": "hzau.edu.cn;mbzuai.ac.ae;mbzuai.ac.ae;hzau.edu.cn", "author_num": 4, "aff_unique_index": "0;1;1;0", "aff_unique_norm": "Huazhong Agricultural University;Mohamed bin Zayed University of Artificial Intelligence", "aff_unique_dep": ";", "aff_unique_url": "http://www.hzau.edu.cn/;https://mbzuai.ac.ae", "aff_unique_abbr": "HAU;MBZUAI", "aff_campus_unique_index": "", "aff_campus_unique": "", 
"aff_country_unique_index": "0;1;1;0", "aff_country_unique": "China;United Arab Emirates" }, { "id": "AfiM6F2YPY", "title": "Applying language models to algebraic topology: generating simplicial cycles using multi-labeling in Wu's formula", "track": "main", "status": "Reject", "tldr": "", "abstract": "Computing homotopy groups of spheres has long been a fundamental objective in algebraic topology. Various theoretical and algorithmic approaches have been developed to tackle this problem. In this paper we take a step towards the goal of comprehending the group-theoretic structure of the generators of these homotopy groups by leveraging the power of machine learning. Specifically, in the simplicial group setting of Wu's formula, we reformulate the problem of generating simplicial cycles as a problem of sampling from the intersection of algorithmic datasets related to Dyck languages. We present and evaluate language modelling approaches that employ multi-label information for input sequences, along with the necessary group-theoretic toolkit and non-neural baselines.", "keywords": "transformers;group theory;algebraic topology", "primary_area": "generative models", "supplementary_material": "/attachment/41fddd281731146639d01291e86d6c2c55ce872f.zip", "author": "Kirill Brilliantov;Fedor Pavutnitskiy;Dmitry Pasechnyuk;German Magai", "authorids": "~Kirill_Brilliantov1;~Fedor_Pavutnitskiy1;~Dmitry_Pasechnyuk1;~German_Magai1", "gender": "M;M;M;M", "homepage": "https://github.com/kibrq;;http://dmivilensky.ru/;https://www.hse.ru/en/org/persons/364631586", "dblp": "350/5533;285/5395;242/6650;318/9190", "google_scholar": "thgwrhYAAAAJ;;yUfa6X8AAAAJ;", "orcid": ";0000-0002-8676-6941;0000-0002-1208-1659;", "linkedin": ";;;german-magai-0b7a69233/", "or_profile": "~Kirill_Brilliantov1;~Fedor_Pavutnitskiy1;~Dmitry_Pasechnyuk1;~German_Magai1", "aff": "ETHZ - ETH Zurich;Beijing Institute of Mathematical Sciences and Applications;Mohamed bin Zayed University of Artificial Intelligence;Higher School of Economics", "aff_domain": "ethz.ch;bimsa.cn;mbzuai.ac.ae;hse.ru", "position": "MS student;Assistant Professor;Researcher;PhD student", "bibtex": "@misc{\nbrilliantov2024applying,\ntitle={Applying language models to algebraic topology: generating simplicial cycles using multi-labeling in Wu's formula},\nauthor={Kirill Brilliantov and Fedor Pavutnitskiy and Dmitry Pasechnyuk and German Magai},\nyear={2024},\nurl={https://openreview.net/forum?id=AfiM6F2YPY}\n}", "github": "", "project": "", "reviewers": "VtUd;LHhA;aKQP", "site": "https://openreview.net/forum?id=AfiM6F2YPY", "pdf_size": 785192, "rating": "3;3;6", "confidence": "3;4;3", "soundness": "3;3;4", "contribution": "2;3;4", "presentation": "2;2;4", "wc_summary": "60;283;102", "wc_strengths": "58;85;29", "wc_weaknesses": "306;184;61", "wc_questions": "40;436;49", "wc_review": "464;988;241", "wc_reply_reviewers": "180;230;77", "wc_reply_authors": "720;804;298", "reply_reviewers": "1;1;1", "reply_authors": "1;1;1", "rating_avg": [ 4.0, 1.4142135623730951 ], "confidence_avg": [ 3.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 3.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 3.0, 0.816496580927726 ], "presentation_avg": [ 2.6666666666666665, 0.9428090415820634 ], "wc_summary_avg": [ 148.33333333333334, 96.75513193394734 ], "wc_strengths_avg": [ 57.333333333333336, 22.866763848189994 ], "wc_weaknesses_avg": [ 183.66666666666666, 100.02110888318637 ], "wc_questions_avg": [ 175.0, 184.59144075498193 ], "wc_review_avg": [ 564.3333333333334, 
313.10523612499503 ], "wc_reply_reviewers_avg": [ 162.33333333333334, 63.698944697346086 ], "wc_reply_authors_avg": [ 607.3333333333334, 221.4036033030076 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.5, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:ri0V03MH7o8J:scholar.google.com/&scioq=Applying+language+models+to+algebraic+topology:+generating+simplicial+cycles+using+multi-labeling+in+Wu%27s+formula&hl=en&as_sdt=0,5", "gs_version_total": 9, "aff_unique_index": "0;1;2;3", "aff_unique_norm": "ETH Zurich;Beijing Institute of Mathematical Sciences and Applications;Mohamed bin Zayed University of Artificial Intelligence;Higher School of Economics", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.ethz.ch;;https://mbzuai.ac.ae;https://www.hse.ru", "aff_unique_abbr": "ETHZ;;MBZUAI;HSE", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;2;3", "aff_country_unique": "Switzerland;China;United Arab Emirates;Russian Federation" }, { "title": "Role of Locality and Weight Sharing in Image-Based Tasks: A Sample Complexity Separation between CNNs, LCNs, and FCNs", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19244", "id": "AfnsTnYphT", "author_site": "Aakash Sunil Lahoti, Stefani Karp, Ezra Winston, Aarti Singh, Yuanzhi Li", "tldr": "", "abstract": "Vision tasks are characterized by the properties of locality and translation invariance. \n The superior performance of convolutional neural networks (CNNs) on these tasks is widely attributed to the inductive bias of locality and weight sharing baked into their architecture.\n Existing attempts to quantify the statistical benefits of these biases in CNNs over locally connected convolutional neural networks (LCNs) and fully connected neural networks (FCNs) fall into one of the following categories: either they disregard the optimizer and only provide uniform convergence upper bounds with no separating lower bounds, \n or they consider simplistic tasks that do not truly mirror the locality and translation invariance as found in real-world vision tasks.\n To address these deficiencies, we introduce the Dynamic Signal Distribution (DSD) classification task that models an image as consisting of $k$ patches, each of dimension $d$, and the label is determined by a $d$-sparse signal vector that can freely appear in any one of the $k$ patches. \n On this task, for any orthogonally equivariant algorithm like gradient descent, we prove that CNNs require $\\tilde{O}(k+d)$ samples, whereas LCNs require $\\Omega(kd)$ samples, establishing the statistical advantages of weight sharing in translation invariant tasks. 
\n Furthermore, LCNs need $\\tilde{O}(k(k+d))$ samples, compared to $\\Omega(k^2d)$ samples for FCNs, showcasing the benefits of locality in local tasks.\n Additionally, we develop information theoretic tools for analyzing randomized algorithms, which may be of interest for statistical research.", "keywords": "Deep Learning Theory;Sample Complexity;Convolutional Neural Networks", "primary_area": "learning theory", "supplementary_material": "", "author": "Aakash Lahoti;Stefani Karp;Ezra Winston;Aarti Singh;Yuanzhi Li", "authorids": "~Aakash_Lahoti1;~Stefani_Karp1;~Ezra_Winston1;~Aarti_Singh1;~Yuanzhi_Li1", "gender": "M;F;;F;M", "homepage": ";;https://ezrawinston.github.io;https://www.cs.cmu.edu/~aarti;", "dblp": ";280/1111;66/9442;64/5328;73/3628", "google_scholar": "wGUvxZQAAAAJ;iMknz8EAAAAJ;;vGBcNVAAAAAJ;", "orcid": ";;;;", "linkedin": "aakashlahoti/;;;;", "or_profile": "~Aakash_Lahoti1;~Stefani_Karp1;~Ezra_Winston1;~Aarti_Singh1;~Yuanzhi_Li1", "aff": "Carnegie Mellon University;Carnegie Mellon University;Machine Learning Department, School of Computer Science;University of Wisconsin - Madison;Carnegie Mellon University", "aff_domain": "andrew.cmu.edu;cmu.edu;mld.cs.cmu.edu;wisc.edu;andrew.cmu.edu", "position": "PhD student;PhD student;PhD student;PhD student;Assistant Professor", "bibtex": "@inproceedings{\nlahoti2024role,\ntitle={Role of Locality and Weight Sharing in Image-Based Tasks: A Sample Complexity Separation between {CNN}s, {LCN}s, and {FCN}s},\nauthor={Aakash Lahoti and Stefani Karp and Ezra Winston and Aarti Singh and Yuanzhi Li},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=AfnsTnYphT}\n}", "github": "", "project": "", "reviewers": "yeJ4;o7GU;jtyo;LSto", "pdf_size": 1988737, "rating": "6;8;8;8", "confidence": "3;5;3;3", "soundness": "3;3;3;4", "contribution": "3;2;2;3", "presentation": "3;3;3;4", "wc_summary": "28;78;22;176", "wc_strengths": "49;46;23;176", "wc_weaknesses": "167;367;226;84", "wc_questions": "9;1;49;36", "wc_review": "253;492;320;472", "wc_reply_reviewers": "0;36;12;0", "wc_reply_authors": "596;1889;332;195", "reply_reviewers": "0;1;1;0", "reply_authors": "2;4;2;1", "rating_avg": [ 7.5, 0.8660254037844386 ], "confidence_avg": [ 3.5, 0.8660254037844386 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 76.0, 61.69278726074872 ], "wc_strengths_avg": [ 73.5, 60.02707722353305 ], "wc_weaknesses_avg": [ 211.0, 103.23032500191017 ], "wc_questions_avg": [ 23.75, 19.51121472384536 ], "wc_review_avg": [ 384.25, 100.82751360615812 ], "wc_reply_reviewers_avg": [ 12.0, 14.696938456699069 ], "wc_reply_authors_avg": [ 753.0, 671.5188009281646 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 2.25, 1.0897247358851685 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.3333333333333333, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=17650709807965419878&as_sdt=5,24&sciodt=0,24&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=AfnsTnYphT", "pdf": "https://openreview.net/pdf?id=AfnsTnYphT", "email": "andrew.cmu.edu;cmu.edu;mld.cs.cmu.edu;wisc.edu;andrew.cmu.edu", "author_num": 5, "aff_unique_index": "0;0;0;1;0", "aff_unique_norm": "Carnegie Mellon University;University of Wisconsin-Madison", "aff_unique_dep": ";", "aff_unique_url": "https://www.cmu.edu;https://www.wisc.edu", 
"aff_unique_abbr": "CMU;UW-Madison", "aff_campus_unique_index": "1", "aff_campus_unique": ";Madison", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "AgCz44ebFe", "title": "May the Forgetting Be with You: Alternate Replay for Learning with Noisy Labels", "track": "main", "status": "Reject", "tldr": "", "abstract": "Forgetting presents a significant challenge during incremental training, making it particularly demanding for contemporary AI systems to assimilate new knowledge in streaming data environments. To address this issue, most approaches in Continual Learning (CL) rely on the replay of a restricted buffer of past data. However, the presence of noise in real-world scenarios, where human annotation is constrained by time limitations, frequently renders these strategies vulnerable. In this study, we address the problem of CL under Noisy labels (CLN) by introducing Alternate Experience Replay (AER), a novel strategy that takes advantage of forgetting to maintain a clear differentiation between clean, complex, and noisy samples in the memory buffer. The idea is that complex or mislabeled examples, which hardly fit the previously learned data distribution, are the ones most likely to be forgotten. To grasp the benefits of such a separation, we equip AER with Asymmetric Balanced Sampling: a new sample selection strategy that prioritizes purity on the current task while retaining relevant samples from the past. Through extensive computational comparisons, we demonstrate the effectiveness of our approach in terms of both accuracy and purity of the obtained buffer, resulting in a remarkable average gain of $7.45\\%$ points in accuracy w.r.t. existing loss-based purification strategies.", "keywords": "continual learning;lifelong learning;noisy labels;forgetting;rehearsal;incremental learning", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "/attachment/2b9e56ab884c20e4677d96cf7ae97e2e37311c78.zip", "author": "Monica Millunzi;Lorenzo Bonicelli;Angelo Porrello;Jacopo Credi;Petter N. Kolm;Simone Calderara", "authorids": "~Monica_Millunzi1;~Lorenzo_Bonicelli1;~Angelo_Porrello1;~Jacopo_Credi1;~Petter_N._Kolm1;~Simone_Calderara1", "gender": ";M;M;M;;M", "homepage": ";https://lorenzobonicelli.net/;;;;", "dblp": ";299/8442;223/4466;;;13/422", "google_scholar": ";ovXU58MAAAAJ;b3-5Ys4AAAAJ;XOG3FBEAAAAJ;;https://scholar.google.it/citations?user=CZd-WXkAAAAJ", "orcid": ";0000-0002-9717-5602;0000-0002-9022-8484;;;0000-0001-9056-1538", "linkedin": ";;;jacopocredi/;;", "or_profile": "~Monica_Millunzi1;~Lorenzo_Bonicelli1;~Angelo_Porrello1;~Jacopo_Credi1;~Petter_N._Kolm1;~Simone_Calderara1", "aff": ";University of Modena and Reggio Emilia;University of Modena and Reggio Emilia, AimageLab;;;University of Modena and Reggio Emilia", "aff_domain": ";unimore.it;unimore.it;;;unimore.it", "position": ";PhD student;Postdoc;;;Full Professor", "bibtex": "@misc{\nmillunzi2024may,\ntitle={May the Forgetting Be with You: Alternate Replay for Learning with Noisy Labels},\nauthor={Monica Millunzi and Lorenzo Bonicelli and Angelo Porrello and Jacopo Credi and Petter N. 
Kolm and Simone Calderara},\nyear={2024},\nurl={https://openreview.net/forum?id=AgCz44ebFe}\n}", "github": "", "project": "", "reviewers": "QKiJ;Jj1M;2XeP;aFAe", "site": "https://openreview.net/forum?id=AgCz44ebFe", "pdf_size": 1654384, "rating": "3;5;5;6", "confidence": "4;4;3;4", "soundness": "2;2;2;2", "contribution": "1;2;2;2", "presentation": "2;3;2;3", "wc_summary": "88;58;165;65", "wc_strengths": "23;19;79;34", "wc_weaknesses": "183;265;66;502", "wc_questions": "15;6;82;4", "wc_review": "309;348;392;605", "wc_reply_reviewers": "0;178;0;483", "wc_reply_authors": "403;1529;980;1896", "reply_reviewers": "0;2;0;2", "reply_authors": "1;4;2;4", "rating_avg": [ 4.75, 1.0897247358851685 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 94.0, 42.46763473517215 ], "wc_strengths_avg": [ 38.75, 23.878599205146017 ], "wc_weaknesses_avg": [ 254.0, 159.69502183850315 ], "wc_questions_avg": [ 26.75, 32.16655872175325 ], "wc_review_avg": [ 413.5, 114.39514849852681 ], "wc_reply_reviewers_avg": [ 165.25, 197.321279896518 ], "wc_reply_authors_avg": [ 1202.0, 564.8561763847501 ], "reply_reviewers_avg": [ 1.0, 1.0 ], "reply_authors_avg": [ 2.75, 1.299038105676658 ], "replies_avg": [ 24, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.13245323570650439, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=1183970600880101647&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 8, "aff_unique_index": "0;0;0", "aff_unique_norm": "University of Modena and Reggio Emilia", "aff_unique_dep": "", "aff_unique_url": "https://www.unimore.it", "aff_unique_abbr": "", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "Italy" }, { "title": "Large Language Models as Analogical Reasoners", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19243", "id": "AgDICX1h50", "author_site": "Michihiro Yasunaga, Xinyun Chen, Yujia Li, Panupong Pasupat, Jure Leskovec, Percy Liang, Ed H. Chi, Denny Zhou", "tldr": "", "abstract": "Chain-of-thought (CoT) prompting for language models demonstrates impressive performance across reasoning tasks, but typically needs labeled exemplars of the reasoning process. In this work, we introduce a new prompting approach, analogical prompting, designed to automatically guide the reasoning process of large language models. Inspired by analogical reasoning, a cognitive process in which humans draw from relevant past experiences to tackle new problems, our approach prompts language models to self-generate relevant exemplars or knowledge in the context, before proceeding to solve the given problem. This method presents several advantages: it obviates the need for labeling or retrieving exemplars, offering generality and convenience; it can also tailor the generated exemplars and knowledge to each problem, offering adaptability. 
Experimental results show that our approach outperforms 0-shot CoT and manual few-shot CoT in a variety of reasoning tasks, including math problem solving in GSM8K and MATH, code generation in Codeforces, and other reasoning tasks in BIG-Bench.", "keywords": "large language model;prompting;analogical reasoning;reasoning", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/c7a7583e50c0cdf2ca4cefbfce8ba37d8735af9a.pdf", "author": "Michihiro Yasunaga;Xinyun Chen;Yujia Li;Panupong Pasupat;Jure Leskovec;Percy Liang;Ed H. Chi;Denny Zhou", "authorids": "~Michihiro_Yasunaga1;~Xinyun_Chen1;~Yujia_Li1;~Panupong_Pasupat1;~Jure_Leskovec1;~Percy_Liang1;~Ed_H._Chi1;~Denny_Zhou1", "gender": ";M;M;;;;M;F", "homepage": ";https://yujiali.github.io/;https://ppasupat.github.io/;http://cs.stanford.edu/~jure/;https://cs.stanford.edu/~pliang/;https://dennyzhou.github.io/;http://edchi.net;https://jungyhuk.github.io/", "dblp": "202/1809;67/3069;124/9178;l/JureLeskovec;04/1701;178/3277;13/310;", "google_scholar": "SieJYoEAAAAJ;https://scholar.google.ca/citations?user=UY7CtEwAAAAJ;BqKXIA8AAAAJ;Q_kKkIUAAAAJ;pouyVyUAAAAJ;UwLsYw8AAAAJ;VuWl-KUAAAAJ;d4W1UT0AAAAJ", "orcid": ";;;0000-0002-5411-923X;;;0000-0003-3230-5338;", "linkedin": ";;;leskovec/;;;edchi/;", "or_profile": "~Michihiro_Yasunaga1;~Yujia_Li1;~Panupong_Pasupat1;~Jure_Leskovec1;~Percy_Liang1;~Dengyong_Zhou2;~Ed_Chi1;~Xinyun_Chen2", "aff": "Stanford University;Google DeepMind;Google;Kumo.AI;Stanford University;Google DeepMind;Google;Google", "aff_domain": "stanford.edu;google.com;google.com;kumo.ai;stanford.edu;google.com;google.com;google.com", "position": "PhD student;Research Scientist;Employee;Chief Scientist;Associate Professor;Research Scientist;Researcher;Researcher", "bibtex": "@inproceedings{\nyasunaga2024large,\ntitle={Large Language Models as Analogical Reasoners},\nauthor={Michihiro Yasunaga and Xinyun Chen and Yujia Li and Panupong Pasupat and Jure Leskovec and Percy Liang and Ed H. 
Chi and Denny Zhou},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=AgDICX1h50}\n}", "github": "", "project": "", "reviewers": "fGoM;ExxM;DVcm;ey56", "pdf_size": 557807, "rating": "5;5;5;8", "confidence": "5;4;3;4", "soundness": "3;3;2;3", "contribution": "2;3;2;3", "presentation": "3;3;3;3", "wc_summary": "49;40;39;32", "wc_strengths": "76;40;192;70", "wc_weaknesses": "87;117;7;264", "wc_questions": "41;45;35;80", "wc_review": "253;242;273;446", "wc_reply_reviewers": "38;375;0;16", "wc_reply_authors": "1071;1262;508;388", "reply_reviewers": "1;3;0;1", "reply_authors": "2;4;1;2", "rating_avg": [ 5.75, 1.299038105676658 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 40.0, 6.041522986797286 ], "wc_strengths_avg": [ 94.5, 57.92020372892347 ], "wc_weaknesses_avg": [ 118.75, 93.00100805905278 ], "wc_questions_avg": [ 50.25, 17.541023345289748 ], "wc_review_avg": [ 303.5, 83.01957600469903 ], "wc_reply_reviewers_avg": [ 107.25, 155.17308883952785 ], "wc_reply_authors_avg": [ 807.25, 367.99549929312997 ], "reply_reviewers_avg": [ 1.25, 1.0897247358851685 ], "reply_authors_avg": [ 2.25, 1.0897247358851685 ], "replies_avg": [ 22, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 60, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6114845287628255960&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 8, "openreview": "https://openreview.net/forum?id=AgDICX1h50", "pdf": "https://openreview.net/pdf?id=AgDICX1h50", "email": "stanford.edu;google.com;google.com;kumo.ai;stanford.edu;google.com;google.com;google.com", "author_num": 8, "aff_unique_index": "0;1;1;2;0;1;1;1", "aff_unique_norm": "Stanford University;Google;Kumo.AI", "aff_unique_dep": ";Google DeepMind;", "aff_unique_url": "https://www.stanford.edu;https://deepmind.com;https://www.kumo.ai", "aff_unique_abbr": "Stanford;DeepMind;Kumo.AI", "aff_campus_unique_index": "0;2;0;2;2", "aff_campus_unique": "Stanford;;Mountain View", "aff_country_unique_index": "0;1;0;0;0;1;0;0", "aff_country_unique": "United States;United Kingdom" }, { "title": "OMNI: Open-endedness via Models of human Notions of Interestingness", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19242", "id": "AgM3MzT99c", "author_site": "Jenny Zhang, Joel Lehman, Kenneth Stanley, Jeff Clune", "tldr": "", "abstract": "Open-ended algorithms aim to learn new, interesting behaviors forever. That requires a vast environment search space, but there are thus infinitely many possible tasks. Even after filtering for tasks the current agent can learn (i.e., learning progress), countless learnable yet uninteresting tasks remain (e.g., minor variations of previously learned tasks). An Achilles Heel of open-endedness research is the inability to quantify (and thus prioritize) tasks that are not just learnable, but also $\\textit{interesting}$ (e.g., worthwhile and novel). We propose solving this problem by $\\textit{Open-endedness via Models of human Notions of Interestingness}$ (OMNI). The insight is that we can utilize foundation models (FMs) as a model of interestingness (MoI), because they $\\textit{already}$ internalize human concepts of interestingness from training on vast amounts of human-generated data, where humans naturally write about what they find interesting or boring. 
We show that FM-based MoIs improve open-ended learning by focusing on tasks that are both learnable $\\textit{and interesting}$, outperforming baselines based on uniform task sampling or learning progress alone. This approach has the potential to dramatically advance the ability to intelligently select which tasks to focus on next (i.e., auto-curricula), and could be seen as AI selecting its own next task to learn, facilitating self-improving AI and AI-Generating Algorithms.", "keywords": "Open-endedness;Auto-Curriculum Learning;Reinforcement Learning", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Jenny Zhang;Joel Lehman;Kenneth Stanley;Jeff Clune", "authorids": "~Jenny_Zhang1;~Joel_Lehman1;~Kenneth_Stanley1;~Jeff_Clune3", "gender": ";;M;", "homepage": ";http://joellehman.com;https://www.kenstanley.net/;", "dblp": ";47/8285;s/KennethOStanley;", "google_scholar": ";GcvxHWQAAAAJ;https://scholar.google.com.tw/citations?user=6Q6oO1MAAAAJ;", "orcid": ";;;", "linkedin": ";;kenneth-stanley-3a159b/;", "or_profile": "~Jenny_Zhang1;~Joel_Lehman1;~Kenneth_Stanley1;~Jeff_Clune3", "aff": ";Carper.AI;;", "aff_domain": ";carper.ai;;", "position": ";Research Advisor;;", "bibtex": "@inproceedings{\nzhang2024omni,\ntitle={{OMNI}: Open-endedness via Models of human Notions of Interestingness},\nauthor={Jenny Zhang and Joel Lehman and Kenneth Stanley and Jeff Clune},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=AgM3MzT99c}\n}", "github": "", "project": "", "reviewers": "MxZx;LSLH;CZLW;qXzy", "pdf_size": 27141831, "rating": "3;6;8;8", "confidence": "4;5;3;4", "soundness": "2;2;3;3", "contribution": "2;3;2;3", "presentation": "1;4;3;2", "wc_summary": "211;127;109;134", "wc_strengths": "61;115;115;52", "wc_weaknesses": "192;236;223;459", "wc_questions": "190;102;2;11", "wc_review": "654;580;449;656", "wc_reply_reviewers": "0;0;12;31", "wc_reply_authors": "823;864;767;805", "reply_reviewers": "0;0;1;1", "reply_authors": "2;2;1;1", "rating_avg": [ 6.25, 2.0463381929681126 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.5, 1.118033988749895 ], "wc_summary_avg": [ 145.25, 39.04084399702445 ], "wc_strengths_avg": [ 85.75, 29.422567868899545 ], "wc_weaknesses_avg": [ 277.5, 106.00117923872357 ], "wc_questions_avg": [ 76.25, 76.44074502515004 ], "wc_review_avg": [ 584.75, 84.14682109265922 ], "wc_reply_reviewers_avg": [ 10.75, 12.676257334087218 ], "wc_reply_authors_avg": [ 814.75, 34.888214342382156 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.34554737023254406, "gs_citation": 39, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=16474108468889890747&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=AgM3MzT99c", "pdf": "https://openreview.net/pdf?id=AgM3MzT99c", "email": ";carper.ai;;", "author_num": 4, "aff_unique_index": "0", "aff_unique_norm": "Carper.AI", "aff_unique_dep": "", "aff_unique_url": "https://www.carper.ai", "aff_unique_abbr": "Carper.AI", "aff_country_unique_index": "0", "aff_country_unique": "United States" }, { "title": "BatchPrompt: Accomplish more with less", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19241", "id": "Agyicd577r", "author_site": "Jianzhe Lin, Maurice Diesendruck, 
Liang Du, Robin Abraham", "tldr": "", "abstract": "The ever-increasing token limits of large language models (LLMs) have enabled long context as input. Many LLMs are trained and fine-tuned to perform zero/few-shot inference using instruction-based prompts. Prompts typically include a detailed task instruction, several examples, and a single data point for inference. This baseline is referred to as \u201cSinglePrompt\u201d in this paper. In terms of token count, when the data input is small compared to instructions and examples, this results in lower token utilization, compared with encoder-based models like fine-tuned BERT. This cost inefficiency, affecting inference speed and compute budget, counteracts many of the benefits that LLMs offer. This paper aims to alleviate this problem by batching multiple data points in each prompt, a strategy we refer to as \u201cBatchPrompt\u201d. We improve token utilization by increasing the \u201cdensity\u201d of data points, however, this cannot be done naively. Simple batching can degrade performance, especially as batch size increases, and data points can yield different answers depending on their position within a prompt. To address the quality issue while retaining high token utilization, we introduce Batch Permutation and Ensembling (BPE) for BatchPrompt \u2013 a simple majority vote over repeated permutations of data, that recovers label quality at the cost of more token usage. To counterbalance this cost, we further propose Self-reflection-guided EArly Stopping (SEAS), which can terminate the voting process early for data points that the LLM handles confidently. Our comprehensive experimental evaluation demonstrates that BPE + SEAS can boost the performance of BatchPrompt by a striking margin on a range of popular NLP tasks, including question answering (Boolq), textual entailment (RTE), and duplicate questions identification (QQP). This performance is even competitive with/higher than single-data prompting (SinglePrompt), while using far fewer LLM calls and input tokens. At batch size 32, our BatchPrompt + BPE + SEAS uses 15.7% the number of LLM calls, and achieves: Boolq accuracy 90.6% \u2192 90.9% with 27.4% tokens, QQP accuracy 87.2% \u2192 88.4% with 18.6% tokens, RTE accuracy 91.5% \u2192 91.1% with 30.8% tokens. We hope our simple yet effective approach will shed light on the future research of large language models. 
Code: github.com/microsoft/BatchPrompt", "keywords": "large language models;token-resource utilization;prompt", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/50783e8b30f12efd8f8bac8609eee0b52536a03c.zip", "author": "Jianzhe Lin;Maurice Diesendruck;Liang Du;Robin Abraham", "authorids": "~Jianzhe_Lin1;~Maurice_Diesendruck1;~Liang_Du3;~Robin_Abraham1", "gender": "M;M;;", "homepage": "http://jianzhelin.github.io;https://github.com/diesendruck;;", "dblp": "https://dblp.org/pers/l/Lin:Jianzhe.html;;;", "google_scholar": "https://scholar.google.ca/citations?user=6709egkAAAAJ;;aq4dG-AAAAAJ;aONpOEwAAAAJ", "orcid": ";;;", "linkedin": "jianzhe-lin-a4135baa/?originalSubdomain=ca;;;robin-abraham-b206059/", "or_profile": "~Jianzhe_Lin1;~Maurice_Diesendruck1;~Liang_Du3;~Robin_Abraham1", "aff": "Microsoft;Apple;Microsoft;Microsoft", "aff_domain": "microsoft.com;apple.com;microsoft.com;microsoft.com", "position": "Senior Applied Scientist;Researcher;Researcher;Principal Researcher", "bibtex": "@inproceedings{\nlin2024batchprompt,\ntitle={BatchPrompt: Accomplish more with less},\nauthor={Jianzhe Lin and Maurice Diesendruck and Liang Du and Robin Abraham},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=Agyicd577r}\n}", "github": "", "project": "", "reviewers": "7rFs;Nbfh;PJJX;pc53", "pdf_size": 808169, "rating": "5;6;6;8", "confidence": "4;4;4;3", "soundness": "3;3;3;4", "contribution": "2;3;3;3", "presentation": "2;3;3;3", "wc_summary": "84;105;238;31", "wc_strengths": "36;51;86;21", "wc_weaknesses": "80;59;129;115", "wc_questions": "4;96;70;85", "wc_review": "204;311;523;252", "wc_reply_reviewers": "0;0;25;0", "wc_reply_authors": "322;430;802;270", "reply_reviewers": "0;0;1;0", "reply_authors": "1;1;1;1", "rating_avg": [ 6.25, 1.0897247358851685 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 114.5, 76.23155514614666 ], "wc_strengths_avg": [ 48.5, 24.109126902482387 ], "wc_weaknesses_avg": [ 95.75, 27.725214156071004 ], "wc_questions_avg": [ 63.75, 35.70976757135224 ], "wc_review_avg": [ 322.5, 121.80414607064901 ], "wc_reply_reviewers_avg": [ 6.25, 10.825317547305483 ], "wc_reply_authors_avg": [ 456.0, 207.9326814139615 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.9271726499455306, "gs_citation": 17, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=7802084067485629782&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=Agyicd577r", "pdf": "https://openreview.net/pdf?id=Agyicd577r", "email": "microsoft.com;apple.com;microsoft.com;microsoft.com", "author_num": 4, "aff_unique_index": "0;1;0;0", "aff_unique_norm": "Microsoft;Apple", "aff_unique_dep": "Microsoft Corporation;Apple Inc.", "aff_unique_url": "https://www.microsoft.com;https://www.apple.com", "aff_unique_abbr": "Microsoft;Apple", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "id": "AhCdJ93Wmi", "title": "Graph Inference Acceleration by Bridging GNNs and MLPs with Self-Supervised Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "Graph 
Neural Networks (GNNs) have demonstrated their effectiveness in a variety of graph learning tasks such as node classification and link prediction. However, GNN inference mainly relies on neighborhood aggregation, which limits the deployment in latency-sensitive (i.e., real-time) applications such as financial fraud detection. To solve this problem, recent works have proposed to distill knowledge from teacher GNNs to student Multi-Layer Perceptrons (MLPs) trained on node content for inference acceleration. Despite the progress, these studies still suffer insufficient exploration of structural information when inferring unseen nodes. To address this issue, we propose a new method (namely {\\bf SSL-GM}) to fully integrate rich structural information into MLPs by bridging \\textbf{G}NNs and \\textbf{M}LPs with Self-Supervised Learning (\\textbf{SSL}) for graph inference acceleration while improving model generalization capability. A key new insight of SSL-GM is that, without fetching their neighborhoods, the structural information of unseen nodes can be inferred solely from the nodes themselves with SSL. Specifically, SSL-GM employs self-supervised contrastive learning to align the representations encoded by graph context-aware GNNs and neighborhood dependency-free MLPs, fully integrating the structural information into MLPs. In particular, SSL-GM approximates the representations of GNNs using a non-parametric aggregator to avoid potential model collapse and exploits augmentation to facilitate the training; additionally, SSL-GM further incorporates reconstruction regulation to prevent representation shift caused by augmentation. Theoretically, we interpret our proposed SSL-GM through the principle of information bottleneck, demonstrating its generalization capability; we also analyze model capacity in incorporating structural information from the perspective of mutual information maximization and graph smoothness. Empirically, we demonstrate the superiority of SSL-GM over existing state-of-the-art models in both efficiency and effectiveness. 
In particular, SSL-GM obtains significant performance gains {\\bf (7$\\sim$26\\%)} in comparison to MLPs, and a remarkable acceleration of GNNs {\\bf (90$\\sim$126$\\times$)} on large-scale graph datasets.", "keywords": "Graph Neural Network;Self-supervised Learning;Inference Acceleration", "primary_area": "learning on graphs and other geometries & topologies", "supplementary_material": "/attachment/c9321c31c53095863d027a8a5f2fac942a7c1cb6.zip", "author": "Zehong Wang;Zheyuan Zhang;Chuxu Zhang;Yanfang Ye", "authorids": "~Zehong_Wang2;~Zheyuan_Zhang5;~Chuxu_Zhang2;~Yanfang_Ye1", "gender": "M;M;;", "homepage": "https://zehong-wang.github.io/;https://jasonzhangzy1757.github.io/;;http://yes-lab.org/", "dblp": "319/7828;;;", "google_scholar": "-qXxOv0AAAAJ;qJURp_AAAAAJ;;egjr888AAAAJ", "orcid": "0000-0002-7670-6777;0009-0005-5918-6182;;", "linkedin": "zehong-wang-745b02286/;jasonzhangzy1757/;;", "or_profile": "~Zehong_Wang2;~Zheyuan_Zhang5;~Chuxu_Zhang2;~Yanfang_Ye1", "aff": "University of Notre Dame;University of Notre Dame;;University of Notre Dame", "aff_domain": "nd.edu;nd.edu;;nd.edu", "position": "PhD student;PhD student;;Associate Professor", "bibtex": "@misc{\nwang2024graph,\ntitle={Graph Inference Acceleration by Bridging {GNN}s and {MLP}s with Self-Supervised Learning},\nauthor={Zehong Wang and Zheyuan Zhang and Chuxu Zhang and Yanfang Ye},\nyear={2024},\nurl={https://openreview.net/forum?id=AhCdJ93Wmi}\n}", "github": "", "project": "", "reviewers": "eCUd;N5QN;rTyJ;RVGt;WTGk", "site": "https://openreview.net/forum?id=AhCdJ93Wmi", "pdf_size": 1297645, "rating": "3;3;5;5;6", "confidence": "4;3;5;4;2", "soundness": "2;2;2;3;3", "contribution": "2;2;2;2;3", "presentation": "3;2;3;3;3", "wc_summary": "32;81;84;72;75", "wc_strengths": "20;24;49;63;64", "wc_weaknesses": "353;251;185;94;102", "wc_questions": "1;8;6;37;4", "wc_review": "406;364;324;266;245", "wc_reply_reviewers": "172;0;491;0;0", "wc_reply_authors": "2553;2211;1429;1537;664", "reply_reviewers": "3;0;2;0;0", "reply_authors": "4;4;3;3;1", "rating_avg": [ 4.4, 1.2 ], "confidence_avg": [ 3.6, 1.019803902718557 ], "soundness_avg": [ 2.4, 0.4898979485566356 ], "contribution_avg": [ 2.2, 0.39999999999999997 ], "presentation_avg": [ 2.8, 0.39999999999999997 ], "wc_summary_avg": [ 68.8, 18.882796403075474 ], "wc_strengths_avg": [ 44.0, 18.772320048411704 ], "wc_weaknesses_avg": [ 197.0, 96.98453484963466 ], "wc_questions_avg": [ 11.2, 13.105723940324701 ], "wc_review_avg": [ 321.0, 59.80635417746178 ], "wc_reply_reviewers_avg": [ 132.6, 191.1811706209584 ], "wc_reply_authors_avg": [ 1678.8, 657.2349351639793 ], "reply_reviewers_avg": [ 1.0, 1.2649110640673518 ], "reply_authors_avg": [ 3.0, 1.0954451150103321 ], "replies_avg": [ 28, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.19611613513818404, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:fWIfMeuv-owJ:scholar.google.com/&scioq=Graph+Inference+Acceleration+by+Bridging+GNNs+and+MLPs+with+Self-Supervised+Learning&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;0;0", "aff_unique_norm": "University of Notre Dame", "aff_unique_dep": "", "aff_unique_url": "https://www.nd.edu", "aff_unique_abbr": "Notre Dame", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "AhMEkBSdIV", "title": "LCA-on-the-Line: Benchmarking Out-of-Distribution Generalization with Class Taxonomies", "track": "main", "status": "Reject", "tldr": "", "abstract": "In 
this paper, we address the challenge of assessing model generalization under Out-of-Distribution (OOD) conditions. We reintroduce the Least Common Ancestor (LCA) distance, a metric that has been largely overshadowed since ImageNet. By leveraging the WordNet hierarchy, we utilize the LCA to measure the taxonomic distance between labels and predictions, presenting it as a benchmark for model generalization. The LCA metric proves especially robust in comparison to previous state-of-the-art metrics when evaluating diverse models, including both vision-only and vision-language models on natural distribution shift datasets. To validate our benchmark's efficacy, we perform an extensive empirical study on 75 models spanning five distinct ImageNet-OOD datasets. Our findings reveal a strong linear correlation between in-domain ImageNet LCA scores and OOD Top1 performance across ImageNet-S/R/A/ObjectNet. This discovery gives rise to a novel evaluation framework termed \"LCA-on-the-Line\", facilitating unified and consistent assessments across a broad spectrum of models and datasets.\n\nBeside introducing an evaluative tool, we also delve into the intricate ties between the LCA metric and model generalization. By aligning model predictions more closely with the WordNet hierarchy and refining prompt engineering in zero-shot vision-language models, we offer tangible strategies to improve model generalization. We challenge the prevailing notion that LCA offers no added evaluative value over top-1 accuracy, our research provides invaluable insights and actionable techniques to enhance model robustness and generalization across various tasks and scenarios.", "keywords": "Out-of-Distribution Generalization;representation evaluation;Hierarchy;Vision Language Model;Class Taxonomy;Zero-shot", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/5f1a0827ba140be8acc7f46d9b1b87bff1f3f4a1.zip", "author": "Jia Shi", "authorids": "~Jia_Shi2", "gender": "M", "homepage": "https://www.linkedin.com/in/elvishelvisshi/", "dblp": "", "google_scholar": "asHobe0AAAAJ", "orcid": "", "linkedin": "elvishelvisshi/", "or_profile": "~Jia_Shi2", "aff": "Carnegie Mellon University", "aff_domain": "cmu.edu", "position": "MS student", "bibtex": "@misc{\nshi2024lcaontheline,\ntitle={{LCA}-on-the-Line: Benchmarking Out-of-Distribution Generalization with Class Taxonomies},\nauthor={Jia Shi},\nyear={2024},\nurl={https://openreview.net/forum?id=AhMEkBSdIV}\n}", "github": "", "project": "", "reviewers": "CuPJ;r8af;5fCB", "site": "https://openreview.net/forum?id=AhMEkBSdIV", "pdf_size": 12468190, "rating": "3;5;8", "confidence": "4;3;3", "soundness": "2;3;4", "contribution": "2;2;4", "presentation": "1;3;2", "wc_summary": "55;70;176", "wc_strengths": "14;165;60", "wc_weaknesses": "186;313;163", "wc_questions": "2;5;133", "wc_review": "257;553;532", "wc_reply_reviewers": "0;0;30", "wc_reply_authors": "1209;638;287", "reply_reviewers": "0;0;1", "reply_authors": "3;2;2", "rating_avg": [ 5.333333333333333, 2.0548046676563256 ], "confidence_avg": [ 3.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 3.0, 0.816496580927726 ], "contribution_avg": [ 2.6666666666666665, 0.9428090415820634 ], "presentation_avg": [ 2.0, 0.816496580927726 ], "wc_summary_avg": [ 100.33333333333333, 53.85371131335539 ], "wc_strengths_avg": [ 79.66666666666667, 63.19458485942886 ], "wc_weaknesses_avg": [ 220.66666666666666, 65.9612680964283 ], "wc_questions_avg": [ 
46.666666666666664, 61.05916984550496 ], "wc_review_avg": [ 447.3333333333333, 134.85877386691934 ], "wc_reply_reviewers_avg": [ 10.0, 14.142135623730951 ], "wc_reply_authors_avg": [ 711.3333333333334, 379.9599394088218 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 2.3333333333333335, 0.4714045207910317 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 1, 0 ], "corr_rating_confidence": -0.8029550685469661, "gs_citation": 7, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14865788217805581136&as_sdt=80000005&sciodt=0,23&hl=en", "gs_version_total": 8, "aff_unique_index": "0", "aff_unique_norm": "Carnegie Mellon University", "aff_unique_dep": "", "aff_unique_url": "https://www.cmu.edu", "aff_unique_abbr": "CMU", "aff_country_unique_index": "0", "aff_country_unique": "United States" }, { "id": "AhcxMGfqQn", "title": "Collaborative World Models: An Online-Offline Transfer RL Approach", "track": "main", "status": "Reject", "tldr": "", "abstract": "Training offline reinforcement learning (RL) models with visual inputs is challenging due to the coupling of overfitting issue in representation learning and the risk of overestimating true value functions. Recent work has attempted to alleviate the overestimation bias by encouraging conservative behaviors beyond the scope of the offline dataset. This paper, in contrast, tries to build flexible constraints for the offline policies without impeding the exploration of potential advantages. The key idea is to leverage an off-the-shelf RL simulator, with which can be easily interacted in an online manner. In this auxiliary domain, we perform an actor-critic algorithm whose value model is aligned to the target data and thus serves as a \u201c$\\textit{test bed}$\u201d for the offline policies. In this way, the online simulator can be used as the $\\textit{playground}$ for the offline agent, allowing for mildly-conservative value estimation. Experimental results demonstrate the remarkable effectiveness of our approach in challenging environments such as DeepMind Control, Meta-World, and RoboDesk. 
It outperforms existing offline visual RL approaches by substantial margins.", "keywords": "World models;reinforcement learning;visual control;transfer learning", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/232fe4e6270555bd90bf72f233503acb9b80d129.zip", "author": "Qi Wang;Junming Yang;Yunbo Wang;Xin Jin;Wenjun Zeng;Xiaokang Yang", "authorids": "~Qi_Wang26;~Junming_Yang1;~Yunbo_Wang2;~Xin_Jin8;~Wenjun_Zeng3;~Xiaokang_Yang1", "gender": "M;M;M;M;M;M", "homepage": "https://qiwang067.github.io/;https://junming-yang.github.io/;http://home.ustc.edu.cn/~jinxustc/;https://www.eias.ac.cn/h-col-187.html;https://icne.sjtu.edu.cn/info/1064/1078.htm;https://wyb15.github.io/", "dblp": "19/1924-80;191/4782.html;68/3340-14;57/145;06/3071-1.html;84/3894", "google_scholar": "OwW5XfMAAAAJ;L6R5ExQAAAAJ;byaSC-kAAAAJ;_cUfvYQAAAAJ;yDEavdMAAAAJ;C8bGfr0AAAAJ", "orcid": ";0000-0002-4261-6271;0000-0002-1820-8358;;0000-0003-4029-3322;", "linkedin": "qi-wang-chris-7a6670361/;;;;;", "or_profile": "~Qi_Wang26;~Junming_Yang1;~Xin_Jin8;~Wenjun_Zeng3;~Xiaokang_Yang1;~Yunbo_Wang1", "aff": "Shanghai Jiaotong University;Nanjing University of Posts and Telecommunications;Eastern Institute of Technology, Ningbo;Eastern Institute for Advanced Study;Shanghai Jiaotong University;Shanghai Jiaotong University", "aff_domain": "sjtu.edu.cn;njupt.edu.cn;eitech.edu.cn;eias.ac.cn;sjtu.edu.cn;sjtu.edu.cn", "position": "PhD student;Undergrad student;Assistant Professor;Full Professor;Full Professor;Associate Professor", "bibtex": "@misc{\nwang2024collaborative,\ntitle={Collaborative World Models: An Online-Offline Transfer {RL} Approach},\nauthor={Qi Wang and Junming Yang and Yunbo Wang and Xin Jin and Wenjun Zeng and Xiaokang Yang},\nyear={2024},\nurl={https://openreview.net/forum?id=AhcxMGfqQn}\n}", "github": "", "project": "", "reviewers": "wybs;MD4J;77pB;G38A;mTFC", "site": "https://openreview.net/forum?id=AhcxMGfqQn", "pdf_size": 3818750, "rating": "3;3;5;5;6", "confidence": "2;2;4;2;4", "soundness": "2;2;3;3;3", "contribution": "2;2;2;2;2", "presentation": "2;3;3;3;3", "wc_summary": "76;83;126;141;122", "wc_strengths": "43;73;75;89;105", "wc_weaknesses": "154;206;187;116;409", "wc_questions": "158;21;113;42;87", "wc_review": "431;383;501;388;723", "wc_reply_reviewers": "0;0;0;0;0", "wc_reply_authors": "734;452;830;783;1281", "reply_reviewers": "0;0;0;0;0", "reply_authors": "1;1;2;2;2", "rating_avg": [ 4.4, 1.2 ], "confidence_avg": [ 2.8, 0.9797958971132712 ], "soundness_avg": [ 2.6, 0.4898979485566356 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.8, 0.39999999999999997 ], "wc_summary_avg": [ 109.6, 25.476263462289758 ], "wc_strengths_avg": [ 77.0, 20.513410247932935 ], "wc_weaknesses_avg": [ 214.4, 102.00117646380359 ], "wc_questions_avg": [ 84.2, 49.109673181563736 ], "wc_review_avg": [ 485.2, 126.19730583495037 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 816.0, 267.10672024492385 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.6, 0.4898979485566356 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.748455199183749, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:M3nft3Kp0OAJ:scholar.google.com/&scioq=Collaborative+World+Models:+An+Online-Offline+Transfer+RL+Approach&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1;2;3;0;0", "aff_unique_norm": "Shanghai Jiao Tong University;Nanjing University of Posts and Telecommunications;Eastern Institute of Technology;Eastern 
Institute for Advanced Study", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.sjtu.edu.cn;http://www.njupt.edu.cn;https://www.eit.edu.cn;", "aff_unique_abbr": "SJTU;NJUPT;;", "aff_campus_unique_index": "1;2", "aff_campus_unique": ";Nanjing;Ningbo", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "China;" }, { "title": "How Well Do Supervised 3D Models Transfer to Medical Imaging Tasks?", "status": "Oral", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19240", "id": "AhizIPytk4", "author_site": "Wenxuan Li, Alan Yuille, Zongwei Zhou", "tldr": "", "abstract": "The pre-training and fine-tuning paradigm has become prominent in transfer learning. For example, if the model is pre-trained on ImageNet and then fine-tuned to PASCAL, it can significantly outperform that trained on PASCAL from scratch. While ImageNet pre-training has shown enormous success, it is formed in 2D, and the learned features are for classification tasks; when transferring to more diverse tasks, like 3D image segmentation, its performance is inevitably compromised due to the deviation from the original ImageNet context. A significant challenge lies in the lack of large, annotated 3D datasets rivaling the scale of ImageNet for model pre-training. To overcome this challenge, we make two contributions. Firstly, we construct AbdomenAtlas 1.1 that comprises **9,262** three-dimensional computed tomography (CT) volumes with high-quality, per-voxel annotations of 25 anatomical structures and pseudo annotations of seven tumor types. Secondly, we develop a suite of models that are pre-trained on our AbdomenAtlas 1.1 for transfer learning. Our preliminary analyses indicate that the model trained only with 21 CT volumes, 672 masks, and 40 GPU hours has a transfer learning ability similar to the model trained with 5,050 (unlabeled) CT volumes and 1,152 GPU hours. More importantly, the transfer learning ability of supervised models can further scale up with larger annotated datasets, achieving significantly better performance than preexisting pre-trained models, irrespective of their pre-training methodologies or data sources. 
We hope this study can facilitate collective efforts in constructing larger 3D medical datasets and more releases of supervised pre-trained models.", "keywords": "Transfer Learning;Medical Image Analysis;Organ Segmentation", "primary_area": "datasets and benchmarks", "supplementary_material": "", "author": "Wenxuan Li;Alan Yuille;Zongwei Zhou", "authorids": "~Wenxuan_Li3;~Alan_Yuille1;~Zongwei_Zhou1", "gender": "F;M;M", "homepage": "https://github.com/WenxuanChelsea;;https://www.zongweiz.com/", "dblp": ";y/AlanLYuille;", "google_scholar": "tpNZM2YAAAAJ;;JVOeczAAAAAJ", "orcid": ";;0000-0002-3154-9851", "linkedin": ";;", "or_profile": "~Wenxuan_Li3;~Alan_Yuille1;~Zongwei_Zhou1", "aff": "Johns Hopkins University;Johns Hopkins University;Johns Hopkins University", "aff_domain": "jh.edu;johnshopkins.edu;jhu.edu", "position": "PhD student;Full Professor;Postdoc", "bibtex": "@inproceedings{\nli2024how,\ntitle={How Well Do Supervised 3D Models Transfer to Medical Imaging Tasks?},\nauthor={Wenxuan Li and Alan Yuille and Zongwei Zhou},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=AhizIPytk4}\n}", "github": "", "project": "", "reviewers": "osvs;bY7Q;esgA;mSzX;fMfJ", "pdf_size": 1417390, "rating": "6;6;6;8;8", "confidence": "3;5;4;3;3", "soundness": "3;3;3;3;3", "contribution": "3;3;3;3;3", "presentation": "3;3;2;3;3", "wc_summary": "37;54;99;85;89", "wc_strengths": "29;29;82;52;146", "wc_weaknesses": "134;355;232;88;13", "wc_questions": "34;63;31;8;26", "wc_review": "234;501;444;233;274", "wc_reply_reviewers": "5;0;0;13;0", "wc_reply_authors": "931;3371;1257;586;391", "reply_reviewers": "1;0;0;1;0", "reply_authors": "2;6;2;1;1", "rating_avg": [ 6.8, 0.9797958971132712 ], "confidence_avg": [ 3.6, 0.8 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 2.8, 0.39999999999999997 ], "wc_summary_avg": [ 72.8, 23.378622713923935 ], "wc_strengths_avg": [ 67.6, 43.765740025732455 ], "wc_weaknesses_avg": [ 164.4, 118.81178392735293 ], "wc_questions_avg": [ 32.4, 17.76063061943466 ], "wc_review_avg": [ 337.2, 112.90597858395276 ], "wc_reply_reviewers_avg": [ 3.6, 5.083306010855534 ], "wc_reply_authors_avg": [ 1307.2, 1073.5798805864426 ], "reply_reviewers_avg": [ 0.4, 0.48989794855663565 ], "reply_authors_avg": [ 2.4, 1.8547236990991407 ], "replies_avg": [ 26, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.6123724356957946, "gs_citation": 12, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5683284319199448880&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 2, "openreview": "https://openreview.net/forum?id=AhizIPytk4", "pdf": "https://openreview.net/pdf?id=AhizIPytk4", "email": "jh.edu;johnshopkins.edu;jhu.edu", "author_num": 3, "aff_unique_index": "0;0;0", "aff_unique_norm": "Johns Hopkins University", "aff_unique_dep": "", "aff_unique_url": "https://www.jhu.edu", "aff_unique_abbr": "JHU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "Ai4L058yoO", "title": "Is Feature Extraction the most informative dimensionality reduction technique? Revisiting Unsupervised Feature Selection from a Dynamic Approach", "track": "main", "status": "Reject", "tldr": "", "abstract": "This paper compares unsupervised feature extraction and unsupervised feature selection techniques in the context of dimensionality reduction without using labeled data. 
Unsupervised feature extraction transforms the input space into a lower-dimensional representation by creating informative features that capture underlying patterns, leading to improved model performance. On the other hand, unsupervised feature selection chooses a subset of features based on predefined criteria, potentially overlooking important relationships and reducing the model's discriminative power. State-of-the-art research suggests that feature extraction outperforms feature selection in terms of model accuracy and robustness. Leveraging the intrinsic structure of the data, unsupervised feature extraction provides richer representations, enhancing the model's ability to discern complex patterns. This paper proposes to revisit feature selection algorithms from a dynamic perspective, where the features are selected depending on the specific sample input. Through empirical evaluations, it will be demonstrated that unsupervised feature selection outperforms feature extraction, both in accuracy and data compression. These findings highlight the potential of unsupervised feature selection as a powerful approach for dimensionality reduction and improved model performance, particularly when labeled data is scarce or unavailable.", "keywords": "dynamic feature selection;unsupervised learning;dimensionality reduction", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Brais Cancela", "authorids": "~Brais_Cancela1", "gender": "M", "homepage": "", "dblp": "86/9834", "google_scholar": "https://scholar.google.es/citations?user=kFjVlJIAAAAJ", "orcid": "0000-0002-2295-4142", "linkedin": "cancelabarizo", "or_profile": "~Brais_Cancela1", "aff": "Universidad de La Coru\u00f1a", "aff_domain": "udc.es", "position": "Associate Professor", "bibtex": "@misc{\ncancela2024is,\ntitle={Is Feature Extraction the most informative dimensionality reduction technique? 
Revisiting Unsupervised Feature Selection from a Dynamic Approach},\nauthor={Brais Cancela},\nyear={2024},\nurl={https://openreview.net/forum?id=Ai4L058yoO}\n}", "github": "", "project": "", "reviewers": "tqPc;LSnn;eFwU;rUoV", "site": "https://openreview.net/forum?id=Ai4L058yoO", "pdf_size": 680743, "rating": "3;5;5;5", "confidence": "4;2;4;4", "soundness": "2;2;2;2", "contribution": "1;2;2;3", "presentation": "1;2;2;2", "wc_summary": "78;35;68;54", "wc_strengths": "37;27;56;48", "wc_weaknesses": "284;77;150;71", "wc_questions": "646;130;97;278", "wc_review": "1045;269;371;451", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.5, 0.8660254037844386 ], "confidence_avg": [ 3.5, 0.8660254037844386 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 1.75, 0.4330127018922193 ], "wc_summary_avg": [ 58.75, 16.145819892467525 ], "wc_strengths_avg": [ 42.0, 10.977249200050075 ], "wc_weaknesses_avg": [ 145.5, 85.79772724262573 ], "wc_questions_avg": [ 287.75, 217.7778397817372 ], "wc_review_avg": [ 534.0, 301.9950330717378 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 6, 0 ], "authors#_avg": [ 1, 0 ], "corr_rating_confidence": -0.3333333333333333, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:W9rLRHrjG2gJ:scholar.google.com/&scioq=Is+Feature+Extraction+the+most+informative+dimensionality+reduction+technique%3F+Revisiting+Unsupervised+Feature+Selection+from+a+Dynamic+Approach&hl=en&as_sdt=0,44", "gs_version_total": 0, "aff_unique_index": "0", "aff_unique_norm": "University of A Coru\u00f1a", "aff_unique_dep": "", "aff_unique_url": "https://www.udc.es", "aff_unique_abbr": "UDC", "aff_country_unique_index": "0", "aff_country_unique": "Spain" }, { "id": "AialDkY6y3", "title": "Deep Graph Predictions using Dirac-Bianconi Graph Neural Networks", "track": "main", "status": "Reject", "tldr": "", "abstract": "Viewing Graph Neural Networks as network dynamical systems on graphs has proven a fruitful inspiration for designing interesting GNN architectures. This work introduces the Dirac-Bianconi Graph Neural Network (DBGNN) based on Bianconi's topological Dirac equation on graphs. While heat equations based on network Laplacian tend to smooth out differences, Dirac equations typically feature long-range propagation. We indeed find that the DBGNN layer does not lead to an equilibration, or smoothing, of nodal features, even after hundreds of steps. A further distinguishing feature of the topological Dirac equation is that it treats edges and nodes on the same footing. Consequently, we expect DBGNN to be useful in contexts where edges encode more than mere logical connectivity, but have physical properties as well. We show competitive performance for molecular property prediction and superior performance for predicting the dynamic stability of power grids. 
In the case of power grids, DBGNN achieves robust out-of-distribution generalization, showing that structural relations are learned.", "keywords": "Graph Neural Networks;graph convolution;physic inspired machine learning", "primary_area": "learning on graphs and other geometries & topologies", "supplementary_material": "/attachment/8c59b79853a3e1ff2a1e88642982c4b1f3b0f839.zip", "author": "Christian Nauck;Rohan Gorantla;Michael Lindner;Konstantin Sch\u00fcrholt;Antonia S J S Mey;Frank Hellmann", "authorids": "~Christian_Nauck1;~Rohan_Gorantla1;~Michael_Lindner1;~Konstantin_Sch\u00fcrholt1;~Antonia_S_J_S_Mey1;~Frank_Hellmann1", "gender": "M;M;;M;;Non-Binary", "homepage": ";;https://www.pik-potsdam.de/members/mlindner;https://kschuerholt.github.io/;https://mey-research.org;", "dblp": ";;;267/9297;;", "google_scholar": ";1FzTrKoAAAAJ;;refZxl4AAAAJ;_NNNlvMAAAAJ;", "orcid": "0000-0003-1972-9654;0000-0003-4344-0383;;;;0000-0001-5635-4949", "linkedin": ";rohangorantla/;;https://de.linkedin.com/in/konstantin-schuerholt/en;;", "or_profile": "~Christian_Nauck1;~Rohan_Gorantla1;~Michael_Lindner1;~Konstantin_Sch\u00fcrholt1;~Antonia_S_J_S_Mey1;~Frank_Hellmann1", "aff": ";University of Edinburgh, University of Edinburgh;;University of St. Gallen;University of Edinburgh, University of Edinburgh;Potsdam Institute for Climate Impact Research", "aff_domain": ";ed.ac.uk;;unisg.ch;ed.ac.uk;pik-potsdam.de", "position": ";PhD student;;PhD student;Assistant Professor;Researcher", "bibtex": "@misc{\nnauck2024deep,\ntitle={Deep Graph Predictions using Dirac-Bianconi Graph Neural Networks},\nauthor={Christian Nauck and Rohan Gorantla and Michael Lindner and Konstantin Sch{\\\"u}rholt and Antonia S J S Mey and Frank Hellmann},\nyear={2024},\nurl={https://openreview.net/forum?id=AialDkY6y3}\n}", "github": "", "project": "", "reviewers": "VKy2;YvSy;NtG7;Bj5J;3z7c", "site": "https://openreview.net/forum?id=AialDkY6y3", "pdf_size": 4935719, "rating": "3;3;5;5;6", "confidence": "4;4;3;3;4", "soundness": "3;3;2;2;4", "contribution": "2;2;3;2;3", "presentation": "2;2;2;2;4", "wc_summary": "74;110;160;84;191", "wc_strengths": "123;41;45;68;53", "wc_weaknesses": "210;116;140;267;176", "wc_questions": "83;90;1;99;76", "wc_review": "490;357;346;518;496", "wc_reply_reviewers": "0;0;0;669;8", "wc_reply_authors": "436;466;524;1301;893", "reply_reviewers": "0;0;0;2;1", "reply_authors": "1;1;1;3;3", "rating_avg": [ 4.4, 1.2 ], "confidence_avg": [ 3.6, 0.4898979485566356 ], "soundness_avg": [ 2.8, 0.7483314773547882 ], "contribution_avg": [ 2.4, 0.4898979485566356 ], "presentation_avg": [ 2.4, 0.8 ], "wc_summary_avg": [ 123.8, 44.901670347549434 ], "wc_strengths_avg": [ 66.0, 29.95997329771841 ], "wc_weaknesses_avg": [ 181.8, 53.225557770680055 ], "wc_questions_avg": [ 69.8, 35.23293913371406 ], "wc_review_avg": [ 441.4, 74.07455703546259 ], "wc_reply_reviewers_avg": [ 135.4, 266.81799039794896 ], "wc_reply_authors_avg": [ 724.0, 331.9632509781768 ], "reply_reviewers_avg": [ 0.6, 0.8 ], "reply_authors_avg": [ 1.8, 0.9797958971132713 ], "replies_avg": [ 23, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.4082482904638631, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10298937043062127716&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 0, "aff_unique_index": "0;1;0;2", "aff_unique_norm": "University of Edinburgh;University of St. 
Gallen;Potsdam Institute for Climate Impact Research", "aff_unique_dep": ";;", "aff_unique_url": "https://www.ed.ac.uk;https://www.unisg.ch;https://www.pik-potsdam.de", "aff_unique_abbr": "Edinburgh;HSG;PIK", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;0;2", "aff_country_unique": "United Kingdom;Switzerland;Germany" }, { "id": "Aj1wftldeR", "title": "D5RL: Diverse Datasets for Data-Driven Deep Reinforcement Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "Offline reinforcement learning algorithms hold the promise of enabling data-driven RL methods that do not require costly or dangerous real-world exploration and benefit from large pre-collected datasets. This in turn can facilitate real-world applications, as well as a more standardized approach to RL research. Furthermore, offline RL methods can provide effective initializations for online finetuning, overcoming challenges with exploration. However, evaluating progress on offline RL algorithms requires effective and challenging benchmarks that capture properties of real-world tasks, provide a range of task difficulties, and cover a range of challenges both in terms of the parameters of the domain (e.g., length of the horizon, sparsity of rewards) and the parameters of the data (e.g., narrow demonstration data or broad exploratory data). While considerable progress in offline RL in recent years has been enabled by simpler benchmark tasks, the most widely used datasets are increasingly saturating in performance and might fail to reflect properties of realistic tasks. We propose a new benchmark for offline RL that focuses on realistic simulations of robotic manipulation and locomotion environments, based on models of real-world robotic systems, and comprising a variety of data sources, including scripted data, over 20 hours of demonstrations and play-style data collected by human teleoperators, and other data sources. Our proposed benchmark covers state-based and image-based domains, and aims to test a number of real-world robot training challenges such as long-horizon manipulation, fine-grained motor control, imperfect controllers, and representation learning. Our proposed tasks vary in complexity from single instance to diverse scenarios with multiple distribution shifts, which can require significant robustness and generalization. Moreover, we support both offline RL evaluation and evaluation with online finetuning, with some of the tasks specifically designed to require both pretraining and finetuning. We hope that our proposed benchmark will facilitate further progress on both offline RL algorithms and algorithms designed for online finetuning from offline initialization.", "keywords": "Offline RL;Imitation Learning;Representation Learning", "primary_area": "datasets and benchmarks", "supplementary_material": "", "author": "Rafael Rafailov;Kyle Beltran Hatch;Anikait Singh;Aviral Kumar;Laura Smith;Ilya Kostrikov;Philippe Hansen-Estruch;Victor Kolev;Philip J. 
Ball;Jiajun Wu;Sergey Levine;Chelsea Finn", "authorids": "~Rafael_Rafailov1;~Kyle_Beltran_Hatch1;~Anikait_Singh1;~Aviral_Kumar2;~Laura_Smith1;~Ilya_Kostrikov1;~Philippe_Hansen-Estruch1;~Victor_Kolev1;~Philip_J._Ball2;~Jiajun_Wu1;~Sergey_Levine1;~Chelsea_Finn1", "gender": "M;M;M;M;F;M;M;M;M;F;M;M", "homepage": "https://rmrafailov.github.io/;https://khatch31.github.io/;https://asap7772.github.io/;https://aviralkumar2907.github.io/;;;https://victorkolev.github.io;https://jiajunwu.com;https://people.eecs.berkeley.edu/~svlevine/;https://ai.stanford.edu/~cbfinn/;https://philipjball.github.io/;https://www.linkedin.com/in/philippe-hansen-estruch-b05559210/", "dblp": "272/5358;;302/3876;202/7961;54/11024;https://dblp.org/pers/k/Kostrikov:Ilya.html;;117/4768;80/7594;131/1783;244/1972;289/6990.html", "google_scholar": "TwABcRgAAAAJ;;lPaISmIAAAAJ;;;PTS2AOgAAAAJ;;2efgcS0AAAAJ;8R35rCwAAAAJ;vfPE6hgAAAAJ;5Cm8L90AAAAJ;UzjHQLcAAAAJ", "orcid": ";;;;;;;0000-0002-4176-343X;;;;", "linkedin": ";kyle-h-3402a792/;asap7772/;;;;;jiajunwu/;;;;philippe-hansen-estruch-b05559210/", "or_profile": "~Rafael_Rafailov1;~Kyle_Beltran_Hatch1;~Anikait_Singh1;~Aviral_Kumar2;~Laura_Smith1;~Ilya_Kostrikov1;~Victor_Kolev1;~Jiajun_Wu1;~Sergey_Levine1;~Chelsea_Finn1;~Philip_Ball1;~Philippe_I_Hansen-Estruch1", "aff": "Stanford University;Toyota Research Institute;Stanford University;Google DeepMind;University of California, Berkeley;OpenAI;Stanford University;Stanford University;Google;Google;Google DeepMind;Meta Facebook", "aff_domain": "stanford.edu;tri.global;stanford.edu;google.com;berkeley.edu;openai.com;stanford.edu;stanford.edu;google.com;google.com;google.com;meta.com", "position": "PhD student;Researcher;PhD student;Researcher;PhD student;Member of Technical Staff;Undergrad student;Assistant Professor;Research Scientist;Research Scientist;Researcher;Intern", "bibtex": "@misc{\nrafailov2024drl,\ntitle={D5{RL}: Diverse Datasets for Data-Driven Deep Reinforcement Learning},\nauthor={Rafael Rafailov and Kyle Beltran Hatch and Anikait Singh and Aviral Kumar and Laura Smith and Ilya Kostrikov and Philippe Hansen-Estruch and Victor Kolev and Philip J. 
Ball and Jiajun Wu and Sergey Levine and Chelsea Finn},\nyear={2024},\nurl={https://openreview.net/forum?id=Aj1wftldeR}\n}", "github": "", "project": "", "reviewers": "55ef;mGUu;axPt;VAo4", "site": "https://openreview.net/forum?id=Aj1wftldeR", "pdf_size": 1543814, "rating": "3;5;5;6", "confidence": "4;3;4;3", "soundness": "2;2;2;3", "contribution": "1;2;2;2", "presentation": "2;3;2;2", "wc_summary": "66;85;43;48", "wc_strengths": "66;74;27;62", "wc_weaknesses": "296;308;314;50", "wc_questions": "2;57;6;5", "wc_review": "430;524;390;165", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "627;760;641;152", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 4.75, 1.0897247358851685 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 60.5, 16.53027525481654 ], "wc_strengths_avg": [ 57.25, 17.99131735032207 ], "wc_weaknesses_avg": [ 242.0, 111.04053313993049 ], "wc_questions_avg": [ 17.5, 22.85278976405288 ], "wc_review_avg": [ 377.25, 131.8434203894908 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 545.0, 232.70904580613106 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 10, 0 ], "authors#_avg": [ 12, 0 ], "corr_rating_confidence": -0.6882472016116854, "gs_citation": 6, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=9409474801396491122&as_sdt=400005&sciodt=0,14&hl=en", "gs_version_total": 5, "aff_unique_index": "0;1;0;2;3;4;0;0;2;2;2;5", "aff_unique_norm": "Stanford University;Toyota Research Institute;Google;University of California, Berkeley;OpenAI;Meta", "aff_unique_dep": ";;Google DeepMind;;;Meta Platforms, Inc.", "aff_unique_url": "https://www.stanford.edu;https://www.tri.global;https://deepmind.com;https://www.berkeley.edu;https://openai.com;https://meta.com", "aff_unique_abbr": "Stanford;TRI;DeepMind;UC Berkeley;OpenAI;Meta", "aff_campus_unique_index": "0;0;2;0;0;3;3", "aff_campus_unique": "Stanford;;Berkeley;Mountain View", "aff_country_unique_index": "0;0;0;1;0;0;0;0;0;0;1;0", "aff_country_unique": "United States;United Kingdom" }, { "id": "Ali45HfJqJ", "title": "Observer Uncertainty of Learning in Games from a Covariance Perspective", "track": "main", "status": "Reject", "tldr": "", "abstract": "We investigate the accuracy of prediction in deterministic learning dynamics of zero-sum games with random initializations, specifically focusing on observer uncertainty and its relationship to the evolution of covariances. Zero-sum games are a prominent field of interest in machine learning due to their various applications, such as Generative Adversarial Networks. Concurrently, the accuracy of observation in dynamical systems from mechanics has long been a classic subject of investigation since the discovery of the Heisenberg Uncertainty Principle. This principle employs covariance and standard deviation of particle states to measure observation accuracy. In this study, we bring these two approaches together to analyze the follow-the-regularized-leader (FTRL) algorithm in two-player zero-sum games. We provide growth rates of covariance information for continuous-time FTRL, as well as its two canonical discretization methods (Euler and symplectic). 
Our analysis and experiments show that employing symplectic discretization enhances the accuracy of prediction in learning dynamics.", "keywords": "covariance;symplectic Euler method;follow-the-regularized-leader (FTRL) algorithm;uncertainty;zero-sum games", "primary_area": "optimization", "supplementary_material": "/attachment/35d9f855c0d4f1c58d4c78531c44dec56de73857.zip", "author": "Yi Feng;Georgios Piliouras;Xiao Wang", "authorids": "~Yi_Feng3;~Georgios_Piliouras1;~Xiao_Wang4", "gender": "M;;", "homepage": "https://sites.google.com/view/yifeng95524/home;;", "dblp": ";62/1236;", "google_scholar": "https://scholar.google.com/citations?hl=en;;", "orcid": ";;", "linkedin": ";;", "or_profile": "~Yi_Feng3;~Georgios_Piliouras1;~Xiao_Wang4", "aff": "Shanghai University of Finance and Economics;Singapore University of Technology and Design;", "aff_domain": "shufe.edu;sutd.edu.sg;", "position": "PhD student;Associate Professor;", "bibtex": "@misc{\nfeng2024observer,\ntitle={Observer Uncertainty of Learning in Games from a Covariance Perspective},\nauthor={Yi Feng and Georgios Piliouras and Xiao Wang},\nyear={2024},\nurl={https://openreview.net/forum?id=Ali45HfJqJ}\n}", "github": "", "project": "", "reviewers": "kXrY;1edF;3XfB;snif", "site": "https://openreview.net/forum?id=Ali45HfJqJ", "pdf_size": 1356653, "rating": "5;6;6;6", "confidence": "3;3;3;3", "soundness": "3;3;3;3", "contribution": "2;2;3;2", "presentation": "3;3;3;3", "wc_summary": "69;124;106;45", "wc_strengths": "117;93;30;30", "wc_weaknesses": "86;469;24;157", "wc_questions": "34;106;7;4", "wc_review": "306;792;167;236", "wc_reply_reviewers": "78;18;0;40", "wc_reply_authors": "1013;1051;34;1077", "reply_reviewers": "1;1;0;1", "reply_authors": "3;3;1;3", "rating_avg": [ 5.75, 0.4330127018922193 ], "confidence_avg": [ 3.0, 0.0 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 86.0, 30.87879531328902 ], "wc_strengths_avg": [ 67.5, 38.44801685392889 ], "wc_weaknesses_avg": [ 184.0, 171.14175411044494 ], "wc_questions_avg": [ 37.75, 41.09972627646077 ], "wc_review_avg": [ 375.25, 245.5782716365599 ], "wc_reply_reviewers_avg": [ 34.0, 29.086079144497972 ], "wc_reply_authors_avg": [ 793.75, 439.231929053433 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 2.5, 0.8660254037844386 ], "replies_avg": [ 21, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:bGQakyIdxZAJ:scholar.google.com/&scioq=Observer+Uncertainty+of+Learning+in+Games+from+a+Covariance+Perspective&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1", "aff_unique_norm": "Shanghai University of Finance and Economics;Singapore University of Technology and Design", "aff_unique_dep": ";", "aff_unique_url": "http://www.sufe.edu.cn;https://www.sutd.edu.sg", "aff_unique_abbr": "SUFE;SUTD", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1", "aff_country_unique": "China;Singapore" }, { "id": "AlkANue4lm", "title": "Non-Redundant Graph Neural Networks with Improved Expressiveness", "track": "main", "status": "Reject", "tldr": "", "abstract": "Message passing graph neural networks iteratively compute node embeddings by aggregating messages from all neighbors. This procedure can be viewed as a neural variant of the Weisfeiler-Leman method, which limits their expressive power. 
Moreover, oversmoothing and oversquashing restrict the number of layers these networks can effectively utilize. The repeated exchange and encoding of identical information in message passing amplifies oversquashing. We propose a novel aggregation scheme based on neighborhood trees, which allows for controlling the redundancy by pruning branches of the unfolding trees underlying standard message passing. We prove that reducing redundancy improves expressivity and experimentally show that it alleviates oversquashing. We investigate the interaction between redundancy in message passing and redundancy in computation and propose a compact representation of neighborhood trees, from which we compute node and graph embeddings via a neural tree canonization technique. Our method is provably more expressive than the Weisfeiler-Leman method, less susceptible to oversquashing than message passing neural networks, and provides high classification accuracy on widely-used benchmark datasets.", "keywords": "graph neural networks;message passing;Weisfeiler-Leman;expressivity", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Franka Bause;Samir Moustafa;Johannes Langguth;Wilfried N. Gansterer;Nils Morten Kriege", "authorids": "~Franka_Bause1;~Samir_Moustafa1;~Johannes_Langguth2;~Wilfried_N._Gansterer1;~Nils_Morten_Kriege1", "gender": ";M;Not Specified;;M", "homepage": "https://dm.cs.univie.ac.at/team/person/112939/;http://samirmoustafa.net/;https://www.simula.no/people/langguth;;https://kriegegroup.univie.ac.at/", "dblp": "234/8688;https://dblp.uni-trier.de/pid/358/6919;;;97/8178", "google_scholar": "UTQlpH8AAAAJ;tAUUlfAAAAAJ;;;https://scholar.google.de/citations?user=wGT17PcAAAAJ", "orcid": "0000-0003-4202-3692;0000-0002-0674-9667;;;0000-0003-2645-947X", "linkedin": ";samirmoustafa/;;;", "or_profile": "~Franka_Bause1;~Samir_Moustafa1;~Johannes_Langguth2;~Wilfried_N._Gansterer1;~Nils_Morten_Kriege1", "aff": "Universit\u00e4t Vienna;Universit\u00e4t Vienna;Simula Research Laboratory;;Universit\u00e4t Vienna", "aff_domain": "univie.ac.at;univie.ac.at;simula.no;;univie.ac.at", "position": "PhD student;PhD student;Researcher;;Associate Professor", "bibtex": "@misc{\nbause2024nonredundant,\ntitle={Non-Redundant Graph Neural Networks with Improved Expressiveness},\nauthor={Franka Bause and Samir Moustafa and Johannes Langguth and Wilfried N. 
Gansterer and Nils Morten Kriege},\nyear={2024},\nurl={https://openreview.net/forum?id=AlkANue4lm}\n}", "github": "", "project": "", "reviewers": "h7VD;zntd;e2WG;8Vsr", "site": "https://openreview.net/forum?id=AlkANue4lm", "pdf_size": 444009, "rating": "3;3;5;6", "confidence": "4;3;3;3", "soundness": "2;3;3;3", "contribution": "2;2;2;3", "presentation": "2;3;2;4", "wc_summary": "59;36;57;48", "wc_strengths": "23;42;27;45", "wc_weaknesses": "150;98;374;79", "wc_questions": "156;23;39;93", "wc_review": "388;199;497;265", "wc_reply_reviewers": "93;0;77;40", "wc_reply_authors": "277;314;410;287", "reply_reviewers": "1;0;1;1", "reply_authors": "1;1;2;1", "rating_avg": [ 4.25, 1.299038105676658 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.82915619758885 ], "wc_summary_avg": [ 50.0, 9.082951062292475 ], "wc_strengths_avg": [ 34.25, 9.41740410091868 ], "wc_weaknesses_avg": [ 175.25, 117.65495102204582 ], "wc_questions_avg": [ 77.75, 52.093065757353926 ], "wc_review_avg": [ 337.25, 114.48662585647286 ], "wc_reply_reviewers_avg": [ 52.5, 35.892199709686224 ], "wc_reply_authors_avg": [ 322.0, 52.578512721453045 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.5555555555555555, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:81w9TdYd-DoJ:scholar.google.com/&scioq=Non-Redundant+Graph+Neural+Networks+with+Improved+Expressiveness&hl=en&as_sdt=0,31", "gs_version_total": 0, "aff_unique_index": "0;0;1;0", "aff_unique_norm": "University of Vienna;Simula Research Laboratory", "aff_unique_dep": ";", "aff_unique_url": "https://univie.ac.at;https://www.simula.no", "aff_unique_abbr": "UV;Simula", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;1;0", "aff_country_unique": "Austria;Norway" }, { "id": "AnPX5Jual9", "title": "Rotative Factorization Machines", "track": "main", "status": "Reject", "tldr": "", "abstract": "Feature interaction learning, which focuses on capturing the complex relationships among multiple features, is crucial in various real-world predictive tasks.\nHowever, most feature interaction approaches empirically enumerate all feature interactions within a predefined maximal order, which leads to suboptimal results due to the restricted learning capacity.\nSome recent studies propose intricate transformations to convert the feature interaction orders into learnable parameters, enabling them to automatically learn the interactions from data.\nDespite the progress, the interaction order of each feature is often independently learned, which lacks the flexibility to capture the feature dependencies in the varying context.\nIn addition, they can only model the feature interactions within a bounded order due to the exponential growth of the interaction terms.\nTo address these issues, we present a Rotative Factorization Machine (RFM).\nUnlike prior studies, RFM represents each feature as a polar angle in the complex plane.\nAs such, the feature interactions are converted into a series of complex rotations, where the orders are cast into the rotation coefficients, thereby allowing for the learning of arbitrarily large order. 
\nFurther, we propose a novel self-attentive rotation function that models the rotation coefficients through a rotation-based attention mechanism, which can adaptively learn the interaction orders from different interaction contexts.\nMoreover, it incorporates a modulus amplification network to learn the modulus of the complex features that further enhances the representations.\nSuch a network can adaptively capture the feature interactions in the varying context, with no need of predefined order coefficients.\nExtensive experiments conducted on five widely used datasets have demonstrated the effectiveness of our approach.", "keywords": "Feature Interaction;Neural Networks;Self-Attentive Rotation", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/006fcd0b1329983605b37ad954cf666d40109fab.zip", "author": "Zhen Tian;Yuhong Shi;Xiangkun Wu;Xin Zhao;Ji-Rong Wen", "authorids": "~Zhen_Tian1;~Yuhong_Shi1;~Xiangkun_Wu1;~Xin_Zhao10;~Ji-Rong_Wen1", "gender": "M;F;M;M;M", "homepage": "https://www.tianzhen.xyz;https://github.com/littlerain51;https://github.com/as112sa;https://gsai.ruc.edu.cn/addons/teacher/index/info.html?user_id=5&ruccode=20140041&ln=cn;https://gsai.ruc.edu.cn/english/jrwen", "dblp": "84/8525-1;;;https://dblp.uni-trier.de/pid/52/8700.html;w/JRWen", "google_scholar": "MBDadZUAAAAJ;;;JNhNacoAAAAJ;tbxCHJgAAAAJ", "orcid": "0000-0001-5569-2591;;;0000-0002-8333-6196;0000-0002-9777-9676", "linkedin": ";;;;", "or_profile": "~Zhen_Tian1;~Yuhong_Shi1;~Xiangkun_Wu1;~Xin_Zhao10;~Ji-Rong_Wen1", "aff": "Renmin University of China;Zhejiang University;Zhejiang University;Renmin University of China;Renmin University of China", "aff_domain": "ruc.edu.cn;zju.edu.cn;zju.edu.cn;ruc.edu.cn;ruc.edu.cn", "position": "MS student;MS student;PhD student;Full Professor;Full Professor", "bibtex": "@misc{\ntian2024rotative,\ntitle={Rotative Factorization Machines},\nauthor={Zhen Tian and Yuhong Shi and Xiangkun Wu and Xin Zhao and Ji-Rong Wen},\nyear={2024},\nurl={https://openreview.net/forum?id=AnPX5Jual9}\n}", "github": "", "project": "", "reviewers": "7fiD;5eVE;LHqT;f3tV", "site": "https://openreview.net/forum?id=AnPX5Jual9", "pdf_size": 1019592, "rating": "3;5;5;6", "confidence": "2;4;5;5", "soundness": "2;3;2;4", "contribution": "2;2;2;3", "presentation": "2;3;3;3", "wc_summary": "90;73;25;29", "wc_strengths": "54;21;10;42", "wc_weaknesses": "103;33;174;165", "wc_questions": "115;5;292;161", "wc_review": "362;132;501;397", "wc_reply_reviewers": "0;0;0;18", "wc_reply_authors": "849;487;1582;1104", "reply_reviewers": "0;0;0;1", "reply_authors": "2;1;3;2", "rating_avg": [ 4.75, 1.0897247358851685 ], "confidence_avg": [ 4.0, 1.224744871391589 ], "soundness_avg": [ 2.75, 0.82915619758885 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 54.25, 27.94078560098123 ], "wc_strengths_avg": [ 31.75, 17.239127008059313 ], "wc_weaknesses_avg": [ 118.75, 56.55251983775789 ], "wc_questions_avg": [ 143.25, 102.89891884757584 ], "wc_review_avg": [ 348.0, 134.77944947209124 ], "wc_reply_reviewers_avg": [ 4.5, 7.794228634059948 ], "wc_reply_authors_avg": [ 1005.5, 398.55645773215116 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 2.0, 0.7071067811865476 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.9365858115816939, "gs_citation": 1, "gs_cited_by_link": 
"https://scholar.google.com/scholar?cites=12588312293281606905&as_sdt=5,31&sciodt=0,31&hl=en", "gs_version_total": 2, "aff_unique_index": "0;1;1;0;0", "aff_unique_norm": "Renmin University of China;Zhejiang University", "aff_unique_dep": ";", "aff_unique_url": "http://www.ruc.edu.cn;https://www.zju.edu.cn", "aff_unique_abbr": "RUC;ZJU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "China" }, { "id": "AnuHbhwv9Q", "title": "Out of the Ordinary: Spectrally Adapting Regression for Covariate Shift", "track": "main", "status": "Reject", "tldr": "", "abstract": "Designing deep neural network classifiers that perform robustly on distributions differing from the available training data is an active area of machine learning research. However, out-of-distribution generalization for regression---the analogous problem for modeling continuous targets---remains relatively unexplored. To tackle this problem, we return to first principles and analyze how the closed-form solution for ordinary least squares (OLS) regression is sensitive to covariate shift. We characterize the out-of-distribution risk of the OLS model in terms of the eigenspectrum decomposition of the source and target data. We then use this insight to propose a method for adapting the weights of the last layer of a pre-trained neural regression model to perform better on input data originating from a different distribution. We demonstrate how this lightweight spectral adaptation procedure can improve out-of-distribution performance in a suite of both synthetic and real-world experiments.", "keywords": "Distribution-Shift;Domain-Adaptation;Robust-Machine-Learning", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/26f313c9f1b463906a918f78389d8f790ee44d47.zip", "author": "Benjamin Eyre;Elliot Creager;David Madras;Vardan Papyan;Richard Zemel", "authorids": "~Benjamin_Eyre1;~Elliot_Creager1;~David_Madras1;~Vardan_Papyan1;~Richard_Zemel1", "gender": "M;M;M;M;M", "homepage": ";https://ecreager.github.io/;http://www.cs.toronto.edu/~madras/;https://sites.google.com/view/vardan-papyan;http://www.cs.columbia.edu/~zemel", "dblp": ";182/2055;188/6211;173/9783;16/6366", "google_scholar": "https://scholar.google.ca/citations?user=Ww1QOOkAAAAJ;boebIUcAAAAJ;MgnNDpkAAAAJ;https://scholar.google.co.il/citations?user=VrE-Gd4AAAAJ;https://scholar.google.ca/citations?user=iBeDoRAAAAAJ", "orcid": ";0009-0004-7122-3866;;;", "linkedin": ";;;;", "or_profile": "~Benjamin_Eyre1;~Elliot_Creager1;~David_Madras1;~Vardan_Papyan1;~Richard_Zemel1", "aff": "Google;University of Waterloo;Google;University of Toronto;Department of Computer Science, University of Toronto", "aff_domain": "google.com;uwaterloo.ca;google.com;toronto.edu;cs.toronto.edu", "position": "Intern;Assistant Professor;Researcher;Assistant Professor;Full Professor", "bibtex": "@misc{\neyre2024out,\ntitle={Out of the Ordinary: Spectrally Adapting Regression for Covariate Shift},\nauthor={Benjamin Eyre and Elliot Creager and David Madras and Vardan Papyan and Richard Zemel},\nyear={2024},\nurl={https://openreview.net/forum?id=AnuHbhwv9Q}\n}", "github": "", "project": "", "reviewers": "11sP;TGia;ZgCX;FNwT", "site": "https://openreview.net/forum?id=AnuHbhwv9Q", "pdf_size": 1038725, "rating": "5;6;6;8", "confidence": "3;3;4;4", "soundness": "2;2;3;3", "contribution": "2;2;3;3", "presentation": "3;3;3;4", "wc_summary": "102;105;82;179", 
"wc_strengths": "74;52;106;147", "wc_weaknesses": "97;190;75;120", "wc_questions": "168;4;44;305", "wc_review": "441;351;307;751", "wc_reply_reviewers": "497;16;0;224", "wc_reply_authors": "942;179;203;999", "reply_reviewers": "2;1;0;2", "reply_authors": "3;1;2;4", "rating_avg": [ 6.25, 1.0897247358851685 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 117.0, 36.871398129173244 ], "wc_strengths_avg": [ 94.75, 35.75874019033668 ], "wc_weaknesses_avg": [ 120.5, 43.165379646193315 ], "wc_questions_avg": [ 130.25, 117.62307384182748 ], "wc_review_avg": [ 462.5, 173.42649739875392 ], "wc_reply_reviewers_avg": [ 184.25, 201.0278276756728 ], "wc_reply_authors_avg": [ 580.75, 390.3628920632698 ], "reply_reviewers_avg": [ 1.25, 0.82915619758885 ], "reply_authors_avg": [ 2.5, 1.118033988749895 ], "replies_avg": [ 23, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.6882472016116854, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=711905381529530377&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 7, "aff_unique_index": "0;1;0;2;2", "aff_unique_norm": "Google;University of Waterloo;University of Toronto", "aff_unique_dep": "Google;;", "aff_unique_url": "https://www.google.com;https://uwaterloo.ca;https://www.utoronto.ca", "aff_unique_abbr": "Google;UW;U of T", "aff_campus_unique_index": "0;0;2", "aff_campus_unique": "Mountain View;;Toronto", "aff_country_unique_index": "0;1;0;1;1", "aff_country_unique": "United States;Canada" }, { "id": "Ao4O1kNK9h", "title": "Scaling Properties For Artificial Neural Network Models of the $\\textit{C. elegans}$ Nervous System", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "The nematode worm $\\textit{C. elegans}$ enables straightforward optical measurement of neural activity, presenting a unique platform for exploring intrinsic neural dynamics. This paper investigates the scaling properties essential for self-supervised neural activity prediction based on past neural data, omitting behavioral aspects. Specifically, we investigate how predictive accuracy, quantified by the mean squared error (MSE), scales with the amount of training data, considering variables such as the number of neurons recorded, recording duration, and diversity of datasets. We also examine the relationship between these scaling properties and various parameters of artificial neural network models (ANNs), including size, architecture, and hyperparameters. Employing the nervous system of $\\textit{C. elegans}$ as an experimental platform, we elucidate the critical influence of data volume and model complexity in self-supervised neural prediction, demonstrating a logarithmic decrease in the MSE with an increase in the amount of training data, consistent across diverse datasets. Additionally, we observe nonlinear changes in MSE as the size of the ANN model varies. These findings emphasize the need for enhanced high-throughput tools for extended imaging of entire mesoscale nervous systems to acquire sufficient data for developing highly accurate ANN models of neural dynamics, with significant implications for systems neuroscience and biologically-inspired AI.", "keywords": "$\\textit{C. 
elegans}$;scaling properties;neural dynamics;self-supervised prediction;ANNs", "primary_area": "applications to neuroscience & cognitive science", "supplementary_material": "", "author": "Quilee Simeon;Leandro Risso Ven\u00e2ncio;Kaiya Ivy Zhao;Aran Nayebi;Michael Skuhersky;Edward Boyden;Guangyu Robert Yang", "authorids": "~Quilee_Simeon1;~Leandro_Risso_Ven\u00e2ncio1;~Kaiya_Ivy_Zhao1;~Aran_Nayebi2;~Michael_Skuhersky1;~Edward_Boyden1;~Guangyu_Robert_Yang1", "gender": "M;M;F;;Not Specified;M;M", "homepage": "https://qsimeon.github.io/;;https://kyzhao-ivy.github.io/;https://anayebi.github.io/;http://web.mit.edu/vex/www/;http://synthneuro.org;https://www.metaconscious.org/", "dblp": ";;;43/7661;;;", "google_scholar": ";;N0yuICkAAAAJ;https://scholar.google.com/citations?hl=en;kWibszMAAAAJ;q2rHA5QAAAAJ;hrI8aH8AAAAJ", "orcid": "0000-0003-4561-5087;0009-0002-0924-5218;;;;;0000-0002-8919-4248", "linkedin": "quilee-simeon-7843a3178/;rissov-leandro/;kaiya-zhao-910830218/;;;edboyden/;", "or_profile": "~Quilee_Simeon1;~Leandro_Risso_Ven\u00e2ncio1;~Kaiya_Ivy_Zhao1;~Aran_Nayebi2;~Michael_Skuhersky1;~Edward_Boyden1;~Guangyu_Robert_Yang1", "aff": "Massachusetts Institute of Technology;Universidade Federal de S\u00e3o Carlos;Fudan University;Massachusetts Institute of Technology;;Massachusetts Institute of Technology;Massachusetts Institute of Technology", "aff_domain": "mit.edu;ufscar.br;fudan.edu.cn;mit.edu;;mit.edu;mit.edu", "position": "PhD Student;Undergrad student;Undergrad student;Postdoc;;Full Professor;Assistant Professor", "bibtex": "@misc{\nsimeon2024scaling,\ntitle={Scaling Properties For Artificial Neural Network Models of the \\${\\textbackslash}textit\\{C. elegans\\}\\$ Nervous System},\nauthor={Quilee Simeon and Leandro Risso Ven{\\^a}ncio and Kaiya Ivy Zhao and Aran Nayebi and Michael Skuhersky and Edward Boyden and Guangyu Robert Yang},\nyear={2024},\nurl={https://openreview.net/forum?id=Ao4O1kNK9h}\n}", "github": "", "project": "", "reviewers": "3D8y;3Phf;KaWC", "site": "https://openreview.net/forum?id=Ao4O1kNK9h", "pdf_size": 944569, "rating": "3;5;5", "confidence": "5;2;4", "soundness": "2;2;2", "contribution": "2;2;2", "presentation": "1;3;3", "wc_summary": "150;38;58", "wc_strengths": "50;20;54", "wc_weaknesses": "638;130;138", "wc_questions": "49;595;271", "wc_review": "887;783;521", "wc_reply_reviewers": "325;272;85", "wc_reply_authors": "1298;1431;648", "reply_reviewers": "2;1;1", "reply_authors": "2;3;1", "rating_avg": [ 4.333333333333333, 0.9428090415820634 ], "confidence_avg": [ 3.6666666666666665, 1.247219128924647 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.3333333333333335, 0.9428090415820634 ], "wc_summary_avg": [ 82.0, 48.771576421791686 ], "wc_strengths_avg": [ 41.333333333333336, 15.173075568988056 ], "wc_weaknesses_avg": [ 302.0, 237.61032525264272 ], "wc_questions_avg": [ 305.0, 224.19634252146042 ], "wc_review_avg": [ 730.3333333333334, 153.98989865860972 ], "wc_reply_reviewers_avg": [ 227.33333333333334, 102.94442945373758 ], "wc_reply_authors_avg": [ 1125.6666666666667, 342.09777679617986 ], "reply_reviewers_avg": [ 1.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 2.0, 0.816496580927726 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.7559289460184544, "gs_citation": -1, "gs_cited_by_link": "", "gs_version_total": -1, "aff_unique_index": "0;1;2;0;0;0", "aff_unique_norm": "Massachusetts Institute of Technology;Universidade Federal de S\u00e3o Carlos;Fudan University", 
"aff_unique_dep": ";;", "aff_unique_url": "https://web.mit.edu;http://www.ufscar.br;https://www.fudan.edu.cn", "aff_unique_abbr": "MIT;UFSCar;Fudan", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;2;0;0;0", "aff_country_unique": "United States;Brazil;China" }, { "id": "AoRIT2Uzfg", "title": "DRMGuard: Defending Deep Regression Models against Backdoor Attacks", "track": "main", "status": "Reject", "tldr": "", "abstract": "Deep regression models are used in a wide variety of safety-critical applications, but are vulnerable to backdoor attacks. Although many defenses have been proposed for classification models, they are ineffective as they do not consider the uniqueness of regression models. First, the outputs of regression models are continuous values instead of discretized labels. Thus, the potential infected target of a backdoored regression model has infinite possibilities, which makes it impossible to be determined by existing defenses. Second, the backdoor behavior of backdoored deep regression models is triggered by the activation values of all the neurons in the feature space, which makes it difficult to be detected and mitigated using existing defenses. To resolve these problems, we propose DRMGuard, the first defense to identify if a deep regression model in the image domain is backdoored or not. DRMGuard formulates the optimization problem for reverse engineering based on the unique output-space and feature-space characteristics of backdoored deep regression models. We conduct extensive evaluations on two regression tasks and four datasets. The results show that DRMGuard can consistently defend against various backdoor attacks. We also generalize four state-of-the-art defenses designed for classifiers to regression models, and compare DRMGuard with them. The results show that DRMGuard significantly outperforms all those defenses. 
The code will be open-sourced upon paper acceptance.", "keywords": "Defend;reverse engineering;backdoor attack;deep regression model", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/9db40cbe5e38cc894ee3ff27e9a76d803ce21ba0.pdf", "author": "Lingyu Du;Yupei Liu;Jinyuan Jia;Guohao Lan", "authorids": "~Lingyu_Du1;~Yupei_Liu1;~Jinyuan_Jia2;~Guohao_Lan1", "gender": "M;M;;M", "homepage": "https://github.com/LingyuDu;https://liu00222.github.io/;https://jinyuan-jia.github.io/;https://guohao.netlify.app/", "dblp": ";204/1178;24/5124-1.html;178/9755.html", "google_scholar": ";52VEwW8AAAAJ;iyg4ytkAAAAJ;1ebZN5gAAAAJ", "orcid": ";0000-0003-4300-758X;0000-0002-9785-7769;", "linkedin": ";yupei-liu-39236912b;;", "or_profile": "~Lingyu_Du1;~Yupei_Liu1;~Jinyuan_Jia2;~Guohao_Lan1", "aff": "Delft University of Technology;MathWorks;Pennsylvania State University;Delft University of Technology", "aff_domain": "tudelft.nl;mathworks.com;psu.edu;tudelft.nl", "position": "PhD student;Software Engineer;Assistant Professor;Assistant Professor", "bibtex": "@misc{\ndu2024drmguard,\ntitle={{DRMG}uard: Defending Deep Regression Models against Backdoor Attacks},\nauthor={Lingyu Du and Yupei Liu and Jinyuan Jia and Guohao Lan},\nyear={2024},\nurl={https://openreview.net/forum?id=AoRIT2Uzfg}\n}", "github": "", "project": "", "reviewers": "tXTC;FMPV;WvrB", "site": "https://openreview.net/forum?id=AoRIT2Uzfg", "pdf_size": 1298267, "rating": "3;3;8", "confidence": "4;5;5", "soundness": "3;1;3", "contribution": "1;2;3", "presentation": "3;2;3", "wc_summary": "35;136;45", "wc_strengths": "15;17;24", "wc_weaknesses": "53;112;127", "wc_questions": "9;59;4", "wc_review": "112;324;200", "wc_reply_reviewers": "0;0;24", "wc_reply_authors": "792;653;699", "reply_reviewers": "0;0;1", "reply_authors": "3;3;2", "rating_avg": [ 4.666666666666667, 2.357022603955158 ], "confidence_avg": [ 4.666666666666667, 0.4714045207910317 ], "soundness_avg": [ 2.3333333333333335, 0.9428090415820634 ], "contribution_avg": [ 2.0, 0.816496580927726 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 72.0, 45.43860326491855 ], "wc_strengths_avg": [ 18.666666666666668, 3.8586123009300755 ], "wc_weaknesses_avg": [ 97.33333333333333, 31.94091767971331 ], "wc_questions_avg": [ 24.0, 24.8327740429189 ], "wc_review_avg": [ 212.0, 86.96359391530842 ], "wc_reply_reviewers_avg": [ 8.0, 11.313708498984761 ], "wc_reply_authors_avg": [ 714.6666666666666, 57.81772123569805 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 2.6666666666666665, 0.4714045207910317 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.5, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:p41sdQqsYE8J:scholar.google.com/&scioq=DRMGuard:+Defending+Deep+Regression+Models+against+Backdoor+Attacks&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1;2;0", "aff_unique_norm": "Delft University of Technology;MathWorks;Pennsylvania State University", "aff_unique_dep": ";;", "aff_unique_url": "https://www.tudelft.nl;https://www.mathworks.com;https://www.psu.edu", "aff_unique_abbr": "TU Delft;MathWorks;PSU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;1;0", "aff_country_unique": "Netherlands;United States" }, { "id": "Ap344YqCcD", "title": "Imitation Bootstrapped Reinforcement Learning", "track": "main", "status": "Withdraw", "tldr": "", 
"abstract": "Despite the considerable potential of reinforcement learning (RL), robotics control tasks predominantly rely on imitation learning (IL) owing to its better sample efficiency.\nHowever, given the high cost of collecting extensive demonstrations, RL is still appealing if it can utilize limited imitation data for efficient autonomous self-improvement.\nExisting RL methods that utilize demonstrations either initialize the replay buffer with demonstrations and oversample them during RL training, which does not benefit from the generalization potential of modern IL methods, or pretrain the RL policy with IL on the demonstrations, which requires additional mechanisms to prevent catastrophic forgetting during RL fine-tuning.\nWe propose _imitation bootstrapped reinforcement learning_ (IBRL), a novel framework that first trains an IL policy on a limited number of demonstrations and then uses it to propose alternative actions for both online exploration and target value bootstrapping.\nIBRL achieves SoTA performance and sample efficiency on 7 challenging sparse reward continuous control tasks in simulation while learning directly from pixels. \nAs a highlight of our method, IBRL achieves $\\mathbf{6.4\\times}$ higher success rate than RLPD, a strong method that combines the idea of oversampling demonstrations with modern RL improvements, under the budget of **10** demos and **100K** interactions in the challenging PickPlaceCan task in the Robomimic benchmark.", "keywords": "reinforcement learning;robotics;continuous control", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Hengyuan Hu;Suvir Mirchandani;Dorsa Sadigh", "authorids": "~Hengyuan_Hu2;~Suvir_Mirchandani1;~Dorsa_Sadigh1", "gender": "M;F;M", "homepage": "http://suvirpmirchandani.com;https://dorsa.fyi/;", "dblp": "287/4981;117/3174;", "google_scholar": "fz7LJPIAAAAJ;ZaJEZpYAAAAJ;oF46lMIAAAAJ", "orcid": ";;", "linkedin": ";;", "or_profile": "~Suvir_Mirchandani1;~Dorsa_Sadigh1;~Hengyuan_Hu1", "aff": "Stanford University;Stanford University;Computer Science Department, Stanford University", "aff_domain": "stanford.edu;stanford.edu;cs.stanford.edu", "position": "PhD student;Assistant Professor;PhD student", "bibtex": "@misc{\nhu2024imitation,\ntitle={Imitation Bootstrapped Reinforcement Learning},\nauthor={Hengyuan Hu and Suvir Mirchandani and Dorsa Sadigh},\nyear={2024},\nurl={https://openreview.net/forum?id=Ap344YqCcD}\n}", "github": "", "project": "", "reviewers": "8Ymy;GwQ8;iZef;k6EZ", "site": "https://openreview.net/forum?id=Ap344YqCcD", "pdf_size": 1495869, "rating": "5;5;6;6", "confidence": "3;3;4;4", "soundness": "2;3;3;2", "contribution": "2;2;2;2", "presentation": "2;3;3;3", "wc_summary": "45;65;387;118", "wc_strengths": "44;91;151;68", "wc_weaknesses": "125;140;371;198", "wc_questions": "24;51;97;10", "wc_review": "238;347;1006;394", "wc_reply_reviewers": "198;122;58;25", "wc_reply_authors": "870;1181;1505;787", "reply_reviewers": "1;1;1;1", "reply_authors": "3;3;3;2", "rating_avg": [ 5.5, 0.5 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 153.75, 137.28323823395192 ], "wc_strengths_avg": [ 88.5, 39.72719471596252 ], "wc_weaknesses_avg": [ 208.5, 97.69979529149485 ], "wc_questions_avg": [ 45.5, 33.185087012090236 ], "wc_review_avg": [ 496.25, 299.69515761853745 ], "wc_reply_reviewers_avg": [ 100.75, 66.09604753689891 ], "wc_reply_authors_avg": [ 1085.75, 
283.1266280306393 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 2.75, 0.4330127018922193 ], "replies_avg": [ 21, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 1.0, "gs_citation": 27, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12607106594968839768&as_sdt=5,47&sciodt=0,47&hl=en", "gs_version_total": 6, "aff_unique_index": "0;0;0", "aff_unique_norm": "Stanford University", "aff_unique_dep": "", "aff_unique_url": "https://www.stanford.edu", "aff_unique_abbr": "Stanford", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Stanford", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "ApjY32f3Xr", "title": "PINNacle: A Comprehensive Benchmark of Physics-Informed Neural Networks for Solving PDEs", "track": "main", "status": "Reject", "tldr": "", "abstract": "While significant progress has been made on Physics-Informed Neural Networks (PINNs), a comprehensive comparison of these methods across a wide range of Partial Differential Equations (PDEs) is still lacking. This study introduces PINNacle, a benchmarking tool designed to fill this gap. PINNacle provides a diverse dataset, comprising over 20 distinct PDEs from various domains including heat conduction, fluid dynamics, biology, and electromagnetics. These PDEs encapsulate key challenges inherent to real-world problems, such as complex geometry, multi-scale phenomena, nonlinearity, and high dimensionality. PINNacle also offers a user-friendly toolbox, incorporating about 10 state-of-the-art PINN methods for systematic evaluation and comparison. We have conducted extensive experiments with these methods, offering insights into their strengths and weaknesses. In addition to providing a standardized means of assessing performance, PINNacle also offers an in-depth analysis to guide future research, particularly in areas such as domain decomposition methods and loss reweighting for handling multi-scale problems and complex geometry. 
While PINNacle does not guarantee success in all real-world scenarios, it represents a significant contribution to the field by offering a robust, diverse, and comprehensive benchmark suite that will undoubtedly foster further research and development in PINNs.", "keywords": "PINN;machine learning;physics-informed machine learning", "primary_area": "datasets and benchmarks", "supplementary_material": "/attachment/38585e83cfcd145e3816bd1154c966361c146b92.pdf", "author": "Zhongkai Hao;Jiachen Yao;Chang Su;Hang Su;Ziao Wang;Fanzhi Lu;Zeyu Xia;Yichi Zhang;Songming Liu;Lu Lu;Jun Zhu", "authorids": "~Zhongkai_Hao1;~Jiachen_Yao3;~Chang_Su7;~Hang_Su3;~Ziao_Wang2;~Fanzhi_Lu1;~Zeyu_Xia4;~Yichi_Zhang4;~Songming_Liu1;~Lu_Lu1;~Jun_Zhu2", "gender": "M;M;M;F;M;M;M;M;M;M;M", "homepage": "https://jiachenyao.com/;https://github.com/EdwardIX;https://wangziao9.github.io/;https://github.com/FortuniaL;;https://zycheiheihei.github.io;;https://lu.seas.upenn.edu;http://ml.cs.tsinghua.edu.cn/~jun;;https://haozhongkai.github.io/", "dblp": "213/4920;;;;;;285/4585;01/2086-10;50/2644-1;26/5371-6;270/0220.html", "google_scholar": "Z_bCoGcAAAAJ;;;;https://scholar.google.com/citations?hl=en;HzgDakoAAAAJ;6urFg8kAAAAJ;wD_wsWUAAAAJ;axsP38wAAAAJ;dxN1_X0AAAAJ;dfSzq27ZiVoC", "orcid": "0000-0001-7655-7831;;;;;0000-0002-1894-3977;;0000-0002-5476-5768;;;", "linkedin": "jiachen-y-05a05932a/;;;;;;%E6%9D%BE%E9%93%AD-%E5%88%98-7b8339254/;;;;", "or_profile": "~Jiachen_Yao3;~Chang_Su7;~Ziao_Wang2;~Fanzhi_Lu1;~Zeyu_Xia4;~Yichi_Zhang4;~Songming_Liu1;~Lu_Lu1;~Jun_Zhu2;~Hang_Su2;~Hao_Zhongkai1", "aff": "Tsinghua University;Tsinghua University;, University of California, Santa Barbara;Tsinghua University;Tsinghua University;Tsinghua University;Tsinghua University;Yale University;Tsinghua University;Tsinghua University;Tsinghua University", "aff_domain": "tsinghua.edu.cn;tsinghua.edu.cn;cs.ucsb.edu;tsinghua.edu.cn;mail.tsinghua.edu.cn;tsinghua.edu.cn;mails.tsinghua.edu.cn;yale.edu;mail.tsinghua.edu.cn;tsinghua.edu.cn;mails.tsinghua.edu.cn", "position": "Undergrad student;Undergrad student;MS student;Undergrad student;Undergrad student;PhD student;PhD student;Assistant Professor;Professor;Associate Professor;PhD student", "bibtex": "@misc{\nhao2024pinnacle,\ntitle={{PINN}acle: A Comprehensive Benchmark of Physics-Informed Neural Networks for Solving {PDE}s},\nauthor={Zhongkai Hao and Jiachen Yao and Chang Su and Hang Su and Ziao Wang and Fanzhi Lu and Zeyu Xia and Yichi Zhang and Songming Liu and Lu Lu and Jun Zhu},\nyear={2024},\nurl={https://openreview.net/forum?id=ApjY32f3Xr}\n}", "github": "", "project": "", "reviewers": "oeuE;xNZs;RGvf;Ytqc", "site": "https://openreview.net/forum?id=ApjY32f3Xr", "pdf_size": 861377, "rating": "3;6;6;6", "confidence": "5;3;3;3", "soundness": "2;3;4;3", "contribution": "1;2;4;3", "presentation": "4;3;4;3", "wc_summary": "55;273;53;41", "wc_strengths": "26;233;92;50", "wc_weaknesses": "54;127;227;517", "wc_questions": "125;105;4;13", "wc_review": "260;738;376;621", "wc_reply_reviewers": "292;0;0;290", "wc_reply_authors": "295;522;237;596", "reply_reviewers": "1;0;0;1", "reply_authors": "1;1;1;2", "rating_avg": [ 5.25, 1.299038105676658 ], "confidence_avg": [ 3.5, 0.8660254037844386 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 2.5, 1.118033988749895 ], "presentation_avg": [ 3.5, 0.5 ], "wc_summary_avg": [ 105.5, 96.85427197599495 ], "wc_strengths_avg": [ 100.25, 80.20091957078796 ], "wc_weaknesses_avg": [ 231.25, 176.0374605020193 ], "wc_questions_avg": [ 61.75, 53.8115926172047 ], 
"wc_review_avg": [ 498.75, 189.90441674695194 ], "wc_reply_reviewers_avg": [ 145.5, 145.50171820291334 ], "wc_reply_authors_avg": [ 412.5, 150.22399941420812 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 11, 0 ], "corr_rating_confidence": -1.0, "gs_citation": 43, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12178264276662821414&as_sdt=5,31&sciodt=0,31&hl=en", "gs_version_total": 5, "aff_unique_index": "0;0;1;0;0;0;0;2;0;0;0", "aff_unique_norm": "Tsinghua University;University of California, Santa Barbara;Yale University", "aff_unique_dep": ";;", "aff_unique_url": "https://www.tsinghua.edu.cn;https://www.ucsb.edu;https://www.yale.edu", "aff_unique_abbr": "THU;UCSB;Yale", "aff_campus_unique_index": "1", "aff_campus_unique": ";Santa Barbara", "aff_country_unique_index": "0;0;1;0;0;0;0;1;0;0;0", "aff_country_unique": "China;United States" }, { "title": "Critical Learning Periods Emerge Even in Deep Linear Networks", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19239", "id": "Aq35gl2c1k", "author_site": "Michael Kleinman, Alessandro Achille, Stefano Soatto", "tldr": "", "abstract": "Critical learning periods are periods early in development where temporary sensory deficits can have a permanent effect on behavior and learned representations. \nDespite the radical differences between biological and artificial networks, critical learning periods have been empirically observed in both systems. This suggests that critical periods may be fundamental to learning and not an accident of biology.\nYet, why exactly critical periods emerge in deep networks is still an open question, and in particular it is unclear whether the critical periods observed in both systems depend on particular architectural or optimization details. To isolate the key underlying factors, we focus on deep linear network models, and show that, surprisingly, such networks also display much of the behavior seen in biology and artificial networks, while being amenable to analytical treatment. We show that critical periods depend on the depth of the model and structure of the data distribution. We also show analytically and in simulations that the learning of features is tied to competition between sources. Finally, we extend our analysis to multi-task learning to show that pre-training on certain tasks can damage the transfer performance on new tasks, and show how this depends on the relationship between tasks and the duration of the pre-training stage. 
To the best of our knowledge, our work provides the first analytically tractable model that sheds light into why critical learning periods emerge in biological and artificial networks.", "keywords": "critical learning periods;deep neural networks;gradient descent;linear networks", "primary_area": "applications to neuroscience & cognitive science", "supplementary_material": "", "author": "Michael Kleinman;Alessandro Achille;Stefano Soatto", "authorids": "~Michael_Kleinman2;~Alessandro_Achille1;~Stefano_Soatto1", "gender": ";M;", "homepage": ";;https://www.cs.ucla.edu/~soatto", "dblp": "276/0181;190/7328;08/1262", "google_scholar": "https://scholar.google.ca/citations?user=b5c-VcMAAAAJ;;lH1PdF8AAAAJ", "orcid": ";;0000-0003-2902-6362", "linkedin": ";;stefano-soatto-5765aa6/", "or_profile": "~Michael_Kleinman2;~Alessandro_Achille1;~Stefano_Soatto2", "aff": "Stanford University;Amazon;UCLA Computer Science Department, University of California, Los Angeles", "aff_domain": "stanford.edu;amazon.com;cs.ucla.edu", "position": "Postdoc;Applied Research Scientist;Professor", "bibtex": "@inproceedings{\nkleinman2024critical,\ntitle={Critical Learning Periods Emerge Even in Deep Linear Networks},\nauthor={Michael Kleinman and Alessandro Achille and Stefano Soatto},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=Aq35gl2c1k}\n}", "github": "", "project": "", "reviewers": "SR9U;uHcm;qaj6;PVne", "pdf_size": 1610853, "rating": "5;6;8;10", "confidence": "3;3;3;4", "soundness": "3;3;3;4", "contribution": "3;2;3;3", "presentation": "3;2;3;4", "wc_summary": "109;65;185;95", "wc_strengths": "69;33;120;68", "wc_weaknesses": "149;89;172;359", "wc_questions": "4;23;106;227", "wc_review": "331;210;583;749", "wc_reply_reviewers": "0;21;77;0", "wc_reply_authors": "836;542;510;938", "reply_reviewers": "0;1;2;0", "reply_authors": "2;1;2;2", "rating_avg": [ 7.25, 1.920286436967152 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 113.5, 44.23516700544941 ], "wc_strengths_avg": [ 72.5, 31.0201547384922 ], "wc_weaknesses_avg": [ 192.25, 100.92912116926412 ], "wc_questions_avg": [ 90.0, 87.9062000088731 ], "wc_review_avg": [ 468.25, 210.66487011364757 ], "wc_reply_reviewers_avg": [ 24.5, 31.5 ], "wc_reply_authors_avg": [ 706.5, 184.41461438833963 ], "reply_reviewers_avg": [ 0.75, 0.82915619758885 ], "reply_authors_avg": [ 1.75, 0.4330127018922193 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.8268106308031117, "gs_citation": 8, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12530288096224791156&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=Aq35gl2c1k", "pdf": "https://openreview.net/pdf?id=Aq35gl2c1k", "email": "stanford.edu;amazon.com;cs.ucla.edu", "author_num": 3, "aff_unique_index": "0;1;2", "aff_unique_norm": "Stanford University;Amazon;University of California, Los Angeles", "aff_unique_dep": ";Amazon.com, Inc.;Computer Science Department", "aff_unique_url": "https://www.stanford.edu;https://www.amazon.com;https://www.ucla.edu", "aff_unique_abbr": "Stanford;Amazon;UCLA", "aff_campus_unique_index": "0;2", "aff_campus_unique": "Stanford;;Los Angeles", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "title": "KoLA: Carefully Benchmarking 
World Knowledge of Large Language Models", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19238", "id": "AqN23oqraW", "author_site": "Jifan Yu, Xiaozhi Wang, Shangqing Tu, Shulin Cao, Daniel Zhang-Li, Xin Lv, Hao Peng, Zijun Yao, Xiaohan Zhang, Hanming Li, Chunyang Li, Zheyuan Zhang, Yushi Bai, Yantao Liu, Amy Xin, Kaifeng Yun, Linlu Gong, Nianyi Lin, Jianhui Chen, Zhili Wu, Yunjia Qi, Weikai Li, Yong Guan, Kaisheng Zeng, Ji Qi, Hailong Jin, Jinxin Liu, Yu Gu, Yuan Yao, Ning Ding, Lei Hou, Zhiyuan Liu, Xu Bin, Jie Tang, Juanzi Li", "tldr": "", "abstract": "The unprecedented performance of large language models (LLMs) necessitates improvements in evaluations. Rather than merely exploring the breadth of LLM abilities, we believe meticulous and thoughtful designs are essential to thorough, unbiased, and applicable evaluations. Given the importance of world knowledge to LLMs, we construct a Knowledge-oriented LLM Assessment benchmark (KoLA), in which we carefully design three crucial factors: (1) For ability modeling, we mimic human cognition to form a four-level taxonomy of knowledge-related abilities, covering 19 tasks. (2) For data, to ensure fair comparisons, we use both Wikipedia, a corpus prevalently pre-trained by LLMs, along with continuously collected emerging corpora, aiming to evaluate the capacity to handle unseen data and evolving knowledge. (3) For evaluation criteria, we adopt a contrastive system, including overall standard scores for better numerical comparability across tasks and models, and a unique self-contrast metric for automatically evaluating knowledge-creating ability. We evaluate 21 open-source and commercial LLMs and obtain some intriguing findings. The KoLA dataset will be updated every three months to provide timely references for developing LLMs and knowledge-related systems.", "keywords": "Large Language Model;World Knowledge;Evolving Benchmark", "primary_area": "datasets and benchmarks", "supplementary_material": "/attachment/15ddff071c61dc0e8abdc05e3574461847222dd9.zip", "author": "Jifan Yu;Xiaozhi Wang;Shangqing Tu;Shulin Cao;Daniel Zhang-Li;Xin Lv;Hao Peng;Zijun Yao;Xiaohan Zhang;Hanming Li;Chunyang Li;Zheyuan Zhang;Yushi Bai;Yantao Liu;Amy Xin;Kaifeng Yun;Linlu GONG;Nianyi Lin;Jianhui Chen;Zhili Wu;Yunjia Qi;Weikai Li;Yong Guan;Kaisheng Zeng;Ji Qi;Hailong Jin;Jinxin Liu;Yu Gu;Yuan Yao;Ning Ding;Lei Hou;Zhiyuan Liu;Xu Bin;Jie Tang;Juanzi Li", "authorids": "~Jifan_Yu2;~Xiaozhi_Wang1;~Shangqing_Tu1;~Shulin_Cao1;~Daniel_Zhang-Li1;~Xin_Lv1;~Hao_Peng6;~Zijun_Yao2;~Xiaohan_Zhang6;~Hanming_Li1;~Chunyang_Li3;~Zheyuan_Zhang3;~Yushi_Bai1;~Yantao_Liu1;~Amy_Xin1;~Kaifeng_Yun2;~Linlu_GONG1;~Nianyi_Lin2;~Jianhui_Chen6;~Zhili_Wu1;~Yunjia_Qi1;~Weikai_Li2;~Yong_Guan2;~Kaisheng_Zeng1;~Ji_Qi2;~Hailong_Jin2;~Jinxin_Liu2;~Yu_Gu5;~Yuan_Yao12;~Ning_Ding5;~Lei_Hou2;~Zhiyuan_Liu1;~Xu_Bin1;~Jie_Tang1;~Juanzi_Li1", "gender": "M;M;M;F;M;M;M;M;F;;M;M;M;Not Specified;F;;F;;M;M;;M;M;M;;M;M;M;M;M;M;M;;;", "homepage": 
"https://yujifan0326.github.io/;https://bakser.github.io/;https://shangqingtu.github.io/;https://github.com/ShulinCao;https://github.com/Danielznn16;https://davidlvxin.github.io;;https://transirius.github.io/;;;https://lcy2723.github.io/;https://sparrowzheyuan18.github.io/;https://bys0318.github.io/;https://github.com/RicardoL1u;;;https://github.com/gonglinlu;https://linny2002.github.io/linny.github.io/;;https://wu-zhili.github.io/;https://github.com/kijlk;https://weikai-li.github.io;;https://github.com/alpc43;;;https://scholar.google.com/citations?user=A7KHQ6YAAAAJ&hl=en&oi=sra;http://entslscheia.github.io;https://yaoyuanthu.github.io/;https://www.stingning.cn/;https://www.cs.tsinghua.edu.cn/csen/info/1305/4466.htm;http://nlp.csai.tsinghua.edu.cn/~lzy;;;", "dblp": "239/6130.html;03/2015;296/1838;229/2976;321/0309;;69/7742-15;134/4025-2;;;;;302/4421;172/9996;349/5224;;;;;;349/5606;157/3533-2;04/606;199/8788.html;;190/7770.html;20/6480-2;15/4208-16;;;32/5685-1;53/3245-1;;;", "google_scholar": "https://scholar.google.com.tw/citations?hl=zh-CN;DjpXXZkAAAAJ;https://scholar.google.nl/citations?user=HiR6VAsAAAAJ;lUfGROcAAAAJ;;rJzgbYQAAAAJ;2ry7XsgAAAAJ;B4LmHSUAAAAJ;https://scholar.google.com.hk/citations?user=RKyE8o0AAAAJ;;GpXP-a4AAAAJ;https://scholar.google.com/citations?hl=en;https://scholar.google.com/citations?hl=zh-CN;;2UKO_uYAAAAJ;;;;CkgiFxMAAAAJ;;Xxiwr8YAAAAJ;https://scholar.google.com/citations?hl=en;https://scholar.google.com/citations?hl=zh-CN;https://scholar.google.com/citations?view_op=list_works;;;A7KHQ6YAAAAJ;c5RwjjcAAAAJ;https://scholar.google.com.hk/citations?user=3NWfi3YAAAAJ;uZXQuYAAAAAJ;YnIq4hsAAAAJ;dT0v5u0AAAAJ;;;", "orcid": "0000-0003-3430-4048;0000-0002-5727-143X;0009-0008-0640-3413;;0009-0009-3681-1896;;0009-0006-7192-5790;0000-0002-0288-9283;0000-0003-3295-7758;0009-0009-5835-1587;;0000-0003-3471-0572;;;0009-0001-2404-0475;;0009-0004-2323-4464;;0000-0001-8665-2971;;;0000-0002-5801-9500;0000-0002-9044-2595;0000-0002-8104-9652;;0009-0005-0939-6990;0009-0009-4673-9824;;;;0000-0002-8907-3526;0000-0002-7709-2543;;;", "linkedin": ";xiaozhiwang098/?locale=en_US;;;;;;%E5%AD%90%E4%BF%8A-%E5%A7%9A-313188209/;;;;;;;;;;;;;;weikai-li;;https://cn.linkedin.com/in/%E5%BC%80%E8%83%9C-%E6%9B%BE-496566107;;;%E9%87%91%E9%91%AB-%E5%88%98-86aaa7211/;;;;;;;;", "or_profile": "~Jifan_Yu2;~Xiaozhi_Wang1;~Shangqing_Tu1;~Shulin_Cao1;~Daniel_Zhang-Li1;~Xin_Lv1;~Hao_Peng6;~Zijun_Yao2;~Xiaohan_Zhang6;~Hanming_Li1;~Chunyang_Li3;~Zheyuan_Zhang3;~Yushi_Bai1;~Yantao_Liu1;~Amy_Xin1;~Kaifeng_Yun2;~Linlu_GONG1;~Nianyi_Lin2;~Jianhui_Chen6;~Zhili_Wu1;~Yunjia_Qi1;~Weikai_Li2;~Yong_Guan2;~Kaisheng_Zeng1;~Ji_Qi2;~Hailong_Jin2;~Jinxin_Liu2;~Yu_Gu5;~Yuan_Yao12;~Ning_Ding5;~Lei_Hou2;~Zhiyuan_Liu1;~Xu_Bin1;~Jie_Tang1;~Juanzi_Li1", "aff": "Tsinghua University;Department of Computer Science and Technology, Tsinghua University;Tsinghua University;Tsinghua University;Tsinghua University;Zhipu AI;Tsinghua University;Department of Computer Science and Technology, Tsinghua University;Beijing Knowledge Atlas Technology Co., Ltd. 
;;Tsinghua University;Tsinghua University;Tsinghua University;University of Chinese Academy of Sciences;Tsinghua University;;Tsinghua University;Tsinghua University;Tsinghua University;, Tsinghua University;Tsinghua University;UCLA Computer Science Department, University of California, Los Angeles;Tsinghua University;Tsinghua University;;Tsinghua University;Tsinghua University;Ohio State University;National University of Singapore;Tsinghua University;Tsinghua University;Tsinghua University;;;", "aff_domain": "tsinghua.edu.cn;mails.tsinghua.edu.cn;mails.tsinghua.edu.cn;tsinghua.edu.cn;tsinghua.edu.cn;zhipuai.cn;tsinghua.edu.cn;cs.tsinghua.edu.cn;zhipuai.cn;;tsinghua.edu.cn;mails.tsinghua.edu.cn;tsinghua.edu.cn;ucas.ac.cn;cs.tsinghua.edu.cn;;tsinghua.edu.cn;tsinghua.edu.cn;cs.tsinghua.edu.cn;cs.tsinghua.edu.cn;tsinghua.edu.cn;cs.ucla.edu;tsinghua.edu.cn;tsinghua.edu.cn;;tsinghua.edu.cn;tsinghua.edu.cn;osu.edu;nus.edu;mail.tsinghua.edu.cn;tsinghua.edu.cn;tsinghua.edu.cn;;;", "position": "Postdoc;PhD student;PhD student;PhD student;PhD student;Researcher;PhD student;PhD student;Researcher;;Undergrad student;MS student;PhD student;MS student;MS student;;Undergrad student;Undergrad student;MS student;Undergrad student;PhD student;PhD student;Postdoc;PhD student;;Postdoc;PhD student;PhD student;Postdoc;Postdoc;Assistant Professor;Associate Professor;;;", "bibtex": "@inproceedings{\nyu2024kola,\ntitle={Ko{LA}: Carefully Benchmarking World Knowledge of Large Language Models},\nauthor={Jifan Yu and Xiaozhi Wang and Shangqing Tu and Shulin Cao and Daniel Zhang-Li and Xin Lv and Hao Peng and Zijun Yao and Xiaohan Zhang and Hanming Li and Chunyang Li and Zheyuan Zhang and Yushi Bai and Yantao Liu and Amy Xin and Kaifeng Yun and Linlu GONG and Nianyi Lin and Jianhui Chen and Zhili Wu and Yunjia Qi and Weikai Li and Yong Guan and Kaisheng Zeng and Ji Qi and Hailong Jin and Jinxin Liu and Yu Gu and Yuan Yao and Ning Ding and Lei Hou and Zhiyuan Liu and Xu Bin and Jie Tang and Juanzi Li},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=AqN23oqraW}\n}", "github": "", "project": "", "reviewers": "vPns;ryRT;VBLJ;1m8m", "pdf_size": 4664841, "rating": "5;6;8;8", "confidence": "2;4;2;4", "soundness": "2;3;3;4", "contribution": "2;2;4;3", "presentation": "2;3;3;4", "wc_summary": "77;47;124;120", "wc_strengths": "86;46;70;57", "wc_weaknesses": "124;82;46;57", "wc_questions": "60;198;22;34", "wc_review": "347;373;262;268", "wc_reply_reviewers": "116;0;13;0", "wc_reply_authors": "743;1173;331;362", "reply_reviewers": "1;0;1;0", "reply_authors": "2;2;1;1", "rating_avg": [ 6.75, 1.299038105676658 ], "confidence_avg": [ 3.0, 1.0 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 2.75, 0.82915619758885 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 92.0, 31.851216617265973 ], "wc_strengths_avg": [ 64.75, 14.922717580923388 ], "wc_weaknesses_avg": [ 77.25, 29.978117018918983 ], "wc_questions_avg": [ 78.5, 70.34735247328075 ], "wc_review_avg": [ 312.5, 48.427781283061066 ], "wc_reply_reviewers_avg": [ 32.25, 48.64347335460329 ], "wc_reply_authors_avg": [ 652.25, 341.6367771478943 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 35, 0 ], "corr_rating_confidence": 0.19245008972987526, "gs_citation": 129, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=13925067843687558202&as_sdt=2005&sciodt=0,5&hl=en", 
"gs_version_total": 5, "openreview": "https://openreview.net/forum?id=AqN23oqraW", "pdf": "https://openreview.net/pdf?id=AqN23oqraW", "email": "tsinghua.edu.cn;mails.tsinghua.edu.cn;mails.tsinghua.edu.cn;tsinghua.edu.cn;tsinghua.edu.cn;zhipuai.cn;tsinghua.edu.cn;cs.tsinghua.edu.cn;zhipuai.cn;;tsinghua.edu.cn;mails.tsinghua.edu.cn;tsinghua.edu.cn;ucas.ac.cn;cs.tsinghua.edu.cn;;tsinghua.edu.cn;tsinghua.edu.cn;cs.tsinghua.edu.cn;cs.tsinghua.edu.cn;tsinghua.edu.cn;cs.ucla.edu;tsinghua.edu.cn;tsinghua.edu.cn;;tsinghua.edu.cn;tsinghua.edu.cn;osu.edu;nus.edu;mail.tsinghua.edu.cn;tsinghua.edu.cn;tsinghua.edu.cn;;;", "author_num": 35, "aff_unique_index": "0;0;0;0;0;1;0;0;2;0;0;0;3;0;0;0;0;0;0;4;0;0;0;0;5;6;0;0;0", "aff_unique_norm": "Tsinghua University;Zhipu AI;Beijing Knowledge Atlas Technology Co., Ltd.;University of Chinese Academy of Sciences;University of California, Los Angeles;Ohio State University;National University of Singapore", "aff_unique_dep": ";;;;Computer Science Department;;", "aff_unique_url": "https://www.tsinghua.edu.cn;https://www.zhipu.ai;;http://www.ucas.ac.cn;https://www.ucla.edu;https://www.osu.edu;https://www.nus.edu.sg", "aff_unique_abbr": "THU;Zhipu AI;;UCAS;UCLA;OSU;NUS", "aff_campus_unique_index": "1", "aff_campus_unique": ";Los Angeles", "aff_country_unique_index": "0;0;0;0;0;0;0;0;0;0;0;0;0;0;0;0;0;0;0;1;0;0;0;0;1;2;0;0;0", "aff_country_unique": "China;United States;Singapore" }, { "id": "AqXzHRU2cs", "title": "Generative Pretrained Embedding and Hierarchical Representation to Unlock Human Rhythm in Activities of Daily Living", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Within the evolving landscape of smart homes, the precise recognition of daily living activities using ambient sensor data stands paramount. This paper not only aims to bolster existing algorithms by evaluating two distinct pretrained embeddings suited for ambient sensor activations but also introduces a novel hierarchical architecture. We delve into an architecture anchored on Transformer Decoder-based pre-trained embeddings, reminiscent of the GPT design, and contrast it with the previously established state-of-the-art (SOTA) ELMo embeddings for ambient sensors. Our proposed hierarchical structure leverages the strengths of each pre-trained embedding, enabling the discernment of activity dependencies and sequence order, thereby enhancing classification precision. To further refine recognition, we incorporate into our proposed architecture an hour-of-the-day embedding. Empirical evaluations underscore the preeminence of the Transformer Decoder embedding in classification endeavors. Additionally, our innovative hierarchical design significantly bolsters the efficacy of both pre-trained embeddings, notably in capturing inter-activity nuances. The integration of temporal aspects subtly but distinctively augments classification, especially for time-sensitive activities. 
In conclusion, our GPT-inspired hierarchical approach, infused with temporal insights, outshines the SOTA ELMo benchmark.", "keywords": "Embedding;Smart Homes;Transformers;Activity of Daily Living;Human activity Recognition", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/3a6f43f562afd48016b18299128ca7392f5e71bf.pdf", "author": "Damien Bouchabou;Sao Mai Nguyen", "authorids": "~Damien_Bouchabou1;~Sao_Mai_Nguyen1", "gender": "M;F", "homepage": ";http://nguyensmai.free.fr", "dblp": "183/0962;42/10546.html", "google_scholar": "https://scholar.google.fr/citations?user=vtUIdqgAAAAJ;https://scholar.google.fr/citations?user=ppPWNQoAAAAJ", "orcid": "0000-0003-3623-3626;0000-0003-0929-0019", "linkedin": "damien-bouchabou-5725329b/;", "or_profile": "~Damien_Bouchabou1;~Sao_Mai_Nguyen1", "aff": ";IMT Atlantique", "aff_domain": ";imt-atlantique.edu", "position": ";Associate Professor", "bibtex": "@misc{\nbouchabou2024generative,\ntitle={Generative Pretrained Embedding and Hierarchical Representation to Unlock Human Rhythm in Activities of Daily Living},\nauthor={Damien Bouchabou and Sao Mai Nguyen},\nyear={2024},\nurl={https://openreview.net/forum?id=AqXzHRU2cs}\n}", "github": "", "project": "", "reviewers": "e66t;dgfF;v1qx;wCG6", "site": "https://openreview.net/forum?id=AqXzHRU2cs", "pdf_size": 1600991, "rating": "3;5;5;6", "confidence": "5;3;3;4", "soundness": "2;2;3;3", "contribution": "2;2;2;2", "presentation": "3;2;3;3", "wc_summary": "128;42;25;45", "wc_strengths": "114;45;35;48", "wc_weaknesses": "348;78;115;50", "wc_questions": "99;58;4;95", "wc_review": "689;223;179;238", "wc_reply_reviewers": "0;0;0;68", "wc_reply_authors": "1678;374;816;965", "reply_reviewers": "0;0;0;1", "reply_authors": "4;2;1;4", "rating_avg": [ 4.75, 1.0897247358851685 ], "confidence_avg": [ 3.75, 0.82915619758885 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 60.0, 39.99374951164244 ], "wc_strengths_avg": [ 60.5, 31.26099806468117 ], "wc_weaknesses_avg": [ 147.75, 117.89057426274587 ], "wc_questions_avg": [ 64.0, 38.15101571387058 ], "wc_review_avg": [ 332.25, 207.1079126928761 ], "wc_reply_reviewers_avg": [ 17.0, 29.444863728670914 ], "wc_reply_authors_avg": [ 958.25, 468.95328925171214 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 2.75, 1.299038105676658 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.6225430174794673, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:P9XYffbs23cJ:scholar.google.com/&scioq=Generative+Pretrained+Embedding+and+Hierarchical+Representation+to+Unlock+Human+Rhythm+in+Activities+of+Daily+Living&hl=en&as_sdt=0,44", "gs_version_total": 0, "aff_unique_index": "0", "aff_unique_norm": "IMT Atlantique", "aff_unique_dep": "", "aff_unique_url": "https://www.imt-atlantique.fr", "aff_unique_abbr": "IMT Atlantique", "aff_country_unique_index": "0", "aff_country_unique": "France" }, { "id": "AqaFgmH87p", "title": "On the efficacy of group-wise clipping in differentially private optimization", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Recent advances have substantially improved the accuracy, memory cost, and training speed of differentially private (DP) deep learning, especially on large vision and language models with millions to billions of parameters. 
In this work, we thoroughly study the per-sample gradient clipping style, a key component in DP optimization. We show that different clipping styles have the same time complexity but instantiate an accuracy-memory trade-off: while the all-layer clipping (of coarse granularity) is the most prevalent and usually gives the best accuracy, it incurs heavier memory cost compared to other group-wise clipping, such as the layer-wise clipping (of finer granularity). We formalize this trade-off through our convergence theory and complexity analysis. Importantly, we demonstrate that the accuracy gap between group-wise clipping and all-layer clipping becomes smaller for larger models, while the memory advantage of the group-wise clipping remains. Consequently, the group-wise clipping allows DP optimization of large models to achieve high accuracy and low peak memory simultaneously.", "keywords": "deep learning;differential privacy;per-sample gradient clipping;optimization", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "Zhiqi Bu;Ruixuan Liu;Yu-Xiang Wang;Sheng Zha;George Karypis", "authorids": "~Zhiqi_Bu1;~Ruixuan_Liu2;~Yu-Xiang_Wang1;~Sheng_Zha1;~George_Karypis1", "gender": "M;F;;M;M", "homepage": "https://sites.google.com/view/zhiqi-bu;;http://www.cs.ucsb.edu/~yuxiangw/publications.html;https://github.com/szha;", "dblp": "245/2573;243/0195.html;62/1637-3.html;218/5471;", "google_scholar": "MEvTLxIAAAAJ;sXWB1UQAAAAJ;HGNZ1fkAAAAJ;;ElqwScwAAAAJ", "orcid": ";0000-0002-0823-3760;;;", "linkedin": ";;;shengzha/;", "or_profile": "~Zhiqi_Bu1;~Ruixuan_Liu2;~Yu-Xiang_Wang1;~Sheng_Zha1;~George_Karypis1", "aff": "Amazon;Emory University;UC Santa Barbara;Amazon;University of Minnesota, Minneapolis", "aff_domain": "amazon.com;emory.edu;ucsb.edu;amazon.com;umn.edu", "position": "Researcher;Postdoc;Assistant Professor;Researcher;Full Professor", "bibtex": "@misc{\nbu2024on,\ntitle={On the efficacy of group-wise clipping in differentially private optimization},\nauthor={Zhiqi Bu and Ruixuan Liu and Yu-Xiang Wang and Sheng Zha and George Karypis},\nyear={2024},\nurl={https://openreview.net/forum?id=AqaFgmH87p}\n}", "github": "", "project": "", "reviewers": "fLMf;yntr;nK9w;RBj1", "site": "https://openreview.net/forum?id=AqaFgmH87p", "pdf_size": 575557, "rating": "3;5;5;6", "confidence": "4;5;3;3", "soundness": "2;2;2;3", "contribution": "2;2;2;3", "presentation": "3;2;2;2", "wc_summary": "103;10;44;84", "wc_strengths": "50;26;56;49", "wc_weaknesses": "323;74;176;188", "wc_questions": "38;32;6;26", "wc_review": "514;142;282;347", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "771;258;389;383", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 4.75, 1.0897247358851685 ], "confidence_avg": [ 3.75, 0.82915619758885 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 60.25, 35.9887135085432 ], "wc_strengths_avg": [ 45.25, 11.431863365173676 ], "wc_weaknesses_avg": [ 190.25, 88.52224296751636 ], "wc_questions_avg": [ 25.5, 12.031209415515965 ], "wc_review_avg": [ 321.25, 133.6850309496168 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 450.25, 192.42839577359678 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 8, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.3458572319330373, "gs_citation": 0, "gs_cited_by_link": 
"https://scholar.google.com/scholar?q=related:W5QdxLU3BJYJ:scholar.google.com/&scioq=On+the+efficacy+of+group-wise+clipping+in+differentially+private+optimization&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;1;2;0;3", "aff_unique_norm": "Amazon;Emory University;University of California, Santa Barbara;University of Minnesota", "aff_unique_dep": "Amazon.com, Inc.;;;", "aff_unique_url": "https://www.amazon.com;https://www.emory.edu;https://www.ucsb.edu;https://www.minnesota.edu", "aff_unique_abbr": "Amazon;Emory;UCSB;UMN", "aff_campus_unique_index": "1;2", "aff_campus_unique": ";Santa Barbara;Minneapolis", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "Ar5g8fwnjV", "title": "HOVER: Hyperbolic Video-text Retrieval", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Retrieving complex videos with compositional actions is challenging but still with few attentions given. Existing video-text retrieval methods ignore the multi-level semantic structures between mono-action videos and complex compositional videos, e.g., one simultaneously containing \"sitting up\", \"opening door\", \"cooking food\", \"eating\", etc. In this paper, we propose to jointly embed videos and texts into a hyperbolic space where their hierarchical semantic relationships are explicitly encoded. Specifically, a video with action compositions is first decomposed longitudinally into an action tree with mono-action leaf or child nodes and increasingly complex parent nodes. Then, the is-a semantic relationship in videos/texts is represented in the hyperbolic space by employing hyperbolic norm constraints. These constraints ensure that parents have smaller norms than their children, thereby placing parents in higher hierarchical positions compared to their children. Additionally, their temporal relationship is captured by utilizing relative cosine distances within the hyperbolic space. Experimental results show that the proposed method substantially outperforms the Euclidean counterparts, especially when with a small training size. 
Further, the learned hyperbolic video-text embeddings well generalize to novel datasets containing complex videos with varied-level action compositions.", "keywords": "video-text retrieval;hyperbolic representation;multi-modal learning", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/c9125072ab7ed346d764aaa551029b6731e5cbd2.zip", "author": "Ruiqi Shi;Jun Wen;Wei Ji;Menglin Yang;Difei Gao;Roger Zimmermann", "authorids": "~Ruiqi_Shi1;~Jun_Wen1;~Wei_Ji1;~Menglin_Yang3;~Difei_Gao1;~Roger_Zimmermann1", "gender": "M;M;M;M;;M", "homepage": "https://github.com/UX404;https://jungel2star.github.io/;https://jiwei0523.github.io/;https://scholar.google.com/citations?user=KroqSRUAAAAJ&hl=en;;https://www.comp.nus.edu.sg/cs/bio/rogerz/", "dblp": "168/6384;;52/3220-8;249/8541-1;;79/1490", "google_scholar": ";https://scholar.google.com.hk/citations?user=Gw2ekPsAAAAJ;69OFB-AAAAAJ;KroqSRUAAAAJ;;https://scholar.google.com.tw/citations?user=IDREwXEAAAAJ", "orcid": "0009-0001-8850-040X;;0000-0002-8106-9768;0000-0003-2510-5282;;0000-0002-7410-2590", "linkedin": ";;;;;roger-zimmermann-76b56b6/", "or_profile": "~Ruiqi_Shi1;~Jun_Wen1;~Wei_Ji1;~Menglin_Yang3;~Difei_Gao1;~Roger_Zimmermann1", "aff": "The Chinese University of Hong Kong;Harvard University;Nanjing University;Yale University;;National University of Singapore", "aff_domain": "cuhk.edu.hk;harvard.edu;nju.edu.cn;yale.edu;;nus.edu.sg", "position": "PhD student;Postdoc;Associate Professor;Postdoc;;Full Professor", "bibtex": "@misc{\nshi2024hover,\ntitle={{HOVER}: Hyperbolic Video-text Retrieval},\nauthor={Ruiqi Shi and Jun Wen and Wei Ji and Menglin Yang and Difei Gao and Roger Zimmermann},\nyear={2024},\nurl={https://openreview.net/forum?id=Ar5g8fwnjV}\n}", "github": "", "project": "", "reviewers": "BhHY;MxoF;AjjV;P4PE", "site": "https://openreview.net/forum?id=Ar5g8fwnjV", "pdf_size": 1685266, "rating": "3;3;5;6", "confidence": "5;4;4;4", "soundness": "2;3;3;3", "contribution": "2;2;3;3", "presentation": "2;2;3;3", "wc_summary": "59;59;67;56", "wc_strengths": "16;23;71;130", "wc_weaknesses": "199;124;74;131", "wc_questions": "3;2;5;4", "wc_review": "277;208;217;321", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.25, 1.299038105676658 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 60.25, 4.085033659592048 ], "wc_strengths_avg": [ 60.0, 45.62345887808157 ], "wc_weaknesses_avg": [ 132.0, 44.4915722356493 ], "wc_questions_avg": [ 3.5, 1.118033988749895 ], "wc_review_avg": [ 255.75, 46.072632874625256 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": -0.5555555555555555, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:qFiorVCiE3cJ:scholar.google.com/&scioq=HOVER:+Hyperbolic+Video-text+Retrieval&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1;2;3;4", "aff_unique_norm": "Chinese University of Hong Kong;Harvard University;Nanjing University;Yale University;National University of Singapore", "aff_unique_dep": ";;;;", "aff_unique_url": 
"https://www.cuhk.edu.hk;https://www.harvard.edu;https://www.nju.edu.cn;https://www.yale.edu;https://www.nus.edu.sg", "aff_unique_abbr": "CUHK;Harvard;Nanjing U;Yale;NUS", "aff_campus_unique_index": "0", "aff_campus_unique": "Hong Kong SAR;", "aff_country_unique_index": "0;1;0;1;2", "aff_country_unique": "China;United States;Singapore" }, { "title": "FairTune: Optimizing Parameter Efficient Fine Tuning for Fairness in Medical Image Analysis", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19237", "id": "ArpwmicoYW", "author_site": "Raman Dutt, Ondrej Bohdal, Sotirios Tsaftaris, Timothy Hospedales", "tldr": "", "abstract": "Training models with robust group fairness properties is crucial in ethically sensitive application areas such as medical diagnosis. Despite the growing body of work aiming to minimise demographic bias in AI, this problem remains challenging. A key reason for this challenge is the fairness generalisation gap: High-capacity deep learning models can fit all training data nearly perfectly, and thus also exhibit perfect fairness during training. In this case, bias emerges only during testing when generalisation performance differs across sub-groups. This motivates us to take a bi-level optimisation perspective on fair learning: Optimising the learning strategy based on validation fairness. Specifically, we consider the highly effective workflow of adapting pre-trained models to downstream medical imaging tasks using parameter-efficient fine-tuning (PEFT) techniques. There is a trade-off between updating more parameters, enabling a better fit to the task of interest vs. fewer parameters, potentially reducing the generalisation gap. To manage this tradeoff, we propose FairTune, a framework to optimise the choice of PEFT parameters with respect to fairness. We demonstrate empirically that FairTune leads to improved fairness on a range of medical imaging datasets. The code is available at https://github.com/Raman1121/FairTune.", "keywords": "Fairness;PEFT;Hyperparameter Optimization;Medical Imaging", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/a2322b049ff04702f15e4a4262303a4eececd137.zip", "author": "Raman Dutt;Ondrej Bohdal;Sotirios A. Tsaftaris;Timothy Hospedales", "authorids": "~Raman_Dutt1;~Ondrej_Bohdal1;~Sotirios_A._Tsaftaris1;~Timothy_Hospedales1", "gender": "M;M;;M", "homepage": "https://ramandutt.super.site/;https://ondrejbohdal.github.io/;https://vios.science/;http://homepages.inf.ed.ac.uk/thospeda/", "dblp": "314/5918;267/5714.html;14/613;32/3545", "google_scholar": "wdmRaoUAAAAJ;aKppg0QAAAAJ;jC1uFnYAAAAJ;https://scholar.google.fr/citations?user=nHhtvqkAAAAJ", "orcid": ";;;0000-0003-4867-7486", "linkedin": "raman-dutt/;;;timothyhospedales/", "or_profile": "~Raman_Dutt1;~Ondrej_Bohdal1;~Sotirios_A._Tsaftaris1;~Timothy_Hospedales1", "aff": "University of Edinburgh, University of Edinburgh;University of Edinburgh;University of Edinburgh;Samsung AI Research Centre", "aff_domain": "ed.ac.uk;ed.ac.uk;ed.ac.uk;samsung.com", "position": "PhD student;PhD student;Professor in machine learning and computer vision;Principal Researcher", "bibtex": "@inproceedings{\ndutt2024fairtune,\ntitle={FairTune: Optimizing Parameter Efficient Fine Tuning for Fairness in Medical Image Analysis},\nauthor={Raman Dutt and Ondrej Bohdal and Sotirios A. 
Tsaftaris and Timothy Hospedales},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=ArpwmicoYW}\n}", "github": "", "project": "", "reviewers": "iDy7;XV7U;gkxu;Dgwu", "pdf_size": 849783, "rating": "6;6;6;6", "confidence": "3;3;4;3", "soundness": "3;3;3;3", "contribution": "3;4;3;3", "presentation": "3;3;3;3", "wc_summary": "50;79;93;62", "wc_strengths": "35;55;56;40", "wc_weaknesses": "117;118;347;22", "wc_questions": "38;3;82;94", "wc_review": "240;255;578;218", "wc_reply_reviewers": "148;0;0;0", "wc_reply_authors": "1069;414;1035;554", "reply_reviewers": "1;0;0;0", "reply_authors": "3;1;2;1", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 3.25, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 71.0, 16.355427233796124 ], "wc_strengths_avg": [ 46.5, 9.17877987534291 ], "wc_weaknesses_avg": [ 151.0, 119.68918079759757 ], "wc_questions_avg": [ 54.25, 36.196512262923896 ], "wc_review_avg": [ 322.75, 147.95501850224616 ], "wc_reply_reviewers_avg": [ 37.0, 64.08587988004847 ], "wc_reply_authors_avg": [ 768.0, 288.5316273825107 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.75, 0.82915619758885 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 20, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=9705834299251022485&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 8, "openreview": "https://openreview.net/forum?id=ArpwmicoYW", "pdf": "https://openreview.net/pdf?id=ArpwmicoYW", "email": "ed.ac.uk;ed.ac.uk;ed.ac.uk;samsung.com", "author_num": 4, "aff_unique_index": "0;0;0;1", "aff_unique_norm": "University of Edinburgh;Samsung", "aff_unique_dep": ";AI Research", "aff_unique_url": "https://www.ed.ac.uk;https://www.samsung.com/global/researchers/samsung-ai-research-centre/", "aff_unique_abbr": "Edinburgh;SARC", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;1", "aff_country_unique": "United Kingdom;South Korea" }, { "title": "What Algorithms can Transformers Learn? A Study in Length Generalization", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19236", "id": "AssIuHnmHX", "author_site": "Hattie Zhou, Arwen Bradley, Etai Littwin, Noam Razin, Omid Saremi, Joshua Susskind, Samy Bengio, Preetum Nakkiran", "tldr": "", "abstract": "Large language models exhibit surprising emergent generalization properties, yet also struggle on many simple reasoning tasks such as arithmetic and parity. In this work, we focus on length generalization, and we propose a unifying framework to understand when and how Transformers can be expected to length generalize on a given task. First, we show that there exist algorithmic tasks for which standard\ndecoder-only Transformers trained from scratch naturally exhibit strong length generalization. For these tasks, we leverage the RASP programming language (Weiss et al., 2021) to show that the correct algorithmic solution which solves the task can be represented by a simple Transformer. We thus propose the RASP-Generalization Conjecture: Transformers tend to learn a length-generalizing solution if there exists a short RASP-L program that works for all input lengths. We present empirical evidence to support the correlation between RASP-simplicity and generalization. 
We leverage our insights to give new scratchpad formats which yield strong length generalization on traditionally hard tasks (such as parity and addition), and we illustrate how scratchpad can hinder generalization when it increases the complexity of the corresponding RASP-L program. Overall, our work provides a novel perspective on the mechanisms of length generalization and the algorithmic capabilities of Transformers.", "keywords": "length generalization;systematic generalization;understanding;transformer;scratchpad;LLM;algorithmic reasoning", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Hattie Zhou;Arwen Bradley;Etai Littwin;Noam Razin;Omid Saremi;Joshua M. Susskind;Samy Bengio;Preetum Nakkiran", "authorids": "~Hattie_Zhou1;~Arwen_Bradley1;~Etai_Littwin1;~Noam_Razin1;~Omid_Saremi1;~Joshua_M._Susskind1;~Samy_Bengio1;~Preetum_Nakkiran1", "gender": "F;F;M;M;;M;M;", "homepage": "http://hattiezhou.com;;;https://noamrazin.github.io/;;http://www.apple.com;http://bengio.abracadoudou.com;http://preetum.nakkiran.org", "dblp": ";278/8216;;247/1241;;132/7797;b/SamyBengio;151/6343", "google_scholar": ";cxi6phoAAAAJ;NOVS7vwAAAAJ;tDsd50oAAAAJ;;Sv2TGqsAAAAJ;Vs-MdPcAAAAJ;zithBbUAAAAJ", "orcid": ";0000-0002-4086-217X;;;;;;", "linkedin": ";arwen-bradley-2084ba2b/;;;omidsaremi/;joshua-susskind-8ab2ab5/;bengio;", "or_profile": "~Hattie_Zhou1;~Arwen_Bradley1;~Etai_Littwin1;~Noam_Razin1;~Omid_Saremi1;~Joshua_M._Susskind1;~Samy_Bengio1;~Preetum_Nakkiran1", "aff": "University of Montreal;Apple;;Tel Aviv University;Apple;Apple;Apple;Apple", "aff_domain": "umontreal.ca;apple.com;;tau.ac.il;apple.com;apple.com;apple.com;apple.com", "position": "PhD student;Researcher;;PhD student;ML;Researcher;Senior Director;Principal Researcher", "bibtex": "@inproceedings{\nzhou2024what,\ntitle={What Algorithms can Transformers Learn? A Study in Length Generalization},\nauthor={Hattie Zhou and Arwen Bradley and Etai Littwin and Noam Razin and Omid Saremi and Joshua M. 
Susskind and Samy Bengio and Preetum Nakkiran},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=AssIuHnmHX}\n}", "github": "", "project": "", "reviewers": "q9T5;Ho88;LyN1;tXQ4", "pdf_size": 677257, "rating": "6;6;8;8", "confidence": "3;4;3;3", "soundness": "2;2;3;3", "contribution": "3;1;3;3", "presentation": "4;3;4;3", "wc_summary": "116;175;133;175", "wc_strengths": "199;18;64;37", "wc_weaknesses": "395;437;309;103", "wc_questions": "122;124;4;56", "wc_review": "832;754;510;371", "wc_reply_reviewers": "618;570;0;55", "wc_reply_authors": "2713;2623;534;774", "reply_reviewers": "3;2;0;1", "reply_authors": "8;6;1;2", "rating_avg": [ 7.0, 1.0 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.5, 0.8660254037844386 ], "presentation_avg": [ 3.5, 0.5 ], "wc_summary_avg": [ 149.75, 25.955490748587284 ], "wc_strengths_avg": [ 79.5, 70.9031028940201 ], "wc_weaknesses_avg": [ 311.0, 128.64680330268607 ], "wc_questions_avg": [ 76.5, 50.00749943758436 ], "wc_review_avg": [ 616.75, 185.03969168802675 ], "wc_reply_reviewers_avg": [ 310.75, 284.4234299420496 ], "wc_reply_authors_avg": [ 1661.0, 1011.0694832700668 ], "reply_reviewers_avg": [ 1.5, 1.118033988749895 ], "reply_authors_avg": [ 4.25, 2.8613807855648994 ], "replies_avg": [ 31, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 132, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=15771874752676632675&as_sdt=20000005&sciodt=0,21&hl=en", "gs_version_total": 7, "openreview": "https://openreview.net/forum?id=AssIuHnmHX", "pdf": "https://openreview.net/pdf?id=AssIuHnmHX", "email": "umontreal.ca;apple.com;;tau.ac.il;apple.com;apple.com;apple.com;apple.com", "author_num": 8, "aff_unique_index": "0;1;2;1;1;1;1", "aff_unique_norm": "University of Montreal;Apple;Tel Aviv University", "aff_unique_dep": ";Apple Inc.;", "aff_unique_url": "https://wwwumontreal.ca;https://www.apple.com;https://www.tau.ac.il", "aff_unique_abbr": "UM;Apple;TAU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;2;1;1;1;1", "aff_country_unique": "Canada;United States;Israel" }, { "id": "AtLW9HU3bo", "title": "Discovering the question-critical moments: Towards building event-aware multi-modal large language models for complex video question answering", "track": "main", "status": "Reject", "tldr": "", "abstract": "Recently, Multi-modal Large Language Models (MLLM) have demonstrated impressive capabilities in image-language reasoning tasks like Image Question Answering. However, naively transferring them to complex Video Question Answering (VideoQA) tasks suffers from unsatisfactory causal-temporal reasoning capabilities. Existing methods simply concatenate the uniformly sampled frame representations to obtain the video representation, which either results in a quite large number of visual tokens and is thus resource-demanding, or is distracted by the redundancy of question-irrelevant contents. In light of this, we introduce E-STR, extending MLLM to be Event-aware for Spatial-Temporal Reasoning in complex VideoQA tasks. Specifically, we propose a differentiable question-critical keyframes retriever to adaptively select the question-critical moments in the video serving as the key event for spatial-temporal reasoning, and a general context encoder to encode the unselected parts for preserving the general contexts of the video. 
To facilitate the acquisition of spatial-temporal representations, we also incorporate lightweight adapters within the frozen image encoder. Extensive experiments on three large-scale benchmarks, including NExT-QA, Causal-VidQA, and STAR, all of which are notable for complex causal-temporal reasoning within long videos containing multiple objects and events, show that our method achieves better performance than existing state-of-the-art methods.", "keywords": "multi-modal learning; video question answering; video-language reasoning; multi-modal large language models", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Haibo Wang;Weifeng Ge", "authorids": "~Haibo_Wang8;~Weifeng_Ge2", "gender": "M;M", "homepage": "http://www.weifengge.net/;https://whb139426.github.io/", "dblp": "155/3277.html;", "google_scholar": "wFs402oAAAAJ;", "orcid": "0000-0002-6258-6225;", "linkedin": ";", "or_profile": "~Weifeng_Ge2;~wang_haibo1", "aff": "Fudan University;Fudan University", "aff_domain": "fudan.edu.cn;fudan.edu.cn", "position": "Assistant Professor;MS student", "bibtex": "@misc{\nwang2024discovering,\ntitle={Discovering the question-critical moments: Towards building event-aware multi-modal large language models for complex video question answering},\nauthor={Haibo Wang and Weifeng Ge},\nyear={2024},\nurl={https://openreview.net/forum?id=AtLW9HU3bo}\n}", "github": "", "project": "", "reviewers": "zSXn;92w2;bWa6;xUFv", "site": "https://openreview.net/forum?id=AtLW9HU3bo", "pdf_size": 2567826, "rating": "3;5;5;5", "confidence": "4;5;4;5", "soundness": "2;3;2;3", "contribution": "2;2;3;2", "presentation": "2;3;3;3", "wc_summary": "48;43;72;79", "wc_strengths": "51;68;26;16", "wc_weaknesses": "52;255;194;66", "wc_questions": "491;64;4;53", "wc_review": "642;430;296;214", "wc_reply_reviewers": "394;0;0;0", "wc_reply_authors": "2072;1564;1163;785", "reply_reviewers": "1;0;0;0", "reply_authors": "3;2;2;1", "rating_avg": [ 4.5, 0.8660254037844386 ], "confidence_avg": [ 4.5, 0.5 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 60.5, 15.305227865013967 ], "wc_strengths_avg": [ 40.25, 20.474068965401088 ], "wc_weaknesses_avg": [ 141.75, 85.65738438686999 ], "wc_questions_avg": [ 153.0, 196.4471939224381 ], "wc_review_avg": [ 395.5, 161.86027925343512 ], "wc_reply_reviewers_avg": [ 98.5, 170.6070045455344 ], "wc_reply_authors_avg": [ 1396.0, 477.7054531821884 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 2.0, 0.7071067811865476 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.5773502691896257, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:-dsdYw20C_YJ:scholar.google.com/&scioq=Discovering+the+question-critical+moments:+Towards+building+event-aware+multi-modal+large+language+models+for+complex+video+question+answering&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "Fudan University", "aff_unique_dep": "", "aff_unique_url": "https://www.fudan.edu.cn", "aff_unique_abbr": "Fudan", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "China" }, { "id": "AwX6ON5A0V", "title": "On Gaussian Mixture Models", "track": "main", "status": "Reject", "tldr": "", "abstract": "We investigate the sample complexity of Gaussian mixture 
models (GMMs). Our results provide the optimal upper bound, in the context of uniform spherical Gaussian mixtures. Furthermore, we highlight the relationship between the sample complexity of GMMs and the distribution of spacings among their means.", "keywords": "GMM;Machin learning", "primary_area": "learning theory", "supplementary_material": "/attachment/df7f47a1abe5a623c7c7f2ef3f2d1c684870b150.pdf", "author": "Farzad Aryan", "authorids": "~Farzad_Aryan1", "gender": "M", "homepage": "", "dblp": "", "google_scholar": "", "orcid": "0000-0002-0700-9281", "linkedin": "", "or_profile": "~Farzad_Aryan1", "aff": "", "aff_domain": "", "position": "", "bibtex": "@misc{\naryan2024on,\ntitle={On Gaussian Mixture Models},\nauthor={Farzad Aryan},\nyear={2024},\nurl={https://openreview.net/forum?id=AwX6ON5A0V}\n}", "github": "", "project": "", "reviewers": "EBv4;xe5T;Ywzd;DCj7;WTMq", "site": "https://openreview.net/forum?id=AwX6ON5A0V", "pdf_size": 211113, "rating": "3;3;3;5;6", "confidence": "5;4;3;2;3", "soundness": "4;2;2;3;3", "contribution": "1;2;1;2;3", "presentation": "2;1;1;3;2", "wc_summary": "167;85;111;174;285", "wc_strengths": "21;35;11;76;6", "wc_weaknesses": "133;364;208;33;14", "wc_questions": "39;153;54;30;303", "wc_review": "360;637;384;313;608", "wc_reply_reviewers": "208;47;0;21;131", "wc_reply_authors": "800;804;734;548;811", "reply_reviewers": "1;1;0;1;1", "reply_authors": "1;1;1;1;2", "rating_avg": [ 4.0, 1.2649110640673518 ], "confidence_avg": [ 3.4, 1.019803902718557 ], "soundness_avg": [ 2.8, 0.7483314773547882 ], "contribution_avg": [ 1.8, 0.7483314773547883 ], "presentation_avg": [ 1.8, 0.7483314773547883 ], "wc_summary_avg": [ 164.4, 68.99159369082584 ], "wc_strengths_avg": [ 29.8, 25.134836382996408 ], "wc_weaknesses_avg": [ 150.4, 127.77574104656956 ], "wc_questions_avg": [ 115.8, 103.44737792713742 ], "wc_review_avg": [ 460.4, 134.6233263591418 ], "wc_reply_reviewers_avg": [ 81.4, 77.3888880912499 ], "wc_reply_authors_avg": [ 739.4, 99.63453216631271 ], "reply_reviewers_avg": [ 0.8, 0.4 ], "reply_authors_avg": [ 1.2, 0.4 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 1, 0 ], "corr_rating_confidence": -0.6201736729460422, "gs_citation": 3649, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12581175277722921512&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 12 }, { "id": "AweVGJeW47", "title": "Smoothing for exponential family dynamical systems", "track": "main", "status": "Reject", "tldr": "", "abstract": "State-space modeling is a powerful technique for the analysis of spatiotemporal structures of time series. However, when assumptions about linearity or Gaussianity are violated, statistical inference about the latent process is challenging. While variational inference can be used to approximate the posterior in these nonlinear or non-Gaussian settings, it is desirable to preserve the temporal structure of the true posterior in the variational approximation, while ensuring inference scales linearly in sequence length. We propose a new structured variational approximation that satisfies these desiderata. Furthermore, by generalizing to *exponential family dynamical systems*, we are able to develop decoupled second order inference algorithms that have simple updates, without increased computational complexity. Then, we extend our insights and develop the *auto-encoding backward factorized smoother*, making it easy to leverage modern deep learning tools. 
For settings where a sequential inference algorithm may be more appropriate, we also present the *variational Bryson-Frazier* algorithm, by developing a new backward smoothing objective. We compare against various inference algorithms for state-space models, and validate the theory presented through numerical experiments.", "keywords": "state space model;bayesian inference;time-series;variational inference", "primary_area": "probabilistic methods (Bayesian methods, variational inference, sampling, UQ, etc.)", "supplementary_material": "", "author": "Matthew Dowling;Yuan Zhao;Il Memming Park", "authorids": "~Matthew_Dowling2;~Yuan_Zhao1;~Il_Memming_Park1", "gender": "M;;M", "homepage": ";;http://catniplab.github.io/", "dblp": ";65/2105-4;00/4652-2", "google_scholar": "https://scholar.google.com/citations?hl=en;XLpD5N0AAAAJ;CsmltusAAAAJ", "orcid": ";0000-0002-6123-8579;0000-0002-4255-7750", "linkedin": ";;memming/", "or_profile": "~Matthew_Dowling2;~Yuan_Zhao1;~Il_Memming_Park1", "aff": "State University of New York, Stony Brook;National Institute of Mental Health;Champalimaud Centre for the Unknown", "aff_domain": "stonybrook.edu;nih.gov;fchampalimaud.org", "position": "PhD student;Researcher;Associate Professor", "bibtex": "@misc{\ndowling2024smoothing,\ntitle={Smoothing for exponential family dynamical systems},\nauthor={Matthew Dowling and Yuan Zhao and Il Memming Park},\nyear={2024},\nurl={https://openreview.net/forum?id=AweVGJeW47}\n}", "github": "", "project": "", "reviewers": "CGvB;vygh;pQjy", "site": "https://openreview.net/forum?id=AweVGJeW47", "pdf_size": 6330847, "rating": "5;5;6", "confidence": "4;3;2", "soundness": "3;3;3", "contribution": "2;2;3", "presentation": "3;3;3", "wc_summary": "66;255;121", "wc_strengths": "70;82;98", "wc_weaknesses": "215;119;1190", "wc_questions": "150;82;496", "wc_review": "501;538;1905", "wc_reply_reviewers": "122;0;0", "wc_reply_authors": "366;503;1462", "reply_reviewers": "1;0;0", "reply_authors": "2;1;2", "rating_avg": [ 5.333333333333333, 0.4714045207910317 ], "confidence_avg": [ 3.0, 0.816496580927726 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 147.33333333333334, 79.37393918801197 ], "wc_strengths_avg": [ 83.33333333333333, 11.469767022723502 ], "wc_weaknesses_avg": [ 508.0, 483.8367493277045 ], "wc_questions_avg": [ 242.66666666666666, 181.27204846736728 ], "wc_review_avg": [ 981.3333333333334, 653.3056116567668 ], "wc_reply_reviewers_avg": [ 40.666666666666664, 57.51135153650587 ], "wc_reply_authors_avg": [ 777.0, 487.58657350942985 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 1.6666666666666667, 0.4714045207910317 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.8660254037844385, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:iuYJtriE0NEJ:scholar.google.com/&scioq=Smoothing+for+exponential+family+dynamical+systems&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;1;2", "aff_unique_norm": "State University of New York;National Institute of Mental Health;Champalimaud Centre for the Unknown", "aff_unique_dep": ";;", "aff_unique_url": "https://www.stonybrook.edu;https://www.nimh.nih.gov;https://www.champalimaud.org", "aff_unique_abbr": "SUNY Stony Brook;NIMH;CCU", "aff_campus_unique_index": "0", "aff_campus_unique": "Stony Brook;", "aff_country_unique_index": "0;0;1", "aff_country_unique": "United 
States;Portugal" }, { "id": "AwfPDjuWPu", "title": "Supervision for Free: Enhancing Depth Estimation for Ground Robots Based on Supervision from Mono Camera Model Parameters", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Depth estimation is a critical topic for robotics and vision-related tasks. In monocular depth estimation, in comparison with supervised learning that requires expensive ground truth labeling, self-supervised methods possess great potential due to no labeling cost. However, self-supervised learning still has a large gap with supervised learning in depth estimation performance. Meanwhile, scaling is also a major issue for monocular unsupervised depth estimation, which commonly still needs ground truth scale from GPS, LiDAR, or existing maps to correct. In deep learning era, while existing methods mainly rely on the exploration of image relationships to train the unsupervised neural networks, fundamental information provided by the camera itself has been generally ignored, which can provide extensive supervision information for free, without the need for any extra equipment to provide supervision signals. Utilizing the camera itself's intrinsics and extrinsics, depth information can be calculated for ground regions and regions connecting ground based on physical principles, providing free supervision information without any other sensors. The method is easy to realize and can be a component to enhance the effects of all the unsupervised methods.", "keywords": "Depth Estimation;Camera Model;Unsupervised Learning", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Praveen Praveen Kamasani;Jinchang Zhang;Xue Iuan Wong;Guoyu Lu", "authorids": "praveenkumarreddy.kamasani@uga.edu;jz23267@uga.edu;xwong@ford.com;~Guoyu_Lu4", "gender": ";;;M", "homepage": ";;;https://engineering.uga.edu/people/profile/guoyu-lu-ph.d", "dblp": ";;;120/8962.html", "google_scholar": ";;;", "orcid": ";;;", "linkedin": ";;;", "or_profile": "praveenkumarreddy.kamasani@uga.edu;jz23267@uga.edu;xwong@ford.com;~Guoyu_Lu4", "aff": ";;;University of Georgia", "aff_domain": ";;;uga.edu", "position": ";;;Assistant Professor", "bibtex": "@misc{\nkamasani2024supervision,\ntitle={Supervision for Free: Enhancing Depth Estimation for Ground Robots Based on Supervision from Mono Camera Model Parameters},\nauthor={Praveen Praveen Kamasani and Jinchang Zhang and Xue Iuan Wong and Guoyu Lu},\nyear={2024},\nurl={https://openreview.net/forum?id=AwfPDjuWPu}\n}", "github": "", "project": "", "reviewers": "", "site": "https://openreview.net/forum?id=AwfPDjuWPu", "pdf_size": 0, "rating": "", "confidence": "", "soundness": "", "contribution": "", "presentation": "", "wc_summary": "", "wc_strengths": "", "wc_weaknesses": "", "wc_questions": "", "wc_review": "", "wc_reply_reviewers": "", "wc_reply_authors": "", "reply_reviewers": "", "reply_authors": "", "rating_avg": [ 0, 0 ], "confidence_avg": [ 0, 0 ], "soundness_avg": [ 0, 0 ], "contribution_avg": [ 0, 0 ], "presentation_avg": [ 0, 0 ], "wc_summary_avg": [ 0, 0 ], "wc_strengths_avg": [ 0, 0 ], "wc_weaknesses_avg": [ 0, 0 ], "wc_questions_avg": [ 0, 0 ], "wc_review_avg": [ 0, 0 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 0, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0, "gs_citation": 0, "gs_cited_by_link": 
"https://scholar.google.com/scholar?q=related:lKg3a3hRPMkJ:scholar.google.com/&scioq=Supervision+for+Free:+Enhancing+Depth+Estimation+for+Ground+Robots+Based+on+Supervision+from+Mono+Camera+Model+Parameters&hl=en&as_sdt=0,23", "gs_version_total": 0, "aff_unique_index": "0", "aff_unique_norm": "University of Georgia", "aff_unique_dep": "", "aff_unique_url": "https://www.uga.edu", "aff_unique_abbr": "UGA", "aff_country_unique_index": "0", "aff_country_unique": "United States" }, { "title": "Function Vectors in Large Language Models", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19235", "id": "AwyxtyMwaG", "author_site": "Eric Todd, Millicent Li, Arnab Sen Sharma, Aaron Mueller, Byron Wallace, David Bau", "tldr": "", "abstract": "We report the presence of a simple neural mechanism that represents an input-output function as a vector within autoregressive transformer language models (LMs). Using causal mediation analysis on a diverse range of in-context-learning (ICL) tasks, we find that a small number attention heads transport a compact representation of the demonstrated task, which we call a function vector (FV). FVs are robust to changes in context, i.e., they trigger execution of the task on inputs such as zero-shot and natural text settings that do not resemble the ICL contexts from which they are collected. We test FVs across a range of tasks, models, and layers and find strong causal effects across settings in middle layers. We investigate the internal structure of FVs and find while that they often contain information that encodes the output space of the function, this information alone is not sufficient to reconstruct an FV. Finally, we test semantic vector composition in FVs, and find that to some extent they can be summed to create vectors that trigger new complex tasks. 
Our findings show that compact, causal internal vector representations of function abstractions can be explicitly extracted from LLMs.", "keywords": "In-Context Learning;Interpretability", "primary_area": "visualization or interpretation of learned representations", "supplementary_material": "/attachment/1a5822915a221c66a406c73d840b166f3d523440.zip", "author": "Eric Todd;Millicent Li;Arnab Sen Sharma;Aaron Mueller;Byron C Wallace;David Bau", "authorids": "~Eric_Todd1;~Millicent_Li1;~Arnab_Sen_Sharma1;~Aaron_Mueller1;~Byron_C_Wallace1;~David_Bau1", "gender": "M;;M;M;M;M", "homepage": "https://ericwtodd.github.io/;http://millicentli.github.io/;https://arnab-api.github.io/;https://aaronmueller.github.io;http://www.byronwallace.com/;https://baulab.info/", "dblp": "162/6042;;254/2046;248/7949;00/8247;47/3614", "google_scholar": "o12WPZEAAAAJ;UZ1gBvAAAAAJ;https://scholar.google.com/citations?view_op=list_works;lhwxXg4AAAAJ;KTzRHmwAAAAJ;CYI6cKgAAAAJ", "orcid": "0009-0008-7858-4823;;0000-0002-0407-6526;;;0000-0003-1744-6765", "linkedin": "eric-w-todd/;;arnab-api/;aaron-m-mueller/;;david-bau-4b8130/", "or_profile": "~Eric_Todd1;~Millicent_Li1;~Arnab_Sen_Sharma1;~Aaron_Mueller1;~Byron_C_Wallace1;~David_Bau1", "aff": "Northeastern University;Northeastern University;Northeastern University;Technion - Israel Institute of Technology;Northeastern University;Northeastern University", "aff_domain": "northeastern.edu;neu.edu;northeasterd.edu;technion.ac.il;northeastern.edu;northeastern.edu", "position": "PhD student;PhD student;PhD student;Postdoc;Associate Professor;Assistant Professor", "bibtex": "@inproceedings{\ntodd2024function,\ntitle={Function Vectors in Large Language Models},\nauthor={Eric Todd and Millicent Li and Arnab Sen Sharma and Aaron Mueller and Byron C Wallace and David Bau},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=AwyxtyMwaG}\n}", "github": "", "project": "", "reviewers": "baEP;ZAgB;cNFK;9YEq", "pdf_size": 1768824, "rating": "6;6;6;6", "confidence": "3;2;3;4", "soundness": "3;3;2;3", "contribution": "3;4;3;2", "presentation": "3;3;3;3", "wc_summary": "43;81;74;177", "wc_strengths": "35;132;66;176", "wc_weaknesses": "314;168;224;223", "wc_questions": "103;45;5;583", "wc_review": "495;426;369;1159", "wc_reply_reviewers": "210;0;26;806", "wc_reply_authors": "632;522;878;1455", "reply_reviewers": "1;0;1;3", "reply_authors": "1;1;2;4", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 3.0, 0.7071067811865476 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 3.0, 0.7071067811865476 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 93.75, 50.14665990871177 ], "wc_strengths_avg": [ 102.25, 55.137895317104736 ], "wc_weaknesses_avg": [ 232.25, 52.356351095163234 ], "wc_questions_avg": [ 184.0, 232.98283198553494 ], "wc_review_avg": [ 612.25, 318.8035249177775 ], "wc_reply_reviewers_avg": [ 260.5, 325.1811033870203 ], "wc_reply_authors_avg": [ 871.75, 360.5637079629618 ], "reply_reviewers_avg": [ 1.25, 1.0897247358851685 ], "reply_authors_avg": [ 2.0, 1.224744871391589 ], "replies_avg": [ 21, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 147, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=3928477797104162619&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=AwyxtyMwaG", "pdf": "https://openreview.net/pdf?id=AwyxtyMwaG", "email": 
"northeastern.edu;neu.edu;northeasterd.edu;technion.ac.il;northeastern.edu;northeastern.edu", "author_num": 6, "aff_unique_index": "0;0;0;1;0;0", "aff_unique_norm": "Northeastern University;Technion - Israel Institute of Technology", "aff_unique_dep": ";", "aff_unique_url": "https://www.northeastern.edu;https://www.technion.ac.il/en/", "aff_unique_abbr": "NEU;Technion", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;1;0;0", "aff_country_unique": "United States;Israel" }, { "title": "Understanding Augmentation-based Self-Supervised Representation Learning via RKHS Approximation and Regression", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19234", "id": "Ax2yRhCQr1", "author_site": "Runtian Zhai, Bingbin Liu, Andrej Risteski, J Kolter, Pradeep K Ravikumar", "tldr": "", "abstract": "Data augmentation is critical to the empirical success of modern self-supervised representation learning, such as contrastive learning and masked language modeling.\nHowever, a theoretical understanding of the exact role of the augmentation remains limited.\nRecent work has built the connection between self-supervised learning and the approximation of the top eigenspace of a graph Laplacian operator, suggesting that learning a linear probe atop such representation can be connected to RKHS regression.\nBuilding on this insight, this work delves into a statistical analysis of augmentation-based pretraining.\nStarting from the isometry property, a geometric characterization of the target function given by the augmentation, we disentangle the effects of the model and the augmentation,\nand prove two generalization bounds that are free of model complexity.\nOur first bound works for an arbitrary encoder, and it is the sum of an estimation error bound incurred by fitting a linear probe, and an approximation error bound by RKHS approximation.\nOur second bound specifically addresses the case\nwhere the encoder extracts the top-d eigenspace of a finite-sample-based approximation of the underlying RKHS.\nA key ingredient in our analysis is the *augmentation complexity*,\nwhich we use to quantitatively compare different augmentations and analyze their impact on downstream performance.", "keywords": "Learning Theory;Representation Learning;Self-supervised Learning;Data Augmentation;RKHS Approximation;RKHS Regression", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/4cf1ef9bad03c678ea01d4aade8c0ae725a44312.zip", "author": "Runtian Zhai;Bingbin Liu;Andrej Risteski;J Zico Kolter;Pradeep Kumar Ravikumar", "authorids": "~Runtian_Zhai1;~Bingbin_Liu1;~Andrej_Risteski2;~J_Zico_Kolter1;~Pradeep_Kumar_Ravikumar1", "gender": "M;F;M;M;M", "homepage": "http://www.runtianzhai.com;https://clarabing.github.io/;;http://www.cs.cmu.edu/~pradeepr/;http://www.zicokolter.com", "dblp": "242/8411;222/1554;63/11143;94/3594;67/2526", "google_scholar": "EXd0ES8AAAAJ;2ud06rQAAAAJ;;https://scholar.google.com.tw/citations?user=Q4DTPw4AAAAJ;UXh1I6UAAAAJ", "orcid": "0000-0003-3332-3466;;;;", "linkedin": ";;;;", "or_profile": "~Runtian_Zhai1;~Bingbin_Liu1;~Andrej_Risteski2;~Pradeep_Kumar_Ravikumar1;~Zico_Kolter1", "aff": "Carnegie Mellon University;Carnegie Mellon University;Carnegie Mellon University;Carnegie Mellon University;Carnegie Mellon University", "aff_domain": "cmu.edu;cmu.edu;cmu.edu;cmu.edu;cmu.edu", "position": "PhD student;PhD student;Assistant Professor;Full 
Professor;Full Professor", "bibtex": "@inproceedings{\nzhai2024understanding,\ntitle={Understanding Augmentation-based Self-Supervised Representation Learning via {RKHS} Approximation and Regression},\nauthor={Runtian Zhai and Bingbin Liu and Andrej Risteski and J Zico Kolter and Pradeep Kumar Ravikumar},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=Ax2yRhCQr1}\n}", "github": "", "project": "", "reviewers": "kPdq;umfH;dUJ6;tXrm", "pdf_size": 650089, "rating": "5;6;8;8", "confidence": "2;3;4;3", "soundness": "2;3;3;3", "contribution": "2;3;3;4", "presentation": "2;2;3;2", "wc_summary": "111;113;234;57", "wc_strengths": "80;79;202;61", "wc_weaknesses": "426;155;474;85", "wc_questions": "48;275;744;576", "wc_review": "665;622;1654;779", "wc_reply_reviewers": "299;403;831;202", "wc_reply_authors": "912;797;1909;1544", "reply_reviewers": "1;1;2;1", "reply_authors": "3;1;5;2", "rating_avg": [ 6.75, 1.299038105676658 ], "confidence_avg": [ 3.0, 0.7071067811865476 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 3.0, 0.7071067811865476 ], "presentation_avg": [ 2.25, 0.4330127018922193 ], "wc_summary_avg": [ 128.75, 64.7857044416436 ], "wc_strengths_avg": [ 105.5, 56.224994441973934 ], "wc_weaknesses_avg": [ 285.0, 167.7065890178439 ], "wc_questions_avg": [ 410.75, 268.5045390677781 ], "wc_review_avg": [ 930.0, 421.9200161167991 ], "wc_reply_reviewers_avg": [ 433.75, 240.11390526164868 ], "wc_reply_authors_avg": [ 1290.5, 456.51095277112466 ], "reply_reviewers_avg": [ 1.25, 0.4330127018922193 ], "reply_authors_avg": [ 2.75, 1.479019945774904 ], "replies_avg": [ 23, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.816496580927726, "gs_citation": 16, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=2683750638215426254&as_sdt=5,34&sciodt=0,34&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=Ax2yRhCQr1", "pdf": "https://openreview.net/pdf?id=Ax2yRhCQr1", "email": "cmu.edu;cmu.edu;cmu.edu;cmu.edu;cmu.edu", "author_num": 5, "aff_unique_index": "0;0;0;0;0", "aff_unique_norm": "Carnegie Mellon University", "aff_unique_dep": "", "aff_unique_url": "https://www.cmu.edu", "aff_unique_abbr": "CMU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "Ax9cPWDKkR", "title": "Efficiently Quantifying Individual Agent Importance in Cooperative MARL", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Measuring the contribution of individual agents is challenging in cooperative multi-agent reinforcement learning (MARL). In cooperative MARL, team performance is typically inferred from a single shared global reward. Arguably, among the best current approaches to effectively measure individual agent contributions is to use Shapley values. However, calculating these values is expensive as the computational complexity grows exponentially with respect to the number of agents. In this paper, we adapt difference rewards into an efficient method for quantifying the contribution of individual agents, referred to as Agent Importance, offering a linear computational complexity relative to the number of agents. We show empirically that the computed values are strongly correlated with the true Shapley values, as well as the true underlying individual agent rewards, used as the ground truth in environments where these are available. 
We demonstrate how Agent Importance can be used to help study MARL systems by diagnosing algorithmic failures discovered in prior MARL benchmarking work. Our analysis illustrates Agent Importance as a valuable explainability component for future MARL benchmarks.", "keywords": "Multi-agent reinforcement learning;MARL;Evaluation;Credit assignment;Explainable AI", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/f7abce38ae16f8a8aa7c3a3d9588a41a7159e7b3.zip", "author": "Omayma Mahjoub;Ruan John de Kock;Siddarth Singh;Wiem Khlifi;Abidine Vall;Kale-ab Tessera;Rihab Gorsane;Arnu Pretorius", "authorids": "~Omayma_Mahjoub1;~Ruan_John_de_Kock1;~Siddarth_Singh2;~Wiem_Khlifi1;~Abidine_Vall1;~Kale-ab_Tessera1;~Rihab_Gorsane1;~Arnu_Pretorius1", "gender": "F;M;M;F;M;F;M;M", "homepage": ";;https://www.raillab.org/people#profile;;;;;https://www.kaleabtessera.com/", "dblp": "329/6292;;;;;;188/4368;284/8544", "google_scholar": ";jrYPOrsAAAAJ;RDxZpTwAAAAJ;;;;zZ6ydrAAAAAJ;EB5CtIYAAAAJ", "orcid": ";;0000-0002-3321-4959;;;;;", "linkedin": "omayma-mahjoub-35613b1a6/;ruan-de-kock/;https://za.linkedin.com/in/siddarthsingh1;wiem-khlifi/;abidine-vall-271b23109/;rihabgorsane/;arnupretorius/;kale-ab-tessera-013976101/", "or_profile": "~Omayma_Mahjoub1;~Ruan_John_de_Kock1;~Siddarth_Singh2;~Wiem_Khlifi1;~Abidine_Vall1;~Rihab_Gorsane1;~Arnu_Pretorius1;~Kale-ab_Abebe_Tessera1", "aff": "InstaDeep;InstaDeep;InstaDeep;InstaDeep;;;InstaDeep;University of Edinburgh", "aff_domain": "instadeep.com;instadeep.com;instadeep.com;instadeep.com;;;instadeep.com;ed.ac.uk", "position": "Researcher;Research Engineer;Researcher;Researcher;;;Researcher;PhD student", "bibtex": "@misc{\nmahjoub2024efficiently,\ntitle={Efficiently Quantifying Individual Agent Importance in Cooperative {MARL}},\nauthor={Omayma Mahjoub and Ruan John de Kock and Siddarth Singh and Wiem Khlifi and Abidine Vall and Kale-ab Tessera and Rihab Gorsane and Arnu Pretorius},\nyear={2024},\nurl={https://openreview.net/forum?id=Ax9cPWDKkR}\n}", "github": "", "project": "", "reviewers": "18rV;Vw4r;D2kb;HLQg", "site": "https://openreview.net/forum?id=Ax9cPWDKkR", "pdf_size": 1009679, "rating": "3;5;5;5", "confidence": "4;3;5;4", "soundness": "2;3;2;3", "contribution": "2;2;2;2", "presentation": "4;3;2;3", "wc_summary": "226;47;80;116", "wc_strengths": "113;36;147;74", "wc_weaknesses": "266;145;258;265", "wc_questions": "200;141;39;53", "wc_review": "805;369;524;508", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.5, 0.8660254037844386 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 3.0, 0.7071067811865476 ], "wc_summary_avg": [ 117.25, 67.36235966769573 ], "wc_strengths_avg": [ 92.5, 41.608292442733095 ], "wc_weaknesses_avg": [ 233.5, 51.188377587104675 ], "wc_questions_avg": [ 108.25, 65.83834369119563 ], "wc_review_avg": [ 551.5, 158.28534360451695 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 4, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=688138280485758688&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "aff_unique_index": "0;0;0;0;0;1", "aff_unique_norm": "InstaDeep;University of Edinburgh", "aff_unique_dep": ";", "aff_unique_url": 
"https://www.instadeep.com;https://www.ed.ac.uk", "aff_unique_abbr": "InstaDeep;Edinburgh", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "United Kingdom" }, { "id": "AxYTFpdlvj", "title": "Graph Decoding via Generalized Random Dot Product Graph", "track": "main", "status": "Reject", "tldr": "", "abstract": "Graph Neural Networks (GNNs) have established themselves as the state-of-the-art methodology for a multitude of graph-related tasks, including but not limited to link prediction, node clustering, and classification. Despite their efficacy, the performance of GNNs in encoder-decoder architectures is often constrained by the limitations inherent in traditional decoders, particularly in the reconstruction of adjacency matrices.\n\nIn this paper, we introduce a novel graph decoding approach through the use of the Generalized Random Dot Product Graph (GRDPG) as a generative model for graph decoding. This novel methodology enhances the performance of encoder-decoder architectures across a range of tasks, owing to GRDPG's better capability to capture structures embedded within adjacency matrices.\n\nTo evaluate our approach, we design a benchmark focused on graphs of varying sizes, thereby enriching the diversity of existing benchmarks for link prediction and node clustering tasks. Our experiments span a variety of tasks, encompassing both traditional benchmarks and specialized domains such as molecular graphs.\n\nThe empirical results show the capability of GRDPG on faithfully capturing properties of the original graphs while simultaneously improving the performance metrics of encoder-decoder architectures. By addressing the subtleties involved in adjacency matrix reconstruction, we elevate the overall performance of GNN-based architectures, rendering them more robust and versatile for a wide array of real-world applications, with special regard on molecular graphs.", "keywords": "graph autoencoders;inner dot product decoder;generalized random dot product;link prediction;node clustering;molecular graph", "primary_area": "learning on graphs and other geometries & topologies", "supplementary_material": "", "author": "Alvaro Ciudad Serrano;Zinnera Tariq;Stelina Tarasi;Alexis Molina", "authorids": "~Alvaro_Ciudad_Serrano1;~Zinnera_Tariq1;~Stelina_Tarasi1;~Alexis_Molina1", "gender": "M;F;M;F", "homepage": "https://www.linkedin.com/in/alvaro-ciudad/;;;", "dblp": ";;347/2305;", "google_scholar": ";;moyS0qgAAAAJ;", "orcid": ";;;", "linkedin": ";stelina-tarasi-93334b245;;zinnera-tariq-2a76a1213", "or_profile": "~Alvaro_Ciudad_Serrano1;~Stelina_Tarasi1;~Alexis_Molina1;~Zinnera_Tariq2", "aff": "Nostrum Biodiscovery;;Universidad Polit\u00e9cnica de Cataluna;Universitat Rovira i Virgili", "aff_domain": "nostrumbiodiscovery.com;;upc.edu;urv.cat", "position": "Researcher;;Associate Professor;MS student", "bibtex": "@misc{\nserrano2024graph,\ntitle={Graph Decoding via Generalized Random Dot Product Graph},\nauthor={Alvaro Ciudad Serrano and Zinnera Tariq and Stelina Tarasi and Alexis Molina},\nyear={2024},\nurl={https://openreview.net/forum?id=AxYTFpdlvj}\n}", "github": "", "project": "", "reviewers": "ggnG;AHQZ;hJLN;io5N", "site": "https://openreview.net/forum?id=AxYTFpdlvj", "pdf_size": 212635, "rating": "1;1;3;3", "confidence": "4;5;3;4", "soundness": "2;2;1;2", "contribution": "1;2;2;1", "presentation": "1;1;1;3", "wc_summary": "37;89;47;36", "wc_strengths": "20;26;32;7", "wc_weaknesses": "124;129;128;85", "wc_questions": 
"78;43;57;85", "wc_review": "259;287;264;213", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "127;147;89;391", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 2.0, 1.0 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 1.75, 0.4330127018922193 ], "contribution_avg": [ 1.5, 0.5 ], "presentation_avg": [ 1.5, 0.8660254037844386 ], "wc_summary_avg": [ 52.25, 21.649191670822262 ], "wc_strengths_avg": [ 21.25, 9.256754290786809 ], "wc_weaknesses_avg": [ 116.5, 18.282505298782223 ], "wc_questions_avg": [ 65.75, 16.69393602479655 ], "wc_review_avg": [ 255.75, 26.845623479442605 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 188.5, 118.75499989474127 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 10, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.7071067811865475, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:BdzUf5Xj7-QJ:scholar.google.com/&scioq=Graph+Decoding+via+Generalized+Random+Dot+Product+Graph&hl=en&as_sdt=0,10", "gs_version_total": 0, "aff_unique_index": "0;1;2", "aff_unique_norm": "Nostrum Biodiscovery;Universitat Polit\u00e8cnica de Catalunya;Universitat Rovira i Virgili", "aff_unique_dep": ";;", "aff_unique_url": "https://www.nostrumbiodiscovery.com/;https://www.upc.edu;https://www.urv.cat", "aff_unique_abbr": ";UPC;URV", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "Spain" }, { "title": "Symmetric Neural-Collapse Representations with Supervised Contrastive Loss: The Impact of ReLU and Batching", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19233", "id": "AyXIDfvYg8", "author_site": "Ganesh Ramachandra Kini, Vala Vakilian, Tina Behnia, Jaidev Gill, Christos Thrampoulidis", "tldr": "", "abstract": "Supervised contrastive loss (SCL) is a competitive and often superior alternative to the cross-entropy loss for classification. While prior studies have demonstrated that both losses yield symmetric training representations under balanced data, this symmetry breaks under class imbalances. This paper presents an intriguing discovery: the introduction of a ReLU activation at the final layer effectively restores the symmetry in SCL-learned representations. We arrive at this finding analytically, by establishing that the global minimizers of an unconstrained features model with SCL loss and entry-wise non-negativity constraints form an orthogonal frame. Extensive experiments conducted across various datasets, architectures, and imbalance scenarios corroborate our finding. Importantly, our experiments reveal that the inclusion of the ReLU activation restores symmetry without compromising test accuracy. This constitutes the first geometry characterization of SCL under imbalances. Additionally, our analysis and experiments underscore the pivotal role of batch selection strategies in representation geometry. 
By proving necessary and sufficient conditions for mini-batch choices that ensure invariant symmetric representations, we introduce batch-binding as an efficient strategy that guarantees these conditions hold.", "keywords": "Supervised contrastive learning;neural collapse;implicit bias;class imbalance", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/4ca8e27c93ca216bf6d3c929a8b4ff265f95c4a2.zip", "author": "Ganesh Ramachandra Kini;Vala Vakilian;Tina Behnia;Jaidev Gill;Christos Thrampoulidis", "authorids": "~Ganesh_Ramachandra_Kini1;~Vala_Vakilian2;~Tina_Behnia1;~Jaidev_Gill1;~Christos_Thrampoulidis1", "gender": "M;M;F;M;", "homepage": "https://sites.google.com/view/ganeshkini/home?authuser=0;;;https://jaidevgill.github.io/;https://sites.google.com/view/cthrampo/home", "dblp": "190/7705;326/5424;323/4405;349/4531;127/6532", "google_scholar": "https://scholar.google.com/citations?hl=en;;https://scholar.google.com/citations?hl=en;JHGm3eoAAAAJ;", "orcid": ";;;;", "linkedin": ";vala-vakilian-7516ab162/;;jaidev-gill/;", "or_profile": "~Ganesh_Ramachandra_Kini1;~Vala_Vakilian2;~Tina_Behnia1;~Jaidev_Gill1;~Christos_Thrampoulidis1", "aff": "University of California, Santa Barbara;University of British Columbia;University of British Columbia;University of British Columbia;University of British Columbia", "aff_domain": "ucsb.edu;ubc.ca;ubc.ca;ubc.ca;ubc.ca", "position": "PhD student;MS student;PhD student;Undergrad student;Assistant Professor", "bibtex": "@inproceedings{\nkini2024symmetric,\ntitle={Symmetric Neural-Collapse Representations with Supervised Contrastive Loss: The Impact of Re{LU} and Batching},\nauthor={Ganesh Ramachandra Kini and Vala Vakilian and Tina Behnia and Jaidev Gill and Christos Thrampoulidis},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=AyXIDfvYg8}\n}", "github": "", "project": "", "reviewers": "BEvk;ScWC;q7qd;PL8u", "pdf_size": 1269151, "rating": "5;6;6;6", "confidence": "3;4;4;4", "soundness": "4;3;4;4", "contribution": "2;2;3;2", "presentation": "4;3;3;4", "wc_summary": "525;67;92;96", "wc_strengths": "82;41;64;96", "wc_weaknesses": "530;127;85;209", "wc_questions": "210;4;18;38", "wc_review": "1347;239;259;439", "wc_reply_reviewers": "0;0;150;117", "wc_reply_authors": "1074;525;868;876", "reply_reviewers": "0;0;2;2", "reply_authors": "3;2;3;3", "rating_avg": [ 5.75, 0.4330127018922193 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 3.75, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 3.5, 0.5 ], "wc_summary_avg": [ 195.0, 190.8494170805874 ], "wc_strengths_avg": [ 70.75, 20.58367071248469 ], "wc_weaknesses_avg": [ 237.75, 174.524174543242 ], "wc_questions_avg": [ 67.5, 83.15497579820465 ], "wc_review_avg": [ 571.0, 454.743883961071 ], "wc_reply_reviewers_avg": [ 66.75, 67.76199155869018 ], "wc_reply_authors_avg": [ 835.75, 197.47705562925532 ], "reply_reviewers_avg": [ 1.0, 1.0 ], "reply_authors_avg": [ 2.75, 0.4330127018922193 ], "replies_avg": [ 23, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 1.0, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=15271411147837020711&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=AyXIDfvYg8", "pdf": "https://openreview.net/pdf?id=AyXIDfvYg8", "email": "ucsb.edu;ubc.ca;ubc.ca;ubc.ca;ubc.ca", 
"author_num": 5, "aff_unique_index": "0;1;1;1;1", "aff_unique_norm": "University of California, Santa Barbara;University of British Columbia", "aff_unique_dep": ";", "aff_unique_url": "https://www.ucsb.edu;https://www.ubc.ca", "aff_unique_abbr": "UCSB;UBC", "aff_campus_unique_index": "0", "aff_campus_unique": "Santa Barbara;", "aff_country_unique_index": "0;1;1;1;1", "aff_country_unique": "United States;Canada" }, { "title": "Learning Energy-Based Models by Cooperative Diffusion Recovery Likelihood", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19232", "id": "AyzkDpuqcl", "author_site": "yaxuan zhu, Jianwen Xie, Yingnian Wu, Ruiqi Gao", "tldr": "", "abstract": "Training energy-based models (EBMs) on high-dimensional data can be both challenging and time-consuming, and there exists a noticeable gap in sample quality between EBMs and other generative frameworks like GANs and diffusion models. To close this gap, inspired by the recent efforts of learning EBMs by maximimizing diffusion recovery likelihood (DRL), we propose cooperative diffusion recovery likelihood (CDRL), an effective approach to tractably learn and sample from a series of EBMs defined on increasingly noisy versons of a dataset, paired with an initializer model for each EBM. At each noise level, the two models are jointly estimated within a cooperative training framework: Samples from the initializer serve as starting points that are refined by a few MCMC sampling steps from the EBM. The EBM is then optimized by maximizing recovery likelihood, while the initializer model is optimized by learning from the difference between the refined samples and the initial samples. In addition, we made several practical designs for EBM training to further improve the sample quality. Combining these advances, we significantly boost the generation performance compared to existing EBM methods on CIFAR-10 and ImageNet 32x32. And we have shown that CDRL has great potential to largely reduce the sampling time. 
We also demonstrate the effectiveness of our models for several downstream tasks, including classifier-free guided generation, compositional generation, image inpainting and out-of-distribution detection.", "keywords": "Energy-based model;recovery-likelihood;cooperative learning", "primary_area": "generative models", "supplementary_material": "", "author": "Yaxuan Zhu;Jianwen Xie;Ying Nian Wu;Ruiqi Gao", "authorids": "~Yaxuan_Zhu1;~Jianwen_Xie1;~Ying_Nian_Wu1;~Ruiqi_Gao1", "gender": "M;;;F", "homepage": ";;;http://www.stat.ucla.edu/~ruiqigao/", "dblp": "289/6018;;;206/7084", "google_scholar": "EptgCGsAAAAJ;;;VdlgOXoAAAAJ", "orcid": ";;;", "linkedin": ";;;", "or_profile": "~Yaxuan_Zhu1;~Jianwen_Xie1;~Ying_Nian_Wu1;~Ruiqi_Gao1", "aff": "University of California, Los Angeles;;;Google", "aff_domain": "ucla.edu;;;google.com", "position": "PhD student;;;Researcher", "bibtex": "@inproceedings{\nzhu2024learning,\ntitle={Learning Energy-Based Models by Cooperative Diffusion Recovery Likelihood},\nauthor={Yaxuan Zhu and Jianwen Xie and Ying Nian Wu and Ruiqi Gao},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=AyzkDpuqcl}\n}", "github": "", "project": "", "reviewers": "S2Sh;nfgg;cEiK;KQ36;9dWK", "pdf_size": 23293565, "rating": "6;6;6;8;8", "confidence": "5;4;4;3;5", "soundness": "3;3;3;3;3", "contribution": "2;2;3;3;2", "presentation": "2;3;3;2;3", "wc_summary": "59;81;51;126;41", "wc_strengths": "6;81;63;53;63", "wc_weaknesses": "53;134;222;78;202", "wc_questions": "101;47;133;303;11", "wc_review": "219;343;469;560;317", "wc_reply_reviewers": "10;33;122;128;54", "wc_reply_authors": "1101;877;2174;1472;1055", "reply_reviewers": "1;1;1;1;1", "reply_authors": "4;4;5;3;3", "rating_avg": [ 6.8, 0.9797958971132712 ], "confidence_avg": [ 4.2, 0.7483314773547882 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.4, 0.4898979485566356 ], "presentation_avg": [ 2.6, 0.4898979485566356 ], "wc_summary_avg": [ 71.6, 30.223169919781743 ], "wc_strengths_avg": [ 53.2, 25.26974475533934 ], "wc_weaknesses_avg": [ 137.8, 66.32164051046989 ], "wc_questions_avg": [ 119.0, 101.21659942914502 ], "wc_review_avg": [ 381.6, 119.63878969631881 ], "wc_reply_reviewers_avg": [ 69.4, 47.520942751591114 ], "wc_reply_authors_avg": [ 1335.8, 461.65069045762294 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 3.8, 0.7483314773547882 ], "replies_avg": [ 31, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.21821789023599233, "gs_citation": 10, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12543544673887222111&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=AyzkDpuqcl", "pdf": "https://openreview.net/pdf?id=AyzkDpuqcl", "email": "ucla.edu;;;google.com", "author_num": 4, "aff_unique_index": "0;1", "aff_unique_norm": "University of California, Los Angeles;Google", "aff_unique_dep": ";Google", "aff_unique_url": "https://www.ucla.edu;https://www.google.com", "aff_unique_abbr": "UCLA;Google", "aff_campus_unique_index": "0;1", "aff_campus_unique": "Los Angeles;Mountain View", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "id": "B0OwtVEejJ", "title": "Weight-Entanglement Meets Gradient-Based Neural Architecture Search", "track": "main", "status": "Reject", "tldr": "", "abstract": "Weight sharing is a fundamental concept in neural architecture search (NAS), enabling gradient-based methods to explore cell-based architecture spaces 
significantly faster than traditional blackbox approaches. In parallel, weight entanglement has emerged as a technique for intricate parameter sharing among architectures within macro-level search spaces. Since weight-entanglement poses compatibility challenges for gradient-based NAS methods, these two paradigms have largely developed independently in parallel sub-communities. This paper aims to bridge the gap between these sub-communities by proposing a novel scheme to adapt gradient-based methods for weight-entangled spaces. This enables us to conduct an in-depth comparative assessment and analysis of the performance of gradient-based NAS in weight-entangled search spaces. Our findings reveal that this integration of weight-entanglement and gradient-based NAS brings forth the various benefits of gradient-based methods (enhanced performance, improved supernet training properties and superior any-time performance), while preserving the memory efficiency of weight-entangled spaces. The code for our work is openly accessible [here](https://anonymous.4open.science/r/TangleNAS-527C).", "keywords": "Neural Architecture Search;Transformers;Weight Entanglement", "primary_area": "optimization", "supplementary_material": "/attachment/8435a982dca96e5ef82ad8f0ea502014437a0691.pdf", "author": "Rhea Sanjay Sukthanker;Arjun Krishnakumar;Mahmoud Safari;Frank Hutter", "authorids": "~Rhea_Sanjay_Sukthanker3;~Arjun_Krishnakumar1;~Mahmoud_Safari1;~Frank_Hutter1", "gender": "F;M;M;M", "homepage": "https://rheasukthanker.github.io/;;https://ml.informatik.uni-freiburg.de/profile/safari/;http://ml.informatik.uni-freiburg.de/~hutter/", "dblp": "277/5077;312/6584;280/3542;89/5383", "google_scholar": "OsamqmMAAAAJ;;https://scholar.google.it/citations?user=ntPjyLwAAAAJ;https://scholar.google.de/citations?user=YUrxwrkAAAAJ", "orcid": ";;;0000-0002-2037-3694", "linkedin": "rhea-sukthanker-006502116/;arjun-krishnakumar-10235754/;;frank-hutter-9190b24b/", "or_profile": "~Rhea_Sanjay_Sukthanker3;~Arjun_Krishnakumar1;~Mahmoud_Safari1;~Frank_Hutter1", "aff": "University of Freiburg, Albert-Ludwigs-Universit\u00e4t Freiburg;University of Freiburg, Albert-Ludwigs-Universit\u00e4t Freiburg;Universit\u00e4t Freiburg;Albert-Ludwigs-Universit\u00e4t Freiburg", "aff_domain": "cs.uni-freiburg.de;cs.uni-freiburg.de;uni-freiburg.de;uni-freiburg.de", "position": "PhD student;Research Engineer;Postdoc;Full Professor", "bibtex": "@misc{\nsukthanker2024weightentanglement,\ntitle={Weight-Entanglement Meets Gradient-Based Neural Architecture Search},\nauthor={Rhea Sanjay Sukthanker and Arjun Krishnakumar and Mahmoud Safari and Frank Hutter},\nyear={2024},\nurl={https://openreview.net/forum?id=B0OwtVEejJ}\n}", "github": "", "project": "", "reviewers": "JeZf;wjLK;2nyZ;b7V3", "site": "https://openreview.net/forum?id=B0OwtVEejJ", "pdf_size": 1708412, "rating": "3;3;5;6", "confidence": "5;4;2;5", "soundness": "2;2;3;3", "contribution": "2;2;2;3", "presentation": "2;2;3;3", "wc_summary": "46;82;88;50", "wc_strengths": "27;63;91;33", "wc_weaknesses": "101;49;244;104", "wc_questions": "25;119;25;17", "wc_review": "199;313;448;204", "wc_reply_reviewers": "0;0;0;39", "wc_reply_authors": "738;1450;642;512", "reply_reviewers": "0;0;0;1", "reply_authors": "2;3;2;1", "rating_avg": [ 4.25, 1.299038105676658 ], "confidence_avg": [ 4.0, 1.224744871391589 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 66.5, 18.6748493969831 ], "wc_strengths_avg": [ 53.5, 
25.588083163847973 ], "wc_weaknesses_avg": [ 124.5, 72.37575560918172 ], "wc_questions_avg": [ 46.5, 41.98511641046146 ], "wc_review_avg": [ 291.0, 101.44703051346549 ], "wc_reply_reviewers_avg": [ 9.75, 16.887495373796554 ], "wc_reply_authors_avg": [ 835.5, 363.7344498394399 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 2.0, 0.7071067811865476 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.15713484026367722, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=7294994996214458888&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 6, "aff_unique_index": "0;0;0;1", "aff_unique_norm": "University of Freiburg;Albert-Ludwigs-Universit\u00e4t Freiburg", "aff_unique_dep": ";", "aff_unique_url": "https://www.uni-freiburg.de;https://www.uni-freiburg.de", "aff_unique_abbr": "UoF;Albert-Ludwigs-Universit\u00e4t", "aff_campus_unique_index": "0;0;0", "aff_campus_unique": "Freiburg;", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "Germany" }, { "id": "B0wJ5oCPdB", "title": "Chain-of-Symbol Prompting for Spatial Relationships in Large Language Models", "track": "main", "status": "Reject", "tldr": "", "abstract": "While conventional Chain-of-Thought prompting shows promising performance on various language tasks for LLMs, the spatial scenarios are nearly unexplored. In this paper, we first investigate the performance of LLMs on complex spatial planning and understanding tasks that require LLMs to understand a virtual spatial environment simulated via natural language and act or reason correspondingly in text. By evaluating on classic spatial planning scenarios through natural language descriptions, we found that current popular LLMs such as ChatGPT still lack the ability to handle spatial relationships in texts. This raises a question -- is natural language the best way to represent complex spatial environments for LLMs, or are other alternatives, such as symbolic representations, both more efficient and effective for LLMs? To this end, we propose a novel method called **CoS** (**C**hain-**o**f-**S**ymbol Prompting) that represents the spatial relationships with condensed symbols during the chained intermediate thinking steps. CoS is easy to use and does not need additional training on LLMs. Extensive experiments indicate that CoS clearly surpasses the performance of the Chain-of-Thought (CoT) Prompting described in natural language in all three spatial planning tasks and the existing spatial QA benchmark, with even fewer tokens used in the inputs compared with CoT. The performance gain is strong, by up to 60.8\\% accuracy (from 31.8\\% to 92.6\\%) on Brick World scenarios for ChatGPT.
CoS also reduces the number of tokens in the prompt obviously, by up to 65.8\\% of the tokens (from 407 to 139) for the intermediate steps from demonstrations on the Brick World task.", "keywords": "Large Language Models;Prompting;Spatial Planning;Reasoning", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Hanxu Hu;Hongyuan Lu;Huajian Zhang;Yun-Ze Song;Wai Lam;Yue Zhang", "authorids": "~Hanxu_Hu1;~Hongyuan_Lu2;~Huajian_Zhang1;~Yun-Ze_Song1;~Wai_Lam1;~Yue_Zhang7", "gender": "M;M;M;F;M;M", "homepage": "https://hanxuhu.github.io;https://dblp1.uni-trier.de/pid/139/4326.html;https://hjznlp.github.io/;https://yunzesong.github.io/;http://www.se.cuhk.edu.hk/~textmine;http://frcchang.github.io", "dblp": ";139/4326;;;48/1707;47/722-4", "google_scholar": "https://scholar.google.com.hk/citations?user=r9fCUd8AAAAJ;;niE2uWkAAAAJ;qOQwD7UAAAAJ;ewA4NAcAAAAJ;", "orcid": ";;;;;0000-0002-5214-2268", "linkedin": ";luke-lu-595b68136;huajian-zhang-64b213276/;;;", "or_profile": "~Hanxu_Hu1;~Hongyuan_Lu2;~Huajian_Zhang1;~Yun-Ze_Song1;~Wai_Lam1;~Yue_Zhang7", "aff": "University of Edinburgh;The Chinese University of Hong Kong;University of Edinburgh, University of Edinburgh;;The Chinese University of Hong Kong;Westlake University", "aff_domain": "inf.ed.ac.uk;cuhk.edu.hk;ed.ac.uk;;cuhk.edu.hk;westlake.edu.cn", "position": "MS student;Researcher;Vistor;;Professor;Full Professor", "bibtex": "@misc{\nhu2024chainofsymbol,\ntitle={Chain-of-Symbol Prompting for Spatial Relationships in Large Language Models},\nauthor={Hanxu Hu and Hongyuan Lu and Huajian Zhang and Yun-Ze Song and Wai Lam and Yue Zhang},\nyear={2024},\nurl={https://openreview.net/forum?id=B0wJ5oCPdB}\n}", "github": "", "project": "", "reviewers": "LjHX;c5jB;tveC;Doc8", "site": "https://openreview.net/forum?id=B0wJ5oCPdB", "pdf_size": 405509, "rating": "6;6;6;6", "confidence": "4;3;3;4", "soundness": "3;3;3;2", "contribution": "3;3;2;2", "presentation": "4;3;3;3", "wc_summary": "41;208;95;72", "wc_strengths": "26;30;73;29", "wc_weaknesses": "166;27;144;250", "wc_questions": "1;65;108;21", "wc_review": "234;330;420;372", "wc_reply_reviewers": "0;0;26;79", "wc_reply_authors": "298;262;833;543", "reply_reviewers": "0;0;1;1", "reply_authors": "1;1;2;1", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 104.0, 63.027771656627685 ], "wc_strengths_avg": [ 39.5, 19.397164741270824 ], "wc_weaknesses_avg": [ 146.75, 79.65354668814189 ], "wc_questions_avg": [ 48.75, 41.30602256330183 ], "wc_review_avg": [ 339.0, 68.47627326307996 ], "wc_reply_reviewers_avg": [ 26.25, 32.251937926270415 ], "wc_reply_authors_avg": [ 484.0, 228.6711612774991 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=13789758302587408119&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 0, "aff_unique_index": "0;1;0;1;2", "aff_unique_norm": "University of Edinburgh;Chinese University of Hong Kong;Westlake University", "aff_unique_dep": ";;", "aff_unique_url": "https://www.ed.ac.uk;https://www.cuhk.edu.hk;https://www.westlake.edu.cn", "aff_unique_abbr": "Edinburgh;CUHK;WU", "aff_campus_unique_index": "1;1", "aff_campus_unique": ";Hong Kong SAR", "aff_country_unique_index": 
"0;1;0;1;1", "aff_country_unique": "United Kingdom;China" }, { "id": "B1Tl99XWXC", "title": "Efficient Transfer Learning in Diffusion Models via Adversarial Noise", "track": "main", "status": "Reject", "tldr": "", "abstract": "Diffusion Probabilistic Models (DPMs) have demonstrated substantial promise in image generation tasks but heavily rely on the availability of large amounts of training data. Previous works, like GANs, have tackled the limited data problem by transferring pre-trained models learned with sufficient data. However, those methods are hard to be utilized in DPMs since the distinct differences between DPM-based and GAN-based methods, showing in the unique iterative denoising process integral and the need for many timesteps with no-targeted noise in DPMs. In this paper, we propose a novel DPMs-based transfer learning method, TAN, to address the limited data problem. It includes two strategies: similarity-guided training, which boosts transfer with a classifier, and adversarial noise selection which adaptive chooses targeted noise based on the input image. Extensive experiments in the context of few-shot image generation tasks demonstrate that our method is not only efficient but also excels in terms of image quality and diversity when compared to existing GAN-based and DDPM-based methods.", "keywords": "Transfer learning; Few Shot Image Generation; Diffusion model", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "/attachment/143e48c55f7fb3a45063c3662fb88cf75ce8f0d4.zip", "author": "Xiyu Wang;Baijiong Lin;Daochang Liu;Ying-Cong Chen;Chang Xu", "authorids": "~Xiyu_Wang2;~Baijiong_Lin1;~Daochang_Liu1;~Ying-Cong_Chen1;~Chang_Xu4", "gender": "M;M;M;M;", "homepage": ";https://baijiong-lin.github.io/;https://finspire13.github.io;https://www.yingcong.me/;https://sydney.edu.au/engineering/about/our-people/academic-staff/c-xu.html", "dblp": ";279/2950;222/2701;137/6578;97/2966-2", "google_scholar": ";KVdbYTYAAAAJ;https://scholar.google.com/citations?hl=en;https://scholar.google.com.hk/citations?user=n7j4bJUAAAAJ;N4F_3eoAAAAJ", "orcid": ";0000-0002-4257-0226;;;0000-0002-4756-0609", "linkedin": "%E6%9B%A6%E5%AE%87-%E7%8E%8B-66b6aa1b3/;;;;", "or_profile": "~Xiyu_Wang2;~Baijiong_Lin1;~Daochang_Liu1;~Ying-Cong_Chen1;~Charles_Xu1", "aff": "University of Sydney;The Hong Kong University of Science and Technology (Guangzhou);University of Sydney;Hong Kong University of Science and Technology;University of Sydney", "aff_domain": "usyd.edu.au;connect.hkust-gz.edu.cn;usyd.edu.au;hkust-gz.edu.cn;sydney.eud.au", "position": "PhD student;PhD student;Postdoc;Assistant Professor;Associate Professor", "bibtex": "@misc{\nwang2024efficient,\ntitle={Efficient Transfer Learning in Diffusion Models via Adversarial Noise},\nauthor={Xiyu Wang and Baijiong Lin and Daochang Liu and Ying-Cong Chen and Chang Xu},\nyear={2024},\nurl={https://openreview.net/forum?id=B1Tl99XWXC}\n}", "github": "", "project": "", "reviewers": "dyX4;ft3z;Pd9e;jP4S", "site": "https://openreview.net/forum?id=B1Tl99XWXC", "pdf_size": 14548603, "rating": "3;6;6;6", "confidence": "5;3;3;2", "soundness": "2;3;3;3", "contribution": "1;3;3;3", "presentation": "2;3;3;3", "wc_summary": "60;94;162;60", "wc_strengths": "36;39;142;19", "wc_weaknesses": "180;150;70;50", "wc_questions": "14;16;67;7", "wc_review": "290;299;441;136", "wc_reply_reviewers": "0;0;27;0", "wc_reply_authors": "1100;789;792;489", "reply_reviewers": "0;0;1;0", "reply_authors": "3;2;2;2", "rating_avg": [ 5.25, 
1.299038105676658 ], "confidence_avg": [ 3.25, 1.0897247358851685 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.8660254037844386 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 94.0, 41.641325627314025 ], "wc_strengths_avg": [ 59.0, 48.52319033204639 ], "wc_weaknesses_avg": [ 112.5, 54.025456962435776 ], "wc_questions_avg": [ 26.0, 23.90606617576384 ], "wc_review_avg": [ 291.5, 107.92242584375131 ], "wc_reply_reviewers_avg": [ 6.75, 11.691342951089922 ], "wc_reply_authors_avg": [ 792.5, 216.0329835927838 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 2.25, 0.4330127018922193 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.9271726499455307, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=11020171793380811836&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "aff_unique_index": "0;1;0;1;0", "aff_unique_norm": "University of Sydney;Hong Kong University of Science and Technology", "aff_unique_dep": ";", "aff_unique_url": "https://www.sydney.edu.au;https://www.ust.hk", "aff_unique_abbr": "USYD;HKUST", "aff_campus_unique_index": "1;2", "aff_campus_unique": ";Guangzhou;Hong Kong SAR", "aff_country_unique_index": "0;1;0;1;0", "aff_country_unique": "Australia;China" }, { "id": "B1VWS7ZRm6", "title": "On Transferring Expert Knowledge from Tabular Data to Images", "track": "main", "status": "Reject", "tldr": "", "abstract": "Transferring knowledge across modalities has gained considerable attention in machine learning. Expert knowledge in fields like medicine is often represented in tabular form, and transferring this information can enhance the comprehensiveness and accuracy of image-based learning. Unlike general knowledge reuse scenarios, tabular data is divided into numerical and categorical variables, with each column having a unique semantic meaning. In addition, not all columns can be accurately represented in images, making it challenging to determine \"how to reuse\" and \"which subset to reuse\". To address this, we propose a novel method called CHannel tAbulaR alignment with optiMal tranSport (CHARMS) that automatically and effectively transfers relevant tabular knowledge. Specifically, by maximizing the mutual information between a group of channels and tabular features, our method modifies the visual embedding and captures the semantics of tabular knowledge. The alignment between channels and attributes helps select the subset of tabular data which contains knowledge to images. 
Experimental results demonstrate that CHARMS effectively reuses tabular knowledge to improve the performance and interpretability of visual classifiers.", "keywords": "Multimodal Learning;Tabular Data;Missing Modality", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Jun-Peng Jiang;Han-Jia Ye;Leye Wang;Yang Yang;Yuan Jiang;De-Chuan Zhan", "authorids": "~Jun-Peng_Jiang2;~Han-Jia_Ye1;~Leye_Wang1;~Yang_Yang17;~Yuan_Jiang1;~De-Chuan_Zhan1", "gender": ";M;M;M;F;M", "homepage": "http://www.lamda.nju.edu.cn/jiangjp/;http://www.lamda.nju.edu.cn/yehj;https://wangleye.github.io/;http://www.njustkmg.cn/;http://lamda.nju.edu.cn/jiangy;http://www.lamda.nju.edu.cn/zhandc/", "dblp": "266/2867;165/3014;07/8764;48/450-74;;74/498", "google_scholar": "ZZ_7-TQAAAAJ;mgOYhtoAAAAJ;;_6NJip0AAAAJ;;mYJf4TcAAAAJ", "orcid": ";;;0000-0002-5245-3584;;0000-0002-3533-2078", "linkedin": ";;;;;", "or_profile": "~Jun-Peng_Jiang2;~Han-Jia_Ye1;~Leye_Wang1;~Yang_Yang17;~Yuan_Jiang1;~De-Chuan_Zhan1", "aff": "NanJing University;Nanjing University;Peking University;Nanjing University of Science and Technology;Nanjing University;Nanjing University", "aff_domain": "nju.edu.cn;nju.edu.cn;pku.edu.cn;njust.edu.cn;nju.edu.cn;nju.edu.cn", "position": "PhD student;Associate Professor;Assistant Professor;Full Professor;Full Professor;Full Professor", "bibtex": "@misc{\njiang2024on,\ntitle={On Transferring Expert Knowledge from Tabular Data to Images},\nauthor={Jun-Peng Jiang and Han-Jia Ye and Leye Wang and Yang Yang and Yuan Jiang and De-Chuan Zhan},\nyear={2024},\nurl={https://openreview.net/forum?id=B1VWS7ZRm6}\n}", "github": "", "project": "", "reviewers": "QrqR;63tZ;zSmg;UGYo", "site": "https://openreview.net/forum?id=B1VWS7ZRm6", "pdf_size": 2073529, "rating": "5;5;5;6", "confidence": "4;3;4;5", "soundness": "2;3;3;3", "contribution": "2;3;2;3", "presentation": "1;2;2;3", "wc_summary": "64;200;22;100", "wc_strengths": "12;81;66;81", "wc_weaknesses": "300;841;194;139", "wc_questions": "14;94;2;66", "wc_review": "390;1216;284;386", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "723;867;825;863", "reply_reviewers": "0;0;0;0", "reply_authors": "2;2;2;2", "rating_avg": [ 5.25, 0.4330127018922193 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.0, 0.7071067811865476 ], "wc_summary_avg": [ 96.5, 65.82362797658604 ], "wc_strengths_avg": [ 60.0, 28.38133189263675 ], "wc_weaknesses_avg": [ 368.5, 278.8678002208215 ], "wc_questions_avg": [ 44.0, 37.57658845611187 ], "wc_review_avg": [ 569.0, 375.9534545658545 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 819.5, 58.07538204781782 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 2.0, 0.0 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.816496580927726, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=2665088422304130128&as_sdt=400005&sciodt=0,14&hl=en", "gs_version_total": 4, "aff_unique_index": "0;0;1;2;0;0", "aff_unique_norm": "Nanjing University;Peking University;Nanjing University of Science and Technology", "aff_unique_dep": ";;", "aff_unique_url": "http://www.nju.edu.cn;http://www.pku.edu.cn;http://www.nust.edu.cn/", "aff_unique_abbr": "Nanjing U;Peking U;NUST", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "China" }, { 
"id": "B21c9hT1D7", "title": "High-dimensional robust regression under heavy-tailed data: Asymptotics and Universality", "track": "main", "status": "Reject", "tldr": "", "abstract": "We investigate the high-dimensional properties of robust regression estimators in the presence of heavy-tailed contamination of both the covariates and response functions. In particular, we provide a sharp asymptotic characterisation of M-estimators trained on a family of elliptical covariate and noise data distributions including cases where second and higher moments do not exist. We show that, despite being consistent, the Huber loss with optimally tuned location parameter $\\delta$ is suboptimal in the high-dimensional regime in the presence of heavy-tailed noise, highlighting the necessity of further regularisation to achieve optimal performance. This result also uncovers the existence of a curious transition in $\\delta$ as a function of the sample complexity and contamination. Moreover, we derive the decay rates for the excess risk of ridge regression. We show that, while it is both optimal and universal for noise distributions with finite second moment, its decay rate can be considerably faster when the covariates' second moment does not exist. Finally, we show that our formulas readily generalise to a richer family of models and data distributions, such as generalised linear estimation with arbitrary convex regularisation trained on mixture models.", "keywords": "High-dimensional statistics;Robust regression;M-estimation;Huber loss;Heavy-tail contamination;Replica trick", "primary_area": "learning theory", "supplementary_material": "/attachment/dd9355e049cfee52697f13694ff2dda6eb552dcd.pdf", "author": "Urte Adomaityte;Leonardo Defilippis;Bruno Loureiro;Gabriele Sicuro", "authorids": "~Urte_Adomaityte1;~Leonardo_Defilippis1;~Bruno_Loureiro1;~Gabriele_Sicuro1", "gender": "F;M;M;M", "homepage": ";;https://brloureiro.github.io/;https://gsicuro.github.io/", "dblp": ";358/3529;207/1834;145/7405", "google_scholar": ";https://scholar.google.fr/citations?user=-df-QMIAAAAJ;DXl3ir8AAAAJ;Lls7QvUAAAAJ", "orcid": "0000-0002-5593-2177;;0000-0002-6327-4688;0000-0002-9258-2436", "linkedin": ";;bruno-loureiro-43183b14a/;", "or_profile": "~Urte_Adomaityte1;~Leonardo_Defilippis1;~Bruno_Loureiro1;~Gabriele_Sicuro1", "aff": "King's College London, University of London;Ecole Normale Sup\u00e9rieure, Ecole Normale Sup\u00e9rieure de Paris;Ecole Normale Sup\u00e9rieure, Ecole Normale Sup\u00e9rieure de Paris;University of Bologna", "aff_domain": "kcl.ac.uk;di.ens.fr;di.ens.fr;unibo.it", "position": "PhD student;PhD student;Researcher;Associate Professor", "bibtex": "@misc{\nadomaityte2024highdimensional,\ntitle={High-dimensional robust regression under heavy-tailed data: Asymptotics and Universality},\nauthor={Urte Adomaityte and Leonardo Defilippis and Bruno Loureiro and Gabriele Sicuro},\nyear={2024},\nurl={https://openreview.net/forum?id=B21c9hT1D7}\n}", "github": "", "project": "", "reviewers": "Fbsx;sjuz;JXsv", "site": "https://openreview.net/forum?id=B21c9hT1D7", "pdf_size": 997354, "rating": "5;6;8", "confidence": "3;3;3", "soundness": "3;3;3", "contribution": "2;2;3", "presentation": "2;2;3", "wc_summary": "35;118;43", "wc_strengths": "11;89;38", "wc_weaknesses": "56;222;29", "wc_questions": "454;473;22", "wc_review": "556;902;132", "wc_reply_reviewers": "116;171;0", "wc_reply_authors": "1112;1010;86", "reply_reviewers": "1;1;0", "reply_authors": "2;2;1", "rating_avg": [ 6.333333333333333, 1.247219128924647 ], 
"confidence_avg": [ 3.0, 0.0 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 65.33333333333333, 37.38389433373088 ], "wc_strengths_avg": [ 46.0, 32.341923257592455 ], "wc_weaknesses_avg": [ 102.33333333333333, 85.33203124006575 ], "wc_questions_avg": [ 316.3333333333333, 208.2695902483659 ], "wc_review_avg": [ 530.0, 314.8883399979534 ], "wc_reply_reviewers_avg": [ 95.66666666666667, 71.27567763425488 ], "wc_reply_authors_avg": [ 736.0, 461.50189598743793 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 1.6666666666666667, 0.4714045207910317 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 13, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10697380971436726465&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "aff_unique_index": "0;1;1;2", "aff_unique_norm": "King's College London;Ecole Normale Sup\u00e9rieure de Paris;University of Bologna", "aff_unique_dep": ";;", "aff_unique_url": "https://www.kcl.ac.uk;https://www.ens.psl.eu;https://www.unibo.it", "aff_unique_abbr": "KCL;ENS Paris;Unibo", "aff_campus_unique_index": "1;1", "aff_campus_unique": ";Paris", "aff_country_unique_index": "0;1;1;2", "aff_country_unique": "United Kingdom;France;Italy" }, { "id": "B37UmlxsaP", "title": "Revealing The Intrinsic Ability of Generative Text Summarizers for Outlier Paragraph Detection", "track": "main", "status": "Reject", "tldr": "", "abstract": "Generative text summarizers are good at content encapsulation but falter when outlier paragraphs disrupt the primary narrative. We categorize these outliers into cross-document outliers that are thematically inconsistent but within the same domain, and cross-domain outliers, originating from distinct domains. Traditional methods lean on word embeddings and specialized classifiers, requiring extensive supervised fine-tuning. Confidence-based strategies, despite bypassing fine-tuning, are ill-suited due to the non-classification essence of summarization. Leveraging the encoder-decoder cross-attention framework, we introduce an approach emphasizing the unique characteristics of infrequent words in detection. We present CODE, a novel outlier detector using a closed-form expression rooted in cross-attention scores. Our experimental results validate the superiority of CODE under different datasets and architectures, e.g., achieving a 5.80\\% FPR at 95\\% TPR vs. 25.63\\% by supervised baselines on T5-Large and Delve domain. 
We further underscore the significance of cross-attention, word frequency normalization and judicious integration of cross-document outliers during pretraining.", "keywords": "Outlier Paragraph Detection;Generative Language Models;Cross Attention", "primary_area": "generative models", "supplementary_material": "", "author": "Qi Li;Lyuwen Wu;Lin Liu;Luoyi Fu;Xinbing Wang;Lei Zhou;Chenghu Zhou;Shiyu Liang", "authorids": "~Qi_Li15;~Lyuwen_Wu1;~Lin_Liu16;~Luoyi_Fu1;~Xinbing_Wang1;~Lei_Zhou3;~Chenghu_Zhou3;~Shiyu_Liang1", "gender": "M;F;M;F;M;M;M;M", "homepage": ";;;http://www.cs.sjtu.edu.cn/~fu-ly/index.html;http://www.cs.sjtu.edu.cn/~wang-xb/;;http://www.igsnrr.cas.cn/gkjj/ysfc/ysfc_zhouchenghu/;", "dblp": ";;;;96/1149.html;72/5749;85/1324.html;", "google_scholar": ";;eoj1VFoAAAAJ;https://scholar.google.com.tw/citations?user=xHs9mCUAAAAJ;https://scholar.google.com.tw/citations?user=CT5yZbwAAAAJ;;;L8r9ox4AAAAJ", "orcid": "0000-0001-8089-8348;0009-0007-2607-7072;;;0000-0002-0357-8356;;;", "linkedin": ";;;;;;;", "or_profile": "~Qi_Li15;~Lyuwen_Wu1;~Lin_Liu16;~Luoyi_Fu1;~Xinbing_Wang1;~Lei_Zhou3;~Chenghu_Zhou3;~Shiyu_Liang1", "aff": "Shanghai Jiaotong University;Shanghai Jiaotong University;National University of Defense Technology;Shanghai Jiaotong University;Shanghai Jiaotong University;Shanghai Jiaotong University;IGSNRR, Chinese Academy of Sciences, Beijing, China;Shanghai Jiaotong University", "aff_domain": "sjtu.edu.cn;sjtu.edu.cn;nudt.edu.cn;sjtu.edu.cn;cs.sjtu.edu.cn;sjtu.edu.cn;lreis.ac.cn;sjtu.edu.cn", "position": "PhD student;MS student;Associate Professor;Associate Professor;Full Professor;Full Professor;Full Professor;Assistant Professor", "bibtex": "@misc{\nli2024revealing,\ntitle={Revealing The Intrinsic Ability of Generative Text Summarizers for Outlier Paragraph Detection},\nauthor={Qi Li and Lyuwen Wu and Lin Liu and Luoyi Fu and Xinbing Wang and Lei Zhou and Chenghu Zhou and Shiyu Liang},\nyear={2024},\nurl={https://openreview.net/forum?id=B37UmlxsaP}\n}", "github": "", "project": "", "reviewers": "tMsa;bZd9;2Dc8;G5oa", "site": "https://openreview.net/forum?id=B37UmlxsaP", "pdf_size": 997499, "rating": "1;3;3;3", "confidence": "4;3;4;3", "soundness": "3;2;2;2", "contribution": "1;1;1;2", "presentation": "2;1;3;2", "wc_summary": "64;29;103;42", "wc_strengths": "12;34;22;35", "wc_weaknesses": "113;137;218;157", "wc_questions": "17;63;132;3", "wc_review": "206;263;475;237", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 2.5, 0.8660254037844386 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 1.25, 0.4330127018922193 ], "presentation_avg": [ 2.0, 0.7071067811865476 ], "wc_summary_avg": [ 59.5, 28.0579756931964 ], "wc_strengths_avg": [ 25.75, 9.443913383762052 ], "wc_weaknesses_avg": [ 156.25, 38.90613704802881 ], "wc_questions_avg": [ 53.75, 50.335747734587194 ], "wc_review_avg": [ 295.25, 105.72221857301331 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 6, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:PqyAnqwWOFYJ:scholar.google.com/&scioq=Revealing+The+Intrinsic+Ability+of+Generative+Text+Summarizers+for+Outlier+Paragraph+Detection&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;0;1;0;0;0;2;0", 
"aff_unique_norm": "Shanghai Jiao Tong University;National University of Defense Technology;Chinese Academy of Sciences", "aff_unique_dep": ";;IGSNRR", "aff_unique_url": "https://www.sjtu.edu.cn;http://www.nudt.edu.cn/;http://www.cas.cn", "aff_unique_abbr": "SJTU;NUDT;CAS", "aff_campus_unique_index": "1", "aff_campus_unique": ";Beijing", "aff_country_unique_index": "0;0;0;0;0;0;0;0", "aff_country_unique": "China" }, { "id": "B3E8Y8g9GA", "title": "Data Overfitting for On-Device Super-Resolution with Dynamic Algorithm and Compiler Co-Design", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Deep neural networks (DNNs) are frequently employed in a variety of computer vision applications. Nowadays, an emerging trend in the current video distribution system is to take the advantage of DNNs overfitting property to perform video resolution upscaling. By splitting videos into chunks and applying a super-resolution (SR) model to overfit each chunk, this scheme of SR models plus video chunks is able to replace traditional video transmission to enhance video quality and transmission efficiency. However, many models and chunks are needed to guarantee a high performance, which leads to tremendous overhead on model switching and memory footprints at the user end. To resolve such problems, we propose a Dynamic Deep neural network assisted by a Content-Aware data processing pipeline to reduce the model number down to one (Dy-DCA), which helps promote performance while conserving computational resources. Additionally, to achieve real acceleration on the user end, we design a framework that optimizes dynamic features (e.g., dynamic shapes, sizes, and control flow) in Dy-DCA to enable a series of compilation optimizations, including fused code generation, static execution planning, etc. By employ such techniques, our method achieves better PSNR and real-time performance (33 FPS) on an off-the-shelf mobile phone. 
Meanwhile, assisted by our compilation optimization, we achieve 1.7$\\times$ speedup while saving up to 1.61$\\times$ memory consumption.", "keywords": "video super-resolution; overfitting; compiler optimization", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Gen Li;Zhihao Shu;Jie Ji;Minghai Qin;Fatemeh Afghah;Wei Niu;Xiaolong Ma", "authorids": "~Gen_Li4;~Zhihao_Shu1;~Jie_Ji1;~Minghai_Qin1;~Fatemeh_Afghah1;~Wei_Niu3;~Xiaolong_Ma2", "gender": "M;M;;M;F;M;M", "homepage": "https://coulsonlee.github.io;;;https://sites.google.com/site/minghaiqin/home;https://sites.google.com/g.clemson.edu/is-win-lab/home;https://www.niuwei.info;https://xiaolongma2016.com", "dblp": "28/538-12;369/3951;;;70/8821.html;68/828-2.html;", "google_scholar": ";dkxKQq0AAAAJ;;MSgWKbYAAAAJ;https://scholar.google.com.tw/citations?user=67mA71QAAAAJ;w1RoaOMAAAAJ;https://scholar.google.com/citations?hl=en", "orcid": ";;;;0000-0002-2315-1173;;0000-0003-3753-7648", "linkedin": ";;;;fatemeh-afghah-57b53816/;;xiaolong-ma-66b98910b/", "or_profile": "~Gen_Li4;~Zhihao_Shu1;~Jie_Ji1;~Minghai_Qin1;~Fatemeh_Afghah1;~Wei_Niu3;~Xiaolong_Ma2", "aff": "Clemson University;University of Georgia;;Western Digital Corporation;Clemson University;University of Georgia;Clemson University", "aff_domain": "clemson.edu;uga.edu;;wdc.com;clemson.edu;uga.edu;clemson.edu", "position": "PhD student;PhD student;;senior technologist;Associate Professor;Assistant Professor;Assistant Professor", "bibtex": "@misc{\nli2024data,\ntitle={Data Overfitting for On-Device Super-Resolution with Dynamic Algorithm and Compiler Co-Design},\nauthor={Gen Li and Zhihao Shu and Jie Ji and Minghai Qin and Fatemeh Afghah and Wei Niu and Xiaolong Ma},\nyear={2024},\nurl={https://openreview.net/forum?id=B3E8Y8g9GA}\n}", "github": "", "project": "", "reviewers": "nwgm;wfAU;J3a9;PF2v", "site": "https://openreview.net/forum?id=B3E8Y8g9GA", "pdf_size": 16068186, "rating": "5;5;5;6", "confidence": "4;3;2;3", "soundness": "2;3;2;3", "contribution": "2;3;3;2", "presentation": "3;2;2;3", "wc_summary": "75;24;97;219", "wc_strengths": "70;14;25;253", "wc_weaknesses": "66;45;22;93", "wc_questions": "4;108;89;25", "wc_review": "215;191;233;590", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "814;557;114;721", "reply_reviewers": "0;0;0;0", "reply_authors": "2;2;2;2", "rating_avg": [ 5.25, 0.4330127018922193 ], "confidence_avg": [ 3.0, 0.7071067811865476 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 103.75, 71.61485530251387 ], "wc_strengths_avg": [ 90.5, 96.13662153414795 ], "wc_weaknesses_avg": [ 56.5, 26.196373794859472 ], "wc_questions_avg": [ 56.5, 43.176961449365564 ], "wc_review_avg": [ 307.25, 163.92433467914395 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 551.5, 268.82754695157263 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 2.0, 0.0 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:45YcQKaSy-sJ:scholar.google.com/&scioq=Data+Overfitting+for+On-Device+Super-Resolution+with+Dynamic+Algorithm+and+Compiler+Co-Design&hl=en&as_sdt=0,33", "gs_version_total": 6, "aff_unique_index": "0;1;2;0;1;0", "aff_unique_norm": "Clemson University;University of Georgia;Western Digital Corporation", "aff_unique_dep": ";;", "aff_unique_url": 
"https://www.clemson.edu;https://www.uga.edu;https://www.westerndigital.com", "aff_unique_abbr": "Clemson;UGA;WDC", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "B4E2BW27MP", "title": "PromptCoT: Align Prompt Distribution via Adapted Chain-of-Thought", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Diffusion-based generative models have exhibited remarkable capability in the production of high-fidelity visual content such as images and videos. However, their performance is significantly contingent upon the quality of textual inputs, commonly referred to as \"prompts\".\n The process of traditional prompt engineering, while effective, necessitates empirical expertise and poses challenges for inexperienced users.\n In this paper, we introduce PromptCoT, an innovative enhancer that autonomously refines prompts for users.\n The design of PromptCoT is based on the observation that, prompts resembling textual information corresponding to high-quality images within the training set tend to yield superior generation performance.\n As such, we fine-tune the pre-trained Large Language Models (LLM) using a curated text dataset comprising solely of high-quality visual content descriptions. By doing so, the LLM becomes capable of capturing the distribution of high-quality training texts, enabling it to generate aligned continuations and revisions to boost the original texts.\n Nonetheless, one drawback of pre-trained LLMs is their tendency to generate extraneous or irrelevant information. To enhance the alignment between the original text prompts and the refined counterparts, we leverage the Chain-of-Thought (CoT) mechanism. CoT can extract and amalgamate crucial information from the aligned continuation and revision, enabling reasonable inferences based on the contextual cues to produce a more comprehensive and nuanced final output. \n Considering computational efficiency, instead of allocating a dedicated LLM for prompt enhancement to each individual model or dataset, we integrate adapters that facilitate dataset-specific adaptation, leveraging a shared pre-trained LLM as the foundation for this process. \n By fine-tuning these adapters independently, we can adapt PromptCoT to new datasets with minimal increase in training cost and memory usage.\n We assess the performance of PromptCoT on widely-used latent diffusion models for image and video generation to validate the effectiveness. 
The results demonstrate significant improvements in key performance metrics.", "keywords": "text-to-image generative models;prompt engineering;Chain of Thought;parameter efficient adaptation;Large Language Models", "primary_area": "generative models", "supplementary_material": "/attachment/91f80fc6717d44aa9baf63e2157ee385b815414f.pdf", "author": "Junyi Yao;Yijiang Liu;Zhen Dong;Mingfei Guo;Kurt Keutzer;Li Du;Daquan Zhou;Shanghang Zhang", "authorids": "~Junyi_Yao1;~Yijiang_Liu2;~Zhen_Dong3;~Mingfei_Guo1;~Kurt_Keutzer1;~Li_Du5;~Daquan_Zhou1;~Shanghang_Zhang4", "gender": "M;M;M;F;M;M;M;F", "homepage": ";;https://dong-zhen.com/;https://www.linkedin.com/in/mingfeiguo/;https://people.eecs.berkeley.edu/~keutzer/;;https://iscl.nju.edu.cn/main.psp;https://www.shanghangzhang.com/", "dblp": ";;;;k/KurtKeutzer.html;244/9623;;95/11531", "google_scholar": ";uOyz518AAAAJ;czxMUzcAAAAJ;;ID9QePIAAAAJ;DdCAbWwAAAAJ;;voqw10cAAAAJ", "orcid": "0009-0002-1437-2836;0000-0001-5914-1607;;;0000-0003-3868-8501;;0000-0003-2687-6978;", "linkedin": ";;zhen-dong/;;kurtkeutzer/;;;", "or_profile": "~Junyi_Yao1;~Yijiang_Liu2;~Zhen_Dong3;~Mingfei_Guo1;~Kurt_Keutzer1;~Zhou_Daquan1;~LI_DU4;~Shanghang_Zhang1", "aff": "Peking University;Nanjing Universiy;Nexusflow.ai Inc;Stanford University;University of California, Berkeley;Bytedance;Nanjing University;Peking University", "aff_domain": "stu.pku.edu.cn;nju.edu.cn;nexusflow.ai;stanford.edu;berkeley.edu;bytedance.com;nju.edu.cn;pku.edu.cn", "position": "Undergrad student;PhD student;Principal Researcher;MS student;Full Professor;Researcher;Associate Professor;Assistant Professor", "bibtex": "@misc{\nyao2024promptcot,\ntitle={PromptCoT: Align Prompt Distribution via Adapted Chain-of-Thought},\nauthor={Junyi Yao and Yijiang Liu and Zhen Dong and Mingfei Guo and Kurt Keutzer and Li Du and Daquan Zhou and Shanghang Zhang},\nyear={2024},\nurl={https://openreview.net/forum?id=B4E2BW27MP}\n}", "github": "", "project": "", "reviewers": "BjAS;zdHw;YkZW", "site": "https://openreview.net/forum?id=B4E2BW27MP", "pdf_size": 9156801, "rating": "3;3;6", "confidence": "3;3;2", "soundness": "2;2;3", "contribution": "1;2;3", "presentation": "2;2;3", "wc_summary": "115;54;111", "wc_strengths": "38;43;81", "wc_weaknesses": "226;203;2", "wc_questions": "8;4;264", "wc_review": "387;304;458", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 4.0, 1.4142135623730951 ], "confidence_avg": [ 2.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.816496580927726 ], "presentation_avg": [ 2.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 93.33333333333333, 27.86076492528915 ], "wc_strengths_avg": [ 54.0, 19.200694431886227 ], "wc_weaknesses_avg": [ 143.66666666666666, 100.6125682451695 ], "wc_questions_avg": [ 92.0, 121.63332876587184 ], "wc_review_avg": [ 383.0, 62.93382768167424 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 3, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": -1.0, "gs_citation": 5, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=2816106117694485180&as_sdt=400005&sciodt=0,14&hl=en", "gs_version_total": 6, "aff_unique_index": "0;1;2;3;4;5;1;0", "aff_unique_norm": "Peking University;Nanjing University;Nexusflow.ai;Stanford University;University of California, Berkeley;ByteDance", "aff_unique_dep": 
";;;;;", "aff_unique_url": "http://www.pku.edu.cn;http://www.nju.edu.cn;https://www.nexusflow.ai;https://www.stanford.edu;https://www.berkeley.edu;https://www.bytedance.com", "aff_unique_abbr": "Peking U;Nanjing U;Nexusflow.ai;Stanford;UC Berkeley;Bytedance", "aff_campus_unique_index": "1;2", "aff_campus_unique": ";Stanford;Berkeley", "aff_country_unique_index": "0;0;1;1;1;0;0;0", "aff_country_unique": "China;United States" }, { "id": "B4XM9nQ8Ns", "title": "HyperSINDy: Deep Generative Modeling of Nonlinear Stochastic Governing Equations", "track": "main", "status": "Reject", "tldr": "", "abstract": "The discovery of governing differential equations from data is an open frontier in machine learning. The {\\em sparse identification of nonlinear dynamics} (SINDy) \\citep{brunton_discovering_2016} framework enables data-driven discovery of interpretable models in the form of sparse, deterministic governing laws. Recent works have sought to adapt this approach to the stochastic setting, though these adaptations are severely hampered by the curse of dimensionality. On the other hand, Bayesian-inspired deep learning methods have achieved widespread success in high-dimensional probabilistic modeling via computationally efficient approximate inference techniques, suggesting the use of these techniques for efficient stochastic equation discovery. Here, we introduce {\\em HyperSINDy}, a framework for modeling stochastic dynamics via a deep generative model of sparse, nonlinear governing equations whose parametric form is discovered from data. HyperSINDy employs a variational encoder to approximate the distribution of observed states and derivatives. A hypernetwork \\citep{ha_hypernetworks_2016} transforms samples from this distribution into the coefficients of a differential equation whose sparse form is learned simultaneously using a trainable binary mask \\citep{louizos_learning_2018}. Once trained, HyperSINDy generates stochastic dynamics via a differential equation whose coefficients are driven by a Wiener process. In experiments HyperSINDy accurately recovers ground truth stochastic governing equations, with stochasticity scaled to match that of the data. Finally, HyperSINDy provides uncertainty quantification that scales to high-dimensional systems, retaining computational efficiency and interpretability. Taken together, HyperSINDy offers a promising framework for model discovery and uncertainty quantification in real-world systems, integrating sparse equation discovery methods with advances in statistical machine learning and deep generative modeling.", "keywords": "generative modeling;deep learning;equation discovery;system identification;VAE;hypernetwork;SINDy", "primary_area": "probabilistic methods (Bayesian methods, variational inference, sampling, UQ, etc.)", "supplementary_material": "/attachment/41c0846f555c3053af7c564d2f777bd42388eb26.zip", "author": "Mozes Jacobs;Bingni W Brunton;Steven Brunton;J. Nathan Kutz;Ryan V. 
Raut", "authorids": "~Mozes_Jacobs1;~Bingni_W_Brunton1;~Steven_Brunton1;~J._Nathan_Kutz1;~Ryan_V._Raut1", "gender": "M;F;M;M;M", "homepage": "https://mozesjacobs.github.io;https://www.bingbrunton.com;https://eigensteve.com;http://faculty.washington.edu/kutz;https://ryraut.github.io/", "dblp": ";138/7786;;;", "google_scholar": ";UftAYPkAAAAJ;TjzWdigAAAAJ;;fafSHeYAAAAJ", "orcid": ";0000-0002-4831-3466;;0000-0002-6004-2275;0000-0002-8761-1431", "linkedin": ";;;;", "or_profile": "~Mozes_Jacobs1;~Bingni_W_Brunton1;~Steven_Brunton1;~J._Nathan_Kutz1;~Ryan_V._Raut1", "aff": "Harvard University, Harvard University;University of Washington, Seattle;;University of Washington;Allen Institute", "aff_domain": "g.harvard.edu;uw.edu;;u.washington.edu;alleninstitute.org", "position": "PhD student;Associate Professor;;Full Professor;Researcher", "bibtex": "@misc{\njacobs2024hypersindy,\ntitle={Hyper{SIND}y: Deep Generative Modeling of Nonlinear Stochastic Governing Equations},\nauthor={Mozes Jacobs and Bingni W Brunton and Steven Brunton and J. Nathan Kutz and Ryan V. Raut},\nyear={2024},\nurl={https://openreview.net/forum?id=B4XM9nQ8Ns}\n}", "github": "", "project": "", "reviewers": "WJp7;7UM6;Bwz8;UKtm;cj4i;kqcu", "site": "https://openreview.net/forum?id=B4XM9nQ8Ns", "pdf_size": 16711409, "rating": "5;5;6;6;6;8", "confidence": "5;3;5;3;3;3", "soundness": "2;2;3;3;2;4", "contribution": "2;2;3;3;2;4", "presentation": "3;3;3;3;3;4", "wc_summary": "135;58;30;75;78;79", "wc_strengths": "58;32;62;34;48;147", "wc_weaknesses": "68;122;17;55;38;73", "wc_questions": "78;32;441;83;112;100", "wc_review": "339;244;550;247;276;399", "wc_reply_reviewers": "0;47;9;39;0;77", "wc_reply_authors": "715;1489;1405;501;875;1155", "reply_reviewers": "0;1;1;1;0;1", "reply_authors": "1;3;2;1;2;3", "rating_avg": [ 6.0, 1.0 ], "confidence_avg": [ 3.6666666666666665, 0.9428090415820634 ], "soundness_avg": [ 2.6666666666666665, 0.7453559924999298 ], "contribution_avg": [ 2.6666666666666665, 0.7453559924999298 ], "presentation_avg": [ 3.1666666666666665, 0.3726779962499649 ], "wc_summary_avg": [ 75.83333333333333, 31.450578514375355 ], "wc_strengths_avg": [ 63.5, 38.96045003162395 ], "wc_weaknesses_avg": [ 62.166666666666664, 32.67729418962892 ], "wc_questions_avg": [ 141.0, 136.4648916999045 ], "wc_review_avg": [ 342.5, 107.63015376742709 ], "wc_reply_reviewers_avg": [ 28.666666666666668, 28.311756490114767 ], "wc_reply_authors_avg": [ 1023.3333333333334, 358.17950186401725 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 2.0, 0.816496580927726 ], "replies_avg": [ 27, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.3535533905932737, "gs_citation": 12, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5622348542617702222&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "aff_unique_index": "0;1;1;2", "aff_unique_norm": "Harvard University;University of Washington;Allen Institute for Artificial Intelligence", "aff_unique_dep": ";;", "aff_unique_url": "https://www.harvard.edu;https://www.washington.edu;https://allenai.org", "aff_unique_abbr": "Harvard;UW;AI2", "aff_campus_unique_index": "1", "aff_campus_unique": ";Seattle", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "United States" }, { "id": "B4nhr6OJWI", "title": "Instilling Inductive Biases with Subnetworks", "track": "main", "status": "Reject", "tldr": "", "abstract": "Despite the recent success of artificial neural networks on a variety of tasks, we have little knowledge or control over the 
exact solutions these models implement. Instilling inductive biases \u2014 preferences for some solutions over others \u2014 into these models is one promising path toward understanding and controlling their behavior. Much work has been done to study the inherent inductive biases of models and instill different inductive biases through hand-designed architectures or carefully curated training regimens. In this work, we explore a more mechanistic approach: Subtask Induction. Our method discovers a functional subnetwork that implements a particular subtask within a trained model and uses it to instill inductive biases towards solutions utilizing that subtask. Subtask Induction is flexible and efficient, and we demonstrate its effectiveness with two experiments. First, we show that Subtask Induction significantly reduces the amount of training data required for a model to adopt a specific, generalizable solution to a modular arithmetic task. Second, we demonstrate that Subtask Induction successfully induces a human-like shape bias while increasing data efficiency for convolutional and transformer-based image classification models.", "keywords": "inductive bias;generalization", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Enyan Zhang;Michael A. Lepori;Ellie Pavlick", "authorids": "~Enyan_Zhang1;~Michael_A._Lepori1;~Ellie_Pavlick1", "gender": ";M;F", "homepage": "https://enyanz.com;https://lepori.xyz/;http://cs.brown.edu/people/epavlick/", "dblp": ";262/0162;141/4059", "google_scholar": "qbL4zikAAAAJ;G1fepc8AAAAJ;sFyrSa8AAAAJ", "orcid": ";;", "linkedin": ";michael-lepori-925426124/;", "or_profile": "~Enyan_Zhang1;~Michael_A._Lepori1;~Ellie_Pavlick1", "aff": "Brown University;Brown University;Brown University", "aff_domain": "brown.edu;brown.edu;brown.edu", "position": "Undergrad student;PhD student;Assistant Professor", "bibtex": "@misc{\nzhang2024instilling,\ntitle={Instilling Inductive Biases with Subnetworks},\nauthor={Enyan Zhang and Michael A. 
Lepori and Ellie Pavlick},\nyear={2024},\nurl={https://openreview.net/forum?id=B4nhr6OJWI}\n}", "github": "", "project": "", "reviewers": "wyEr;pnkg;PuHj", "site": "https://openreview.net/forum?id=B4nhr6OJWI", "pdf_size": 1727742, "rating": "6;6;8", "confidence": "3;3;3", "soundness": "3;2;4", "contribution": "3;2;3", "presentation": "4;4;4", "wc_summary": "78;268;116", "wc_strengths": "17;31;116", "wc_weaknesses": "87;154;92", "wc_questions": "349;282;22", "wc_review": "531;735;346", "wc_reply_reviewers": "96;0;0", "wc_reply_authors": "1495;1713;339", "reply_reviewers": "2;0;0", "reply_authors": "4;3;1", "rating_avg": [ 6.666666666666667, 0.9428090415820634 ], "confidence_avg": [ 3.0, 0.0 ], "soundness_avg": [ 3.0, 0.816496580927726 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 4.0, 0.0 ], "wc_summary_avg": [ 154.0, 82.0893821798329 ], "wc_strengths_avg": [ 54.666666666666664, 43.74420596553966 ], "wc_weaknesses_avg": [ 111.0, 30.474032661705056 ], "wc_questions_avg": [ 217.66666666666666, 141.0350626223454 ], "wc_review_avg": [ 537.3333333333334, 158.87171624371098 ], "wc_reply_reviewers_avg": [ 32.0, 45.254833995939045 ], "wc_reply_authors_avg": [ 1182.3333333333333, 602.931357803044 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.9428090415820634 ], "reply_authors_avg": [ 2.6666666666666665, 1.247219128924647 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=6901432766231011120&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 4, "aff_unique_index": "0;0;0", "aff_unique_norm": "Brown University", "aff_unique_dep": "", "aff_unique_url": "https://www.brown.edu", "aff_unique_abbr": "Brown", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "title": "P2Seg: Pointly-supervised Segmentation via Mutual Distillation", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19231", "id": "B4vzu2aokv", "author_site": "Zipeng Wang, Xuehui Yu, Xumeng Han, Wenwen Yu, Zhixun Huang, Jianbin Jiao, Zhenjun Han", "tldr": "", "abstract": "Point-level Supervised Instance Segmentation (PSIS) aims to enhance the applicability and scalability of instance segmentation by utilizing low-cost yet instance-informative annotations. Existing PSIS methods usually rely on positional information to distinguish objects, but predicting precise boundaries remains challenging due to the lack of contour annotations. Nevertheless, weakly supervised semantic segmentation methods are proficient in utilizing intra-class feature consistency to capture the boundary contours of the same semantic regions. In this paper, we design a Mutual Distillation Module (MDM) to leverage the complementary strengths of both instance position and semantic information and achieve accurate instance-level object perception. The MDM consists of Semantic to Instance (S2I) and Instance to Semantic (I2S). S2I is guided by the precise boundaries of semantic regions to learn the association between annotated points and instance contours. I2S leverages discriminative relationships between instances to facilitate the differentiation of various objects within the semantic map. Extensive experiments substantiate the efficacy of MDM in fostering the synergy between instance and semantic information, consequently improving the quality of instance-level object representations. 
Our method achieves 55.7 mAP50 and 17.6 mAP on the PASCAL VOC and MS COCO datasets, significantly outperforming recent PSIS methods and several box-supervised instance segmentation competitors.", "keywords": "Mutual Distillation;Semantic to Instance;Instance to Semantic;Point-level Supervised Instance Segmentation", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/86d4f1caa1f211657373db8c23b9b64e7d261e1c.pdf", "author": "Zipeng Wang;Xuehui Yu;Xumeng Han;Wenwen Yu;Zhixun Huang;Jianbin Jiao;Zhenjun Han", "authorids": "~Zipeng_Wang2;~Xuehui_Yu1;~Xumeng_Han1;~Wenwen_Yu2;~Zhixun_Huang1;~Jianbin_Jiao1;~Zhenjun_Han1", "gender": "M;M;;;M;M;M", "homepage": "https://vision.ucas.ac.cn/;;http://vision.ucas.ac.cn/;;http://lamp.ucas.ac.cn/;https://people.ucas.ac.cn/~hanzhj;https://yinglang.github.io/", "dblp": ";297/3745;;;;11/2938;243/8603", "google_scholar": ";https://scholar.google.cz/citations?user=LWu_FiQAAAAJ;;;;0rK4yTcAAAAJ;WYrxoBEAAAAJ", "orcid": ";0000-0002-1636-463X;;0000-0002-8941-2700;;;", "linkedin": ";;;;;;", "or_profile": "~Zipeng_Wang2;~Xumeng_Han1;~Wenwen_Yu2;~Zhixun_Huang1;~Jianbin_Jiao1;~Zhenjun_Han1;~hui_ying2", "aff": "University of Chinese Academy of Sciences;University of Chinese Academy of Sciences;University of Chinese Academy of Sciences;;University of Chinese Academy of Sciences;University of Chinese Academy of Sciences;University of Chinese Academy of Sciences", "aff_domain": "ucas.ac.cn;ucas.ac.cn;ucas.ac.cn;;ucas.ac.cn;ucas.ac.cn;mails.ucas.ac.cn", "position": "MS student;PhD student;MS student;;Full Professor;Associate Professor;PhD student", "bibtex": "@inproceedings{\nwang2024pseg,\ntitle={P2Seg: Pointly-supervised Segmentation via Mutual Distillation},\nauthor={Zipeng Wang and Xuehui Yu and Xumeng Han and Wenwen Yu and Zhixun Huang and Jianbin Jiao and Zhenjun Han},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=B4vzu2aokv}\n}", "github": "", "project": "", "reviewers": "QcUt;3EDk;ZJkY;enoR;fR5S", "pdf_size": 2915691, "rating": "3;6;6;6;8", "confidence": "4;4;3;4;5", "soundness": "1;3;3;2;3", "contribution": "2;3;3;2;3", "presentation": "2;2;3;1;3", "wc_summary": "45;67;39;104;76", "wc_strengths": "125;65;29;12;95", "wc_weaknesses": "983;189;134;134;164", "wc_questions": "39;57;15;4;9", "wc_review": "1192;378;217;254;344", "wc_reply_reviewers": "58;16;66;28;0", "wc_reply_authors": "2791;1410;1491;1448;1015", "reply_reviewers": "1;1;1;1;0", "reply_authors": "5;2;3;2;2", "rating_avg": [ 5.8, 1.6 ], "confidence_avg": [ 4.0, 0.6324555320336759 ], "soundness_avg": [ 2.4, 0.8 ], "contribution_avg": [ 2.6, 0.4898979485566356 ], "presentation_avg": [ 2.2, 0.7483314773547882 ], "wc_summary_avg": [ 66.2, 23.301502097504358 ], "wc_strengths_avg": [ 65.2, 41.48445491988535 ], "wc_weaknesses_avg": [ 320.8, 331.73929523045655 ], "wc_questions_avg": [ 24.8, 20.08382433701311 ], "wc_review_avg": [ 477.0, 362.2275527896794 ], "wc_reply_reviewers_avg": [ 33.6, 24.96076921891631 ], "wc_reply_authors_avg": [ 1631.0, 604.4809343560804 ], "reply_reviewers_avg": [ 0.8, 0.4 ], "reply_authors_avg": [ 2.8, 1.16619037896906 ], "replies_avg": [ 25, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": 0.3952847075210474, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=7416667966264732466&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 5, "openreview": 
"https://openreview.net/forum?id=B4vzu2aokv", "pdf": "https://openreview.net/pdf?id=B4vzu2aokv", "email": "ucas.ac.cn;ucas.ac.cn;ucas.ac.cn;;ucas.ac.cn;ucas.ac.cn;mails.ucas.ac.cn", "author_num": 7, "aff_unique_index": "0;0;0;0;0;0", "aff_unique_norm": "University of Chinese Academy of Sciences", "aff_unique_dep": "", "aff_unique_url": "http://www.ucas.ac.cn", "aff_unique_abbr": "UCAS", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "China" }, { "id": "B5CgCJY2po", "title": "Flood and Echo: Algorithmic Alignment of GNNs with Distributed Computing", "track": "main", "status": "Reject", "tldr": "", "abstract": "Graph Neural Networks are a natural fit for learning algorithms. They can directly represent tasks through an abstract but versatile graph structure and handle inputs of different sizes. This opens up the possibility for scaling and extrapolation to larger graphs, one of the most important advantages of an algorithm. However, this raises two core questions i) How can we enable nodes to gather the required information in a given graph ($\\textit{information exchange}$), even if is far away and ii) How can we design an execution framework which enables this information exchange for extrapolation to larger graph sizes ($\\textit{algorithmic alignment for extrapolation}$). We propose a new execution framework that is inspired by the design principles of distributed algorithms: Flood and Echo Net. It propagates messages through the entire graph in a wave like activation pattern, which naturally generalizes to larger instances. Through its sparse but parallel activations it is provably more efficient in terms of message complexity. We study the proposed model and provide both empirical evidence and theoretical insights in terms of its expressiveness, efficiency, information exchange and ability to extrapolate.", "keywords": "GNN;Extrapolation;Algorithm Learning;Distributed Computing", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Jo\u00ebl Mathys;Florian Gr\u00f6tschla;Kalyan Varma Nadimpalli;Roger Wattenhofer", "authorids": "~Jo\u00ebl_Mathys1;~Florian_Gr\u00f6tschla1;~Kalyan_Varma_Nadimpalli1;~Roger_Wattenhofer1", "gender": ";M;M;Not Specified", "homepage": ";https://disco.ethz.ch/members/fgroetschla;;https://disco.ethz.ch/members/wroger", "dblp": ";334/1811;;w/RogerWattenhofer", "google_scholar": ";;5fONIZkAAAAJ;https://scholar.google.ch/citations?user=EG3VPm4AAAAJ", "orcid": ";;;", "linkedin": ";;;roger-wattenhofer-4466731/", "or_profile": "~Jo\u00ebl_Mathys1;~Florian_Gr\u00f6tschla1;~Kalyan_Varma_Nadimpalli1;~Roger_Wattenhofer1", "aff": ";Oracle Labs;Department of Computer Science, Indian Institute of Technology, Madras, Indian Institute of Technology, Madras;Swiss Federal Institute of Technology", "aff_domain": ";oracle.com;cse.iitm.ac.in;ethz.ch", "position": ";Intern;Intern;Full Professor", "bibtex": "@misc{\nmathys2024flood,\ntitle={Flood and Echo: Algorithmic Alignment of {GNN}s with Distributed Computing},\nauthor={Jo{\\\"e}l Mathys and Florian Gr{\\\"o}tschla and Kalyan Varma Nadimpalli and Roger Wattenhofer},\nyear={2024},\nurl={https://openreview.net/forum?id=B5CgCJY2po}\n}", "github": "", "project": "", "reviewers": "gPuo;VsT5;hXqD;W7g1", "site": "https://openreview.net/forum?id=B5CgCJY2po", "pdf_size": 952795, "rating": "3;3;5;8", "confidence": "4;4;4;3", "soundness": "2;2;1;4", "contribution": "2;1;1;4", "presentation": "2;3;1;4", 
"wc_summary": "62;79;139;29", "wc_strengths": "67;71;48;46", "wc_weaknesses": "260;128;238;45", "wc_questions": "113;78;94;49", "wc_review": "502;356;519;169", "wc_reply_reviewers": "157;125;0;0", "wc_reply_authors": "1071;1557;935;383", "reply_reviewers": "1;1;0;0", "reply_authors": "2;3;2;1", "rating_avg": [ 4.75, 2.0463381929681126 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.25, 1.0897247358851685 ], "contribution_avg": [ 2.0, 1.224744871391589 ], "presentation_avg": [ 2.5, 1.118033988749895 ], "wc_summary_avg": [ 77.25, 39.927277643235335 ], "wc_strengths_avg": [ 58.0, 11.113055385446435 ], "wc_weaknesses_avg": [ 167.75, 86.7363101590101 ], "wc_questions_avg": [ 83.5, 23.4574082114798 ], "wc_review_avg": [ 386.5, 140.65294166849125 ], "wc_reply_reviewers_avg": [ 70.5, 71.40203078344481 ], "wc_reply_authors_avg": [ 986.5, 418.1731100871982 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 2.0, 0.7071067811865476 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.9169493006161777, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:kCCViVDaxREJ:scholar.google.com/&scioq=Flood+and+Echo:+Algorithmic+Alignment+of+GNNs+with+Distributed+Computing&hl=en&as_sdt=0,47", "gs_version_total": 2, "aff_unique_index": "0;1;2", "aff_unique_norm": "Oracle Corporation;Indian Institute of Technology, Madras;Swiss Federal Institute of Technology", "aff_unique_dep": "Oracle Labs;Department of Computer Science;", "aff_unique_url": "https://labs.oracle.com;https://www.iitm.ac.in;https://www.ethz.ch", "aff_unique_abbr": "Oracle Labs;IIT Madras;ETH Zurich", "aff_campus_unique_index": "1", "aff_campus_unique": ";Madras", "aff_country_unique_index": "0;1;2", "aff_country_unique": "United States;India;Switzerland" }, { "id": "B5Tp4WwZl8", "title": "Error Feedback Shines when Features are Rare", "track": "main", "status": "Reject", "tldr": "", "abstract": "We provide the first proof that gradient descent $\\left({\\color{green}\\sf GD}\\right)$ with greedy sparsification $\\left({\\color{green}\\sf TopK}\\right)$ and error feedback $\\left({\\color{green}\\sf EF}\\right)$ can obtain better communication complexity than vanilla ${\\color{green}\\sf GD}$ when solving the distributed optimization problem $\\min_{x\\in \\mathbb{R}^d} {f(x)=\\frac{1}{n}\\sum_{i=1}^n f_i(x)}$, where $n$ = # of clients, $d$ = # of features, and $f_1,\\dots,f_n$ are smooth nonconvex functions. Despite intensive research since 2014 when ${\\color{green}\\sf EF}$ was first proposed by Seide et al., this problem remained open until now. Perhaps surprisingly, we show that ${\\color{green}\\sf EF}$ shines in the regime when features are rare, i.e., when each feature is present in the data owned by a small number of clients only. 
To illustrate our main result, we show that in order to find a random vector $\\hat{x}$ such that $\\lVert {\\nabla f(\\hat{x})} \\rVert^2 \\leq \\varepsilon$ in expectation, ${\\color{green}\\sf GD}$ with the ${\\color{green}\\sf Top1}$ sparsifier and ${\\color{green}\\sf EF}$ requires ${\\cal O} \\left( \\left( L +\n{\\color{blue}r} \\sqrt{ \\frac{{\\color{red}c}}{n} \\min \\left( \\frac{{\\color{red}c}}{n} \\max_i L_i^2, \\frac{1}{n}\\sum_{i=1}^n L_i^2 \\right) }\n\\right) \\frac{1}{\\varepsilon} \\right)$ bits to be communicated by each worker to the server only, where $L$ is the smoothness constant of $f$, $L_i$ is the smoothness constant of $f_i$, ${\\color{red}c}$ is the maximal number of clients owning any feature ($1\\leq {\\color{red}c} \\leq n$), and ${\\color{blue}r}$ is the maximal number of features owned by any client ($1\\leq {\\color{blue}r} \\leq d$). Clearly, the communication complexity improves as ${\\color{red}c}$ decreases (i.e., as features become more rare), and can be much better than the ${\\cal O}({\\color{blue}r} L \\frac{1}{\\varepsilon})$ communication complexity of ${\\color{green}\\sf GD}$ in the same regime.", "keywords": "error feedback;greedy sparsification;distributed optimization;communication complexity", "primary_area": "optimization", "supplementary_material": "/attachment/6584da25926a6f7cc21f5f7b17e343403d8decca.zip", "author": "Peter Richt\u00e1rik;Elnur Gasanov;Konstantin Pavlovich Burlachenko", "authorids": "~Peter_Richt\u00e1rik1;~Elnur_Gasanov1;~Konstantin_Pavlovich_Burlachenko1", "gender": "M;M;M", "homepage": "https://elnurgasanov.com;https://burlachenkok.github.io/;https://richtarik.org", "dblp": "231/7651;;62/8001", "google_scholar": ";3pA-LoQAAAAJ;https://scholar.google.com/citations?hl=en", "orcid": ";;0000-0003-4380-5848", "linkedin": ";burlachenkok/;richtarik/", "or_profile": "~Elnur_Gasanov1;~Konstantin_Pavlovich_Konstantin_Burlachenko1;~Peter_Richtarik1", "aff": "KAUST;;King Abdullah University of Science and Technology (KAUST)", "aff_domain": "kaust.edu.sa;;kaust.edu.sa", "position": "PhD student;;Full Professor", "bibtex": "@misc{\nricht{\\'a}rik2024error,\ntitle={Error Feedback Shines when Features are Rare},\nauthor={Peter Richt{\\'a}rik and Elnur Gasanov and Konstantin Pavlovich Burlachenko},\nyear={2024},\nurl={https://openreview.net/forum?id=B5Tp4WwZl8}\n}", "github": "", "project": "", "reviewers": "XpPb;h2wk;CuB9;xzAm", "site": "https://openreview.net/forum?id=B5Tp4WwZl8", "pdf_size": 1608153, "rating": "3;6;8;8", "confidence": "4;3;3;4", "soundness": "2;3;4;4", "contribution": "2;3;3;3", "presentation": "2;3;4;4", "wc_summary": "64;91;63;48", "wc_strengths": "41;30;19;39", "wc_weaknesses": "345;39;15;84", "wc_questions": "3;23;59;3", "wc_review": "453;183;156;174", "wc_reply_reviewers": "0;0;0;6", "wc_reply_authors": "2091;190;12;460", "reply_reviewers": "0;0;0;1", "reply_authors": "6;1;2;2", "rating_avg": [ 6.25, 2.0463381929681126 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 3.25, 0.82915619758885 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.25, 0.82915619758885 ], "wc_summary_avg": [ 66.5, 15.5 ], "wc_strengths_avg": [ 32.25, 8.699856320652657 ], "wc_weaknesses_avg": [ 120.75, 131.81876763192713 ], "wc_questions_avg": [ 22.0, 22.869193252058544 ], "wc_review_avg": [ 241.5, 122.49591829934579 ], "wc_reply_reviewers_avg": [ 1.5, 2.598076211353316 ], "wc_reply_authors_avg": [ 688.25, 825.4351503903865 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 
2.75, 1.920286436967152 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.3665083330689157, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:FQtWzFELb4MJ:scholar.google.com/&scioq=Error+Feedback+Shines+when+Features+are+Rare&hl=en&as_sdt=0,33", "gs_version_total": 7, "aff_unique_index": "0;0", "aff_unique_norm": "King Abdullah University of Science and Technology", "aff_unique_dep": "", "aff_unique_url": "https://www.kaust.edu.sa", "aff_unique_abbr": "KAUST", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "Saudi Arabia" }, { "id": "B5kAfAC7hO", "title": "Provable Representation with Efficient Planning for Partially Observable Reinforcement Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "In real-world reinforcement learning problems, the state information is often only partially observable, which breaks the basic assumption in Markov decision processes, and thus, leads to inferior performance. Partially Observable Markov Decision Processes have been introduced to explicitly take the issue into account for learning, exploration, and planning, but present significant computational and statistical challenges. To address these difficulties, we exploit the representation view, which leads to a coherent design framework for a practically tractable reinforcement learning algorithm upon partial observations. We provide a theoretical analysis for justifying the statistical efficiency of the proposed algorithm. We also empirically demonstrate that the proposed algorithm can surpass state-of-the-art performance with partial observations across various benchmarks, thereby pushing reliable reinforcement learning towards more practical applications.", "keywords": "reinforcement learning;partial observability;representation learning", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/fc5c4ac9bbd40be966c5edeae8b4fb523f38941d.pdf", "author": "Hongming Zhang;Tongzheng Ren;Chenjun Xiao;Dale Schuurmans;Bo Dai", "authorids": "~Hongming_Zhang3;~Tongzheng_Ren1;~Chenjun_Xiao1;~Dale_Schuurmans1;~Bo_Dai1", "gender": "M;M;;;", "homepage": "https://github.com/initial-h;https://www.cs.utexas.edu/~tzren/;https://chenjun-x.github.io/;;https://bo-dai.github.io/", "dblp": ";211/8004;178/8641;;64/2903", "google_scholar": "https://scholar.google.ca/citations?user=mwbsY3AAAAAJ;VgNDYeYAAAAJ;;;TIKl_foAAAAJ", "orcid": ";;0000-0002-5493-1500;;0009-0002-8070-574X", "linkedin": ";;;;", "or_profile": "~Hongming_Zhang3;~Tongzheng_Ren1;~Chenjun_Xiao1;~Dale_Schuurmans1;~Bo_Dai1", "aff": "University of Alberta;University of Texas, Austin;Huawei Technologies Ltd.;;Google Brain", "aff_domain": "ualberta.ca;utexas.edu;huawei.com;;google.com", "position": "PhD student;PhD student;Researcher;;Research Scientist", "bibtex": "@misc{\nzhang2024provable,\ntitle={Provable Representation with Efficient Planning for Partially Observable Reinforcement Learning},\nauthor={Hongming Zhang and Tongzheng Ren and Chenjun Xiao and Dale Schuurmans and Bo Dai},\nyear={2024},\nurl={https://openreview.net/forum?id=B5kAfAC7hO}\n}", "github": "", "project": "", "reviewers": "rUpE;wQNF;cvkF", "site": "https://openreview.net/forum?id=B5kAfAC7hO", "pdf_size": 1082436, "rating": "5;5;6", "confidence": "3;3;3", "soundness": "3;2;2", "contribution": "2;3;2", "presentation": "1;1;2", "wc_summary": "99;48;72", "wc_strengths": "58;63;142", "wc_weaknesses": "172;280;195", 
"wc_questions": "120;63;24", "wc_review": "449;454;433", "wc_reply_reviewers": "1246;0;0", "wc_reply_authors": "2250;479;457", "reply_reviewers": "3;0;0", "reply_authors": "5;1;1", "rating_avg": [ 5.333333333333333, 0.4714045207910317 ], "confidence_avg": [ 3.0, 0.0 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 1.3333333333333333, 0.4714045207910317 ], "wc_summary_avg": [ 73.0, 20.83266665599966 ], "wc_strengths_avg": [ 87.66666666666667, 38.473656210740124 ], "wc_weaknesses_avg": [ 215.66666666666666, 46.449494674921446 ], "wc_questions_avg": [ 69.0, 39.42080668885405 ], "wc_review_avg": [ 445.3333333333333, 8.9566858950296 ], "wc_reply_reviewers_avg": [ 415.3333333333333, 587.3700329056255 ], "wc_reply_authors_avg": [ 1062.0, 840.0908681009851 ], "reply_reviewers_avg": [ 1.0, 1.4142135623730951 ], "reply_authors_avg": [ 2.3333333333333335, 1.8856180831641267 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 8, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5187570997639685783&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 7, "aff_unique_index": "0;1;2;3", "aff_unique_norm": "University of Alberta;University of Texas at Austin;Huawei;Google", "aff_unique_dep": ";;Huawei Technologies;Google Brain", "aff_unique_url": "https://www.ualberta.ca;https://www.utexas.edu;https://www.huawei.com;https://brain.google.com", "aff_unique_abbr": "UAlberta;UT Austin;Huawei;Google Brain", "aff_campus_unique_index": "1;2", "aff_campus_unique": ";Austin;Mountain View", "aff_country_unique_index": "0;1;2;1", "aff_country_unique": "Canada;United States;China" }, { "title": "ToolChain*: Efficient Action Space Navigation in Large Language Models with A* Search", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19230", "id": "B6pQxqUcT8", "author_site": "Yuchen Zhuang, Xiang Chen, Tong Yu, Saayan Mitra, Victor Bursztyn, Ryan Rossi, Somdeb Sarkhel, Chao Zhang", "tldr": "", "abstract": "Large language models (LLMs) have demonstrated powerful decision-making and planning capabilities in solving complicated real-world problems. LLM-based autonomous agents can interact with diverse tools (e.g., functional APIs) and generate solution plans that execute a series of API function calls in a step-by-step manner. The multitude of candidate API function calls significantly expands the action space, amplifying the critical need for efficient action space navigation. However, existing methods either struggle with unidirectional exploration in expansive action spaces, trapped into a locally optimal solution, or suffer from exhaustively traversing all potential actions, causing inefficient navigation. To address these issues, we propose ToolChain*, an efficient tree search-based planning algorithm for LLM-based agents. It formulates the entire action space as a decision tree, where each node represents a possible API function call involved in a solution plan. By incorporating the A$^*$ search algorithm with task-specific cost function design, it efficiently prunes high-cost branches that may involve incorrect actions, identifying the most low-cost valid path as the solution. Extensive experiments on multiple tool-use and reasoning tasks demonstrate that ToolChain* efficiently balances exploration and exploitation within an expansive action space. 
It outperforms state-of-the-art baselines on planning and reasoning tasks by 3.1% and 3.5% on average while requiring 7.35x and 2.31x less time, respectively.", "keywords": "Large Language Model;Tool Use;Tree Search;A* Search", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Yuchen Zhuang;Xiang Chen;Tong Yu;Saayan Mitra;Victor Bursztyn;Ryan A. Rossi;Somdeb Sarkhel;Chao Zhang", "authorids": "~Yuchen_Zhuang1;~Xiang_Chen9;~Tong_Yu3;~Saayan_Mitra1;~Victor_Bursztyn1;~Ryan_A._Rossi2;~Somdeb_Sarkhel2;~Chao_Zhang15", "gender": "M;M;;;M;;M;", "homepage": "https://night-chen.github.io/;;https://www.linkedin.com/in/tong-yu-42790744;;https://vbursztyn.github.io/;;http://www.utdallas.edu/~somdeb.sarkhel/;http://chaozhang.org/", "dblp": "191/5231.html;;32/1593-1;;154/7800.html;;138/5583;94/3019-14", "google_scholar": "T-f6XlEAAAAJ;aPq10m4AAAAJ;https://scholar.google.com/citations?hl=en;;HRx3epUAAAAJ;;ZrJWmUoAAAAJ;https://scholar.google.com/citations?hl=en", "orcid": ";;0000-0002-5991-2050;;;;0009-0006-2055-9647;0000-0003-3009-598X", "linkedin": ";;tong-yu-42790744;;;;somdebsarkhel;", "or_profile": "~Yuchen_Zhuang1;~Xiang_Chen9;~Tong_Yu3;~Saayan_Mitra1;~Victor_Bursztyn1;~Ryan_A._Rossi2;~Somdeb_Sarkhel2;~Chao_Zhang15", "aff": "Georgia Institute of Technology;Adobe Systems;Adobe Research;;Adobe Systems;;Adobe Research;Georgia Institute of Technology", "aff_domain": "gatech.edu;adobe.com;adobe.com;;adobe.com;;adobe.com;gatech.edu", "position": "PhD student;Researcher;Senior Research Scientist;;Researcher;;Research Scientist;Assistant Professor", "bibtex": "@inproceedings{\nzhuang2024toolchain,\ntitle={ToolChain*: Efficient Action Space Navigation in Large Language Models with A* Search},\nauthor={Yuchen Zhuang and Xiang Chen and Tong Yu and Saayan Mitra and Victor Bursztyn and Ryan A. 
Rossi and Somdeb Sarkhel and Chao Zhang},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=B6pQxqUcT8}\n}", "github": "", "project": "", "reviewers": "tHXf;7Kjr;52p8;gdT8", "pdf_size": 809133, "rating": "6;8;8;8", "confidence": "4;5;3;3", "soundness": "3;4;3;4", "contribution": "2;4;3;4", "presentation": "4;4;3;4", "wc_summary": "65;84;141;97", "wc_strengths": "27;124;101;58", "wc_weaknesses": "17;26;184;78", "wc_questions": "133;93;232;96", "wc_review": "242;327;658;329", "wc_reply_reviewers": "91;23;0;13", "wc_reply_authors": "680;471;2983;1632", "reply_reviewers": "1;1;0;1", "reply_authors": "2;2;6;4", "rating_avg": [ 7.5, 0.8660254037844386 ], "confidence_avg": [ 3.75, 0.82915619758885 ], "soundness_avg": [ 3.5, 0.5 ], "contribution_avg": [ 3.25, 0.82915619758885 ], "presentation_avg": [ 3.75, 0.4330127018922193 ], "wc_summary_avg": [ 96.75, 27.9676152004421 ], "wc_strengths_avg": [ 77.5, 37.566607512523674 ], "wc_weaknesses_avg": [ 76.25, 66.42429901775404 ], "wc_questions_avg": [ 138.5, 56.233886580957574 ], "wc_review_avg": [ 389.0, 159.2278242016765 ], "wc_reply_reviewers_avg": [ 31.75, 35.16656793035112 ], "wc_reply_authors_avg": [ 1441.5, 991.7490862108218 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 3.5, 1.6583123951777 ], "replies_avg": [ 27, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": -0.17407765595569782, "gs_citation": 52, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=1777782046065029064&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=B6pQxqUcT8", "pdf": "https://openreview.net/pdf?id=B6pQxqUcT8", "email": "gatech.edu;adobe.com;adobe.com;;adobe.com;;adobe.com;gatech.edu", "author_num": 8, "aff_unique_index": "0;1;1;1;1;0", "aff_unique_norm": "Georgia Institute of Technology;Adobe", "aff_unique_dep": ";Adobe Systems Incorporated", "aff_unique_url": "https://www.gatech.edu;https://www.adobe.com", "aff_unique_abbr": "Georgia Tech;Adobe", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "B6t5wy6g5a", "title": "Aligning Large Multimodal Models with Factually Augmented RLHF", "track": "main", "status": "Reject", "tldr": "", "abstract": "Large Multimodal Models (LMM) are built across modalities and the misalignment between two modalities can result in ``hallucination'', generating textual outputs that are not grounded by the multimodal information in context. To address the multimodal misalignment issue, we adapt the Reinforcement Learning from Human Feedback (RLHF) from the text domain to the vision-language alignment, where human annotators are asked to compare two responses and pinpoint the more hallucinated one, and the vision-language model is trained to maximize the simulated human rewards. We propose a new alignment algorithm called Factually Augmented RLHF that augments the reward model with additional factual information such as image captions and ground-truth multi-choice options, which alleviates the reward hacking phenomenon in RLHF and further improves the performance. We also enhance the GPT-4-generated training data (for vision instruction tuning) with previously available human-written image-text pairs to improve the general capabilities of our model. 
To evaluate the proposed approach in real-world scenarios, we develop a new evaluation benchmark MMHAL-BENCH with a special focus on penalizing hallucinations. As the first LMM trained with RLHF, our approach achieves remarkable improvement on the LLaVA-Bench\ndataset with the 96% performance level of the text-only GPT-4 (while previous best methods can only achieve the 87% level), and an improvement of 60% on MMHAL-BENCH over other baselines", "keywords": "AI Alignment;Large Multimodal Models;RLHF", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/6d4dd4d9d307ffd69f22ae293cbcf93dd5b96315.zip", "author": "Zhiqing Sun;Sheng Shen;Shengcao Cao;Haotian Liu;Chunyuan Li;Yikang Shen;Chuang Gan;Liangyan Gui;Yu-Xiong Wang;Yiming Yang;Kurt Keutzer;Trevor Darrell", "authorids": "~Zhiqing_Sun1;~Sheng_Shen2;~Shengcao_Cao1;~Haotian_Liu1;~Chunyuan_Li1;~Yikang_Shen1;~Chuang_Gan1;~Liangyan_Gui1;~Yu-Xiong_Wang1;~Yiming_Yang1;~Kurt_Keutzer1;~Trevor_Darrell2", "gender": "M;M;M;;;M;M;F;;F;M;M", "homepage": "https://www.cs.cmu.edu/~zhiqings/;https://sincerass.github.io;https://shengcao-cao.github.io/;https://hliu.cc;http://chunyuan.li/;;http://people.csail.mit.edu/ganchuang/;;https://yxw.cs.illinois.edu/;http://www.cs.cmu.edu/~yiming/;https://people.eecs.berkeley.edu/~keutzer/;https://people.eecs.berkeley.edu/~trevor/", "dblp": "211/7692;138/5764-1.html;236/4681;66/10511;64/9590;152/8226;139/6993;155/5055;35/10700;25/1666;k/KurtKeutzer.html;d/TrevorDarrell", "google_scholar": "https://scholar.google.com/citations?hl=en;https://scholar.google.com/citations?hl=en;yMYTz3AAAAAJ;Xo6wfnQAAAAJ;Zd7WmXUAAAAJ;qff5rRYAAAAJ;PTeSCbIAAAAJ;3aE0r9QAAAAJ;T_Q-xDkAAAAJ;MlZq4XwAAAAJ;ID9QePIAAAAJ;https://scholar.google.com.tw/citations?user=bh-uRFMAAAAJ", "orcid": ";;;;;;;;;0000-0001-8322-607X;0000-0003-3868-8501;", "linkedin": "zhiqing-sun-5781b3100/;sheng-s-ab198a174/;;;;;;;;yiming-yang-24100924/;kurtkeutzer/;", "or_profile": "~Zhiqing_Sun1;~Sheng_Shen2;~Shengcao_Cao1;~Haotian_Liu1;~Chunyuan_Li1;~Yikang_Shen1;~Chuang_Gan1;~Liangyan_Gui1;~Yu-Xiong_Wang1;~Yiming_Yang1;~Kurt_Keutzer1;~trevor_darrell1", "aff": "Carnegie Mellon University;University of California, Berkeley;Adobe Systems;Department of Computer Science, University of Wisconsin - Madison;Microsoft Research;International Business Machines;University of Massachusetts at Amherst;UIUC;Department of Computer Science, University of Illinois Urbana-Champaign;School of Computer Science, Carnegie Mellon University;University of California, Berkeley;Electrical Engineering & Computer Science Department", "aff_domain": "cs.cmu.edu;berkeley.edu;adobe.com;cs.wisc.edu;microsoft.com;ibm.com;umass.edu;cs.illinois.edu;cs.illinois.edu;cs.cmu.edu;berkeley.edu;eecs.berkeley.edu", "position": "PhD student;PhD student;Intern;PhD student;Principal Researcher;Researcher;Assistant Professor;Assistant Professor;Assistant Professor;Full Professor;Full Professor;Professor", "bibtex": "@misc{\nsun2024aligning,\ntitle={Aligning Large Multimodal Models with Factually Augmented {RLHF}},\nauthor={Zhiqing Sun and Sheng Shen and Shengcao Cao and Haotian Liu and Chunyuan Li and Yikang Shen and Chuang Gan and Liangyan Gui and Yu-Xiong Wang and Yiming Yang and Kurt Keutzer and Trevor Darrell},\nyear={2024},\nurl={https://openreview.net/forum?id=B6t5wy6g5a}\n}", "github": "", "project": "", "reviewers": "Kjps;Y7nK;XL3H;vv7w", "site": "https://openreview.net/forum?id=B6t5wy6g5a", "pdf_size": 4291360, "rating": "3;5;6;6", 
"confidence": "3;3;4;4", "soundness": "3;2;3;3", "contribution": "2;2;3;3", "presentation": "1;3;2;3", "wc_summary": "247;181;46;46", "wc_strengths": "45;49;80;55", "wc_weaknesses": "45;193;74;113", "wc_questions": "71;4;2;42", "wc_review": "408;427;202;256", "wc_reply_reviewers": "0;137;0;0", "wc_reply_authors": "266;1215;271;355", "reply_reviewers": "0;1;0;0", "reply_authors": "1;2;1;1", "rating_avg": [ 5.0, 1.224744871391589 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.25, 0.82915619758885 ], "wc_summary_avg": [ 130.0, 87.18084652032235 ], "wc_strengths_avg": [ 57.25, 13.608361400256829 ], "wc_weaknesses_avg": [ 106.25, 55.59395200918891 ], "wc_questions_avg": [ 29.75, 28.656369274560934 ], "wc_review_avg": [ 323.25, 96.39858660789587 ], "wc_reply_reviewers_avg": [ 34.25, 59.322740159234044 ], "wc_reply_authors_avg": [ 526.75, 398.93130674340415 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 12, 0 ], "corr_rating_confidence": 0.8164965809277259, "gs_citation": 310, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=17054470781093797244&as_sdt=40005&sciodt=0,10&hl=en", "gs_version_total": 10, "aff_unique_index": "0;1;2;3;4;5;6;7;7;0;1;8", "aff_unique_norm": "Carnegie Mellon University;University of California, Berkeley;Adobe;University of Wisconsin-Madison;Microsoft;International Business Machines Corporation;University of Massachusetts Amherst;University of Illinois Urbana-Champaign;Electrical Engineering & Computer Science Department", "aff_unique_dep": ";;Adobe Systems Incorporated;Department of Computer Science;Microsoft Research;;;;Electrical Engineering & Computer Science", "aff_unique_url": "https://www.cmu.edu;https://www.berkeley.edu;https://www.adobe.com;https://www.wisc.edu;https://www.microsoft.com/en-us/research;https://www.ibm.com;https://www.umass.edu;https://www illinois.edu;", "aff_unique_abbr": "CMU;UC Berkeley;Adobe;UW-Madison;MSR;IBM;UMass Amherst;UIUC;", "aff_campus_unique_index": "1;2;3;4;4;5;1", "aff_campus_unique": ";Berkeley;Madison;Amherst;Urbana-Champaign;Pittsburgh", "aff_country_unique_index": "0;0;0;0;0;0;0;0;0;0;0", "aff_country_unique": "United States;" }, { "id": "B8FA2ixkPN", "title": "GML-NeRF: Gate-guided Mutual Learning Framework for Neural Rendering", "track": "main", "status": "Reject", "tldr": "", "abstract": "Although the neural radiance field (NeRF) exhibits high-fidelity visualization on the rendering task, it still suffers from rendering defects in complex scenes. One of the primary reasons is the limited model capacity. However, directly increasing the network's width and depth cannot significantly improve the rendering quality. To address this issue, existing work adopts scene partitioning and assigns different 3D points to different network parameters. However, a 3D point may be invisible to some rays due to occlusions in complex scenes. On such a point, training with those rays that do not contain valid information about the point might interfere with the NeRF training. Based on the above intuition, we allocate model parameters in the ray dimension and propose a Gate-guided Mutual Learning framework for neural rendering (GML-NeRF). Specifically, we construct an ensemble of sub-NeRFs and train a soft gate module to assign the gating scores to these sub-NeRFs based on specific rays. 
The gate module is jointly optimized with the sub-NeRF ensemble, enabling it to learn the preference of sub-NeRFs for different rays automatically. Furthermore, we introduce depth-based mutual learning to enhance the rendering consistency among multiple sub-NeRFs and mitigate the depth ambiguity. Experiments on five diverse datasets demonstrate that GML-NeRF can enhance the rendering performance across a wide range of scene types compared with existing single-NeRF and multi-NeRF methods.", "keywords": "Neural rendering field;Mutual learning;Novel view synthesis;Soft gate module;Complex scenes with occlusions", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/b7bf1ebeba43dc63e6dbfdf5967837783eadc7d7.zip", "author": "Lidong Guo;Xuefei Ning;Yonggan Fu;Tianchen Zhao;Zhuoliang Kang;Jincheng Yu;Yingyan Celine Lin;Yu Wang", "authorids": "~Lidong_Guo1;~Xuefei_Ning1;~Yonggan_Fu1;~Tianchen_Zhao2;~Zhuoliang_Kang3;~Jincheng_Yu2;~Yingyan_Celine_Lin1;~Yu_Wang3", "gender": "M;Not Specified;M;M;M;M;M;F", "homepage": ";https://nics-effalg.com/ningxuefei/;https://www.yongganfu.com/;https://nicsefc.ee.tsinghua.edu.cn/people/tianchen-zhao/;https://zhuoliang.me/;http://nicsefc.ee.tsinghua.edu.cn/people/JinchengYu;https://nicsefc.ee.tsinghua.edu.cn;https://eiclab.scs.gatech.edu/", "dblp": "233/2101;202/9525;244/8166;217/2471;;;w/YuWang2.html;120/6981", "google_scholar": ";oVslpJsAAAAJ;https://scholar.google.com/citations?hl=en;;W1ZXjMkAAAAJ;1UDGpucAAAAJ;https://scholar.google.com.hk/citations?user=j8JGVvoAAAAJ;dio8IesAAAAJ", "orcid": "0000-0003-4162-6360;;;;;;0000-0001-6108-5157;", "linkedin": ";;yonggan-fu-b211831b0;;;;;yingyan-celine-lin-a281211a/", "or_profile": "~Lidong_Guo1;~Xuefei_Ning1;~Yonggan_Fu1;~Tianchen_Zhao2;~Zhuoliang_Kang3;~Jincheng_Yu2;~Yu_Wang3;~Yingyan_Lin1", "aff": "Tsinghua University;Tsinghua University;Georgia Institute of Technology;Infinigence;Meituan;;Tsinghua University;Georgia Institute of Technology", "aff_domain": "tsinghua.edu.cn;tsinghua.edu.cn;gatech.edu;infini-ai.com;meituan.com;;tsinghua.edu.cn;gatech.edu", "position": "PhD student;Research Assistant Professor;PhD student;Intern;Researcher;;Full Professor;Associate Professor", "bibtex": "@misc{\nguo2024gmlnerf,\ntitle={{GML}-Ne{RF}: Gate-guided Mutual Learning Framework for Neural Rendering},\nauthor={Lidong Guo and Xuefei Ning and Yonggan Fu and Tianchen Zhao and Zhuoliang Kang and Jincheng Yu and Yingyan Celine Lin and Yu Wang},\nyear={2024},\nurl={https://openreview.net/forum?id=B8FA2ixkPN}\n}", "github": "", "project": "", "reviewers": "Vfdc;3Q2w;PcY6;MyQ8", "site": "https://openreview.net/forum?id=B8FA2ixkPN", "pdf_size": 7938395, "rating": "5;5;5;5", "confidence": "4;2;3;5", "soundness": "2;2;3;2", "contribution": "2;3;2;2", "presentation": "3;2;2;3", "wc_summary": "109;51;109;93", "wc_strengths": "68;57;12;79", "wc_weaknesses": "124;425;331;329", "wc_questions": "111;6;72;7", "wc_review": "412;539;524;508", "wc_reply_reviewers": "0;62;0;0", "wc_reply_authors": "762;1385;1145;1027", "reply_reviewers": "0;1;0;0", "reply_authors": "3;5;4;4", "rating_avg": [ 5.0, 0.0 ], "confidence_avg": [ 3.5, 1.118033988749895 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 90.5, 23.722352328552915 ], "wc_strengths_avg": [ 54.0, 25.465663156493687 ], "wc_weaknesses_avg": [ 302.25, 109.98039598037461 ], "wc_questions_avg": [ 49.0, 44.68221122549778 ], "wc_review_avg": [ 495.75, 
49.58011194017214 ], "wc_reply_reviewers_avg": [ 15.5, 26.846787517317598 ], "wc_reply_authors_avg": [ 1079.75, 224.2670004704214 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 4.0, 0.7071067811865476 ], "replies_avg": [ 24, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:kLGKA6GXkFwJ:scholar.google.com/&scioq=GML-NeRF:+Gate-guided+Mutual+Learning+Framework+for+Neural+Rendering&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;0;1;2;3;0;1", "aff_unique_norm": "Tsinghua University;Georgia Institute of Technology;Infinigence;Meituan", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.tsinghua.edu.cn;https://www.gatech.edu;;https://www.meituan.com", "aff_unique_abbr": "THU;Georgia Tech;;Meituan", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;1;0;0;1", "aff_country_unique": "China;United States;" }, { "title": "Compressing LLMs: The Truth is Rarely Pure and Never Simple", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19229", "id": "B9klVS7Ddk", "author_site": "AJAY JAISWAL, Zhe Gan, Xianzhi Du, Bowen Zhang, Zhangyang Wang, Yinfei Yang", "tldr": "", "abstract": "Despite their remarkable achievements, modern Large Language Models (LLMs) encounter exorbitant computational and memory footprints. Recently, several works have shown significant success in *training-free* and *data-free* compression (pruning and quantization) of LLMs achieving 50-60\\% sparsity and reducing the bit-width down to 3 or 4 bits per weight, with negligible perplexity degradation over the uncompressed baseline. As recent research efforts are focused on developing increasingly sophisticated compression methods, our work takes a step back, and re-evaluates the effectiveness of existing SoTA compression methods, which rely on a fairly simple and widely questioned metric, perplexity (even for dense LLMs). We introduce **K**nowledge-**I**ntensive **C**ompressed LLM Benchmar**K** **(LLM-KICK)**, a collection of carefully-curated tasks to re-define the evaluation protocol for compressed LLMs, which have significant alignment with their dense counterparts, and perplexity fail to capture subtle change in their true capabilities. LLM-KICK unveils many favorable merits and unfortunate plights of current SoTA compression methods: all pruning methods suffer significant performance degradation, sometimes at trivial sparsity ratios (*e.g.*, 25-30\\%), and fail for N:M sparsity on knowledge-intensive tasks; current quantization methods are more successful than pruning; yet, pruned LLMs even at $\\geq 50$\\% sparsity are robust in-context retrieval and summarization systems; among others. LLM-KICK is designed to holistically access compressed LLMs' ability for language understanding, reasoning, generation, in-context retrieval, in-context summarization, *etc.* We hope our study can foster the development of better LLM compression methods. 
The reproduced codes are available at https://github.com/VITA-Group/llm-kick.", "keywords": "Compression;Large Language Models;Pruning;Quantization", "primary_area": "datasets and benchmarks", "supplementary_material": "", "author": "AJAY KUMAR JAISWAL;Zhe Gan;Xianzhi Du;Bowen Zhang;Zhangyang Wang;Yinfei Yang", "authorids": "~AJAY_KUMAR_JAISWAL1;~Zhe_Gan1;~Xianzhi_Du4;~Bowen_Zhang2;~Zhangyang_Wang1;~Yinfei_Yang1", "gender": "M;M;M;M;M;", "homepage": "https://ajay1994.github.io/;http://zhegan27.github.io/;;https://zbwglory.github.io;https://vita-group.github.io;", "dblp": "30/9707;41/7845;;85/7433-2;119/4026;117/4082", "google_scholar": "I783HxYAAAAJ;E64XWyMAAAAJ;l1hP40AAAAAJ;nI3cKV8AAAAJ;pxFyKAIAAAAJ;kvDbu90AAAAJ", "orcid": ";;;;;", "linkedin": ";zhe-gan-a2229a78/;xianzhi-du-1b128934/;;;", "or_profile": "~AJAY_KUMAR_JAISWAL1;~Zhe_Gan1;~Xianzhi_Du4;~Bowen_Zhang2;~Zhangyang_Wang1;~Yinfei_Yang1", "aff": "University of Texas, Austin;Apple;Apple;Apple;University of Texas at Austin;Apple", "aff_domain": "utexas.edu;apple.com;apple.com;apple.com;utexas.edu;apple.com", "position": "PhD student;Principal Researcher;Researcher;Research Scientist;Associate Professor;Researcher", "bibtex": "@inproceedings{\njaiswal2024compressing,\ntitle={Compressing {LLM}s: The Truth is Rarely Pure and Never Simple},\nauthor={AJAY KUMAR JAISWAL and Zhe Gan and Xianzhi Du and Bowen Zhang and Zhangyang Wang and Yinfei Yang},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=B9klVS7Ddk}\n}", "github": "", "project": "", "reviewers": "PUep;X7p4;b73d;QryF", "pdf_size": 1165142, "rating": "5;6;8;8", "confidence": "4;4;4;4", "soundness": "3;3;3;3", "contribution": "3;2;3;3", "presentation": "3;4;3;3", "wc_summary": "16;27;100;54", "wc_strengths": "25;89;71;61", "wc_weaknesses": "119;68;83;13", "wc_questions": "10;37;22;1", "wc_review": "170;221;276;129", "wc_reply_reviewers": "81;0;0;0", "wc_reply_authors": "873;770;504;119", "reply_reviewers": "1;0;0;0", "reply_authors": "3;2;1;1", "rating_avg": [ 6.75, 1.299038105676658 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 49.25, 32.39888115352134 ], "wc_strengths_avg": [ 61.5, 23.339880033967614 ], "wc_weaknesses_avg": [ 70.75, 38.14691992808856 ], "wc_questions_avg": [ 17.5, 13.5 ], "wc_review_avg": [ 199.0, 55.122590650295095 ], "wc_reply_reviewers_avg": [ 20.25, 35.074028853269766 ], "wc_reply_authors_avg": [ 566.5, 291.34043660295424 ], "reply_reviewers_avg": [ 0.25, 0.4330127018922193 ], "reply_authors_avg": [ 1.75, 0.82915619758885 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 40, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=15743144799258029889&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=B9klVS7Ddk", "pdf": "https://openreview.net/pdf?id=B9klVS7Ddk", "email": "utexas.edu;apple.com;apple.com;apple.com;utexas.edu;apple.com", "author_num": 6, "aff_unique_index": "0;1;1;1;0;1", "aff_unique_norm": "University of Texas at Austin;Apple", "aff_unique_dep": ";Apple Inc.", "aff_unique_url": "https://www.utexas.edu;https://www.apple.com", "aff_unique_abbr": "UT Austin;Apple", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Austin;", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "United States" }, { "id": 
"BAX3NXJ6vU", "title": "Escaping Saddle Point Efficiently in Minimax and Bilevel Optimizations", "track": "main", "status": "Reject", "tldr": "", "abstract": "Hierarchical optimization (including minimax optimization and bilevel optimization) is attracting significant attentions as it can be broadly applied to many machine learning tasks such as adversarial training, policy optimization, meta-learning and hyperparameter optimization. Recently, many algorithms have been studied to improve the theoretical analysis results of minimax and bilevel optimizations. Among these works, one of the most crucial issues is to escape saddle point and find local minimum, which is also of importance in conventional nonconvex optimization. In this paper, thus, we focus on investigating the methods to achieve second-order stationary point for nonconvex-strongly-concave minimax optimization and nonconvex-strongly-convex bilevel optimization. Specifically, we propose a new algorithm named PRGDA via perturbed stochastic gradient which does not require the computation of second order derivatives. In stochastic nonconvex-strongly-concave minimax optimization, we prove that our algorithm can find an $O(\\epsilon, \\sqrt{\\rho_{\\Phi} \\epsilon})$ second-order stationary point within gradient complexity of $\\tilde{O} (\\kappa^3 \\epsilon^{-3})$, which matches state-of-the-art to find first-order stationary point. To our best knowledge, our algorithm is the first stochastic algorithm that is guaranteed to obtain the second-order stationary point for nonconvex minimax problems. Besides, in stochastic nonconvex-strongly-convex bilevel optimization, our method also achieves better gradient complexity of $Gc(f, \\epsilon) = \\tilde{O}(\\kappa^3 \\epsilon^{-3})$ and $Gc(g, \\epsilon) = \\tilde{O}(\\kappa^7 \\epsilon^{-3})$ to find local minimum. 
Finally, we conduct a numerical experiment to validate the performance of our new method.", "keywords": "saddle point;minimax optimization;bilevel optimization", "primary_area": "optimization", "supplementary_material": "/attachment/ff6c97761f73a1c540d5d504c7604545bc0b51b1.zip", "author": "Wenhan Xian;Feihu Huang;Heng Huang", "authorids": "~Wenhan_Xian1;~Feihu_Huang1;~Heng_Huang1", "gender": "M;M;M", "homepage": ";;https://www.cs.umd.edu/~heng/", "dblp": "246/3134;169/6247;03/281", "google_scholar": ";tRQwlHUAAAAJ;4OqLaDwAAAAJ", "orcid": ";0000-0003-0806-6074;", "linkedin": "wenhan-xian-3392ba170;;", "or_profile": "~Wenhan_Xian1;~Feihu_Huang1;~Heng_Huang1", "aff": "University of Maryland, College Park;Nanjing University of Aeronautics and Astronautics;Department of Computer Science, University of Maryland, College Park", "aff_domain": "umd.edu;nuaa.edu.cn;cs.umd.edu", "position": "PhD student;Full Professor;Full Professor", "bibtex": "@misc{\nxian2024escaping,\ntitle={Escaping Saddle Point Efficiently in Minimax and Bilevel Optimizations},\nauthor={Wenhan Xian and Feihu Huang and Heng Huang},\nyear={2024},\nurl={https://openreview.net/forum?id=BAX3NXJ6vU}\n}", "github": "", "project": "", "reviewers": "tUHe;JNob;5LK2", "site": "https://openreview.net/forum?id=BAX3NXJ6vU", "pdf_size": 1039506, "rating": "5;5;6", "confidence": "3;3;3", "soundness": "3;2;3", "contribution": "2;2;3", "presentation": "3;1;2", "wc_summary": "112;51;57", "wc_strengths": "46;20;49", "wc_weaknesses": "475;409;167", "wc_questions": "9;5;246", "wc_review": "642;485;519", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "553;411;197", "reply_reviewers": "0;0;0", "reply_authors": "1;1;1", "rating_avg": [ 5.333333333333333, 0.4714045207910317 ], "confidence_avg": [ 3.0, 0.0 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.0, 0.816496580927726 ], "wc_summary_avg": [ 73.33333333333333, 27.450966386551052 ], "wc_strengths_avg": [ 38.333333333333336, 13.021349989749739 ], "wc_weaknesses_avg": [ 350.3333333333333, 132.4067806252971 ], "wc_questions_avg": [ 86.66666666666667, 112.67751427069298 ], "wc_review_avg": [ 548.6666666666666, 67.44050876307371 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 387.0, 146.3238417574753 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 8, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:GrriULR_qzMJ:scholar.google.com/&scioq=Escaping+Saddle+Point+Efficiently+in+Minimax+and+Bilevel+Optimizations&hl=en&as_sdt=0,5", "gs_version_total": 2, "aff_unique_index": "0;1;2", "aff_unique_norm": "University of Maryland;Nanjing University of Aeronautics and Astronautics;University of Maryland, College Park", "aff_unique_dep": ";;Department of Computer Science", "aff_unique_url": "https://www.umd.edu;http://www.nuaa.edu.cn;https://www.umd.edu", "aff_unique_abbr": "UMD;NUAA;UMD", "aff_campus_unique_index": "0;0", "aff_campus_unique": "College Park;", "aff_country_unique_index": "0;1;0", "aff_country_unique": "United States;China" }, { "id": "BBD4cFDKxQ", "title": "AdaProj: Adaptively Scaled Angular Margin Subspace Projections for Anomaly Detection with Auxiliary Classification Tasks", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "One of the state-of-the-art approaches for semi-supervised anomaly detection is to first learn an
embedding space and then estimate the distribution of normal data. This can be done by using one-class losses or by using auxiliary classification tasks based on meta information or self-supervised learning. Angular margin losses are a popular training objective because they increase intra-class similarity and avoid learning trivial solutions by reducing inter-class similarity. In this work, AdaProj a novel loss function that generalizes upon angular margin losses is presented. In contrast to angular margin losses, which project data of each class as close as possible to their corresponding class centers, AdaProj learns to project data onto class-specific subspaces. By doing so, the resulting distributions of embeddings belonging to normal data are not required to be as restrictive as other loss functions allowing a more detailed view on the data. This enables a system to more accurately detect anomalous samples during testing. In experiments conducted on the DCASE2022 and DCASE2023 datasets, it is shown that using AdaProj to learn an embedding space significantly outperforms other commonly used loss functions achieving a new state-of-the-art performance on the DCASE2023 dataset.", "keywords": "representation learning;anomaly detection;semi-supervised learning;angular margin loss", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Kevin Wilkinghoff", "authorids": "~Kevin_Wilkinghoff1", "gender": "M", "homepage": "https://wilkinghoff.com/", "dblp": "207/9559", "google_scholar": "https://scholar.google.de/citations?user=UKE_q8wAAAAJ", "orcid": "0000-0003-4200-9129", "linkedin": "kevin-wilkinghoff/", "or_profile": "~Kevin_Wilkinghoff1", "aff": "Fraunhofer FKIE", "aff_domain": "fkie.fraunhofer.de", "position": "Researcher", "bibtex": "@misc{\nwilkinghoff2024adaproj,\ntitle={AdaProj: Adaptively Scaled Angular Margin Subspace Projections for Anomaly Detection with Auxiliary Classification Tasks},\nauthor={Kevin Wilkinghoff},\nyear={2024},\nurl={https://openreview.net/forum?id=BBD4cFDKxQ}\n}", "github": "", "project": "", "reviewers": "3pzd;RkC3;PZSP;t49Z", "site": "https://openreview.net/forum?id=BBD4cFDKxQ", "pdf_size": 214829, "rating": "3;3;5;6", "confidence": "4;4;3;4", "soundness": "2;2;2;2", "contribution": "1;2;2;2", "presentation": "2;1;2;2", "wc_summary": "118;53;42;137", "wc_strengths": "49;19;32;86", "wc_weaknesses": "166;203;102;102", "wc_questions": "32;2;7;2", "wc_review": "365;277;183;327", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.25, 1.299038105676658 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 1.75, 0.4330127018922193 ], "wc_summary_avg": [ 87.5, 40.74616546375867 ], "wc_strengths_avg": [ 46.5, 25.16445906432324 ], "wc_weaknesses_avg": [ 143.25, 43.27455950093542 ], "wc_questions_avg": [ 10.75, 12.43734296383275 ], "wc_review_avg": [ 288.0, 68.18357573492314 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 1, 0 ], "corr_rating_confidence": -0.3333333333333333, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=9065947214425446785&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 0, "aff_unique_index": "0", 
"aff_unique_norm": "Fraunhofer Institute for Communication, Information Processing and Ergonomics", "aff_unique_dep": "", "aff_unique_url": "https://www.fkie.fraunhofer.de/", "aff_unique_abbr": "FKIE", "aff_country_unique_index": "0", "aff_country_unique": "Germany" }, { "title": "Hybrid Directional Graph Neural Network for Molecules", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19228", "id": "BBD6KXIGJL", "author_site": "Junyi An, Chao Qu, Zhipeng Zhou, Fenglei Cao, Xu Yinghui, Yuan Qi, Furao Shen", "tldr": "", "abstract": "Equivariant message passing neural networks have emerged as the prevailing approach for predicting chemical properties of molecules due to their ability to leverage translation and rotation symmetries, resulting in a strong inductive bias. However, the equivariant operations in each layer can impose excessive constraints on the function form and network flexibility. To address these challenges, we introduce a novel network called the Hybrid Directional Graph Neural Network (HDGNN), which effectively combines strictly equivariant operations with learnable modules. We evaluate the performance of HDGNN on the QM9 dataset and the IS2RE dataset of OC20, demonstrating its state-of-the-art performance on several tasks and competitive performance on others. Our code is anonymously released on https://github.com/ajy112/HDGNN.", "keywords": "Graph Neural Networks; Equivariance; Molecular model", "primary_area": "learning on graphs and other geometries & topologies", "supplementary_material": "/attachment/bc98d38347f0c395dece9bd36609fe3ae80bf6a0.pdf", "author": "Junyi An;Chao Qu;Zhipeng Zhou;Fenglei Cao;Xu Yinghui;Yuan Qi;Furao Shen", "authorids": "~Junyi_An1;~Chao_Qu3;~Zhipeng_Zhou3;~Fenglei_Cao1;~Xu_Yinghui3;~Yuan_Qi2;~Furao_Shen1", "gender": "M;M;M;M;M;M;M", "homepage": ";;;https://www.infotech.ai;;https://cs.nju.edu.cn/58/05/c2639a153605/page.htm;https://www.google.com.hk/webhp?hl=en&sa=X&ved=0ahUKEwjBm6iTvd7tAhUhqlkKHT10DS0QPAgI", "dblp": "254/1449.html;;;;;80/4685;", "google_scholar": "https://scholar.google.com/citations?hl=zh-CN;DI2NyPsAAAAJ;Ot0PPAcAAAAJ;;;https://scholar.google.com.tw/citations?user=bjSi-dIAAAAJ;https://scholar.google.com.hk/citations?user=CTdXJYwAAAAJ", "orcid": ";;;;;;", "linkedin": ";;;;yuan-alan-qi-30ba1b4/;;", "or_profile": "~Junyi_An1;~Chao_Qu3;~Zhipeng_Zhou3;~Fenglei_Cao1;~Yuan_Qi2;~Shen_Furao1;~Xu_Yinghui2", "aff": "Nanjing University;Inftech;INF (Shanghai) Technology Co., LTD;;Fudan University;Nanjing University;Fudan University", "aff_domain": "nju.edu.cn;inftech.ai;inftech.ai;;fudan.edu.cn;nju.edu.cn;fudan.edu.cn", "position": "PhD student;Researcher;Researcher;;Full Professor;Full Professor;Full Professor", "bibtex": "@inproceedings{\nan2024hybrid,\ntitle={Hybrid Directional Graph Neural Network for Molecules},\nauthor={Junyi An and Chao Qu and Zhipeng Zhou and Fenglei Cao and Xu Yinghui and Yuan Qi and Furao Shen},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=BBD6KXIGJL}\n}", "github": "", "project": "", "reviewers": "Liwe;yQB9;rs3C", "pdf_size": 578867, "rating": "6;8;8", "confidence": "2;2;4", "soundness": "2;3;2", "contribution": "2;3;3", "presentation": "3;3;3", "wc_summary": "63;39;177", "wc_strengths": "18;14;45", "wc_weaknesses": "42;1;1569", "wc_questions": "58;1;22", "wc_review": "181;55;1813", "wc_reply_reviewers": "0;0;1424", "wc_reply_authors": "635;23;4491", "reply_reviewers": "0;0;6", "reply_authors": 
"1;1;9", "rating_avg": [ 7.333333333333333, 0.9428090415820634 ], "confidence_avg": [ 2.6666666666666665, 0.9428090415820634 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 93.0, 60.199667773169644 ], "wc_strengths_avg": [ 25.666666666666668, 13.767917618708921 ], "wc_weaknesses_avg": [ 537.3333333333334, 729.6904975551088 ], "wc_questions_avg": [ 27.0, 23.53720459187964 ], "wc_review_avg": [ 683.0, 800.6847069852153 ], "wc_reply_reviewers_avg": [ 474.6666666666667, 671.2800376064291 ], "wc_reply_authors_avg": [ 1716.3333333333333, 1977.8300117946324 ], "reply_reviewers_avg": [ 2.0, 2.8284271247461903 ], "reply_authors_avg": [ 3.6666666666666665, 3.7712361663282534 ], "replies_avg": [ 23, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": 0.5, "gs_citation": 3, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=14475517015581943774&as_sdt=20000005&sciodt=0,21&hl=en", "gs_version_total": 2, "openreview": "https://openreview.net/forum?id=BBD6KXIGJL", "pdf": "https://openreview.net/pdf?id=BBD6KXIGJL", "email": "nju.edu.cn;inftech.ai;inftech.ai;;fudan.edu.cn;nju.edu.cn;fudan.edu.cn", "author_num": 7, "aff_unique_index": "0;1;2;3;0;3", "aff_unique_norm": "Nanjing University;Inftech;INF Technology Co., LTD;Fudan University", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.nju.edu.cn;;;https://www.fudan.edu.cn", "aff_unique_abbr": "Nanjing U;;;Fudan", "aff_campus_unique_index": "1", "aff_campus_unique": ";Shanghai", "aff_country_unique_index": "0;0;0;0;0", "aff_country_unique": "China;" }, { "id": "BC4AUywMow", "title": "Zero-Level-Set Encoder for Neural Distance Fields", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Neural shape representation generally refers to representing 3D geometry using neural networks, e.g., to compute a signed distance or occupancy value at a specific spatial position. Previous methods tend to rely on the auto-decoder paradigm, which often requires densely-sampled and accurate signed distances to be known during training and testing, as well as an additional optimization loop during inference. This introduces a lot of computational overhead, in addition to having to compute signed distances analytically, even during testing. In this paper, we present a novel encoder-decoder neural network for embedding 3D shapes in a single forward pass. Our architecture is based on a multi-scale hybrid system incorporating graph-based and voxel-based components, as well as a continuously differentiable decoder. Furthermore, the network is trained to solve the Eikonal equation and only requires knowledge of the zero-level set for training and inference. Additional volumetric samples can be generated on-the-fly, and incorporated in an unsupervised manner. This means that in contrast to most previous work, our network is able to output valid signed distance fields without explicit prior knowledge of non-zero distance values or shape occupancy. In other words, our network computes approximate solutions to the boundary-valued Eikonal equation. It also requires only a single forward pass during inference, instead of the common latent code optimization. We further propose a modification of the loss function in case that surface normals are not well defined, e.g., in the context of non-watertight surface-meshes and non-manifold geometry. 
Overall, this can help reduce the computational overhead of training and evaluating neural distance fields, as well as enabling the application to difficult shapes. We finally demonstrate the efficacy, generalizability and scalability of our method on datasets consisting of deforming 3D shapes, single class encoding and multiclass encoding, showcasing a wide range of possible applications.", "keywords": "neural shape representation;neural distance fields;eikonal equation;surface mesh;encoder-decoder", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/1facf82bd05b0f7cd3809292f07b333b2e390880.zip", "author": "Stefan Rhys Jeske;Jonathan Klein;Dominik Michels;Jan Bender", "authorids": "~Stefan_Rhys_Jeske1;~Jonathan_Klein2;~Dominik_Michels1;~Jan_Bender1", "gender": "M;M;M;M", "homepage": "https://srjeske.de;https://jonathank.de/research/;https://www.kaust.edu.sa/en/study/faculty/dominik-michels;https://www.animation.rwth-aachen.de/", "dblp": ";22/5462;131/3147;63/2863.html", "google_scholar": ";wzejV1EAAAAJ;;https://scholar.google.com.tw/citations?user=POEoFagAAAAJ", "orcid": "0000-0003-3920-7765;0000-0001-6560-0988;;", "linkedin": ";;;", "or_profile": "~Stefan_Rhys_Jeske1;~Jonathan_Klein2;~Dominik_Michels1;~Jan_Bender1", "aff": "Rheinisch Westf\u00e4lische Technische Hochschule Aachen;King Abdullah University of Science and Technology;KAUST;RWTH Aachen University", "aff_domain": "rwth-aachen.de;kaust.edu.sa;kaust.edu.sa;rwth-aachen.de", "position": "PhD student;Researcher;Associate Professor;Full Professor", "bibtex": "@misc{\njeske2024zerolevelset,\ntitle={Zero-Level-Set Encoder for Neural Distance Fields},\nauthor={Stefan Rhys Jeske and Jonathan Klein and Dominik Michels and Jan Bender},\nyear={2024},\nurl={https://openreview.net/forum?id=BC4AUywMow}\n}", "github": "", "project": "", "reviewers": "ysCV;Msao;ruBo", "site": "https://openreview.net/forum?id=BC4AUywMow", "pdf_size": 22366387, "rating": "3;5;5", "confidence": "5;4;4", "soundness": "3;2;3", "contribution": "1;2;2", "presentation": "3;3;3", "wc_summary": "49;176;79", "wc_strengths": "106;96;77", "wc_weaknesses": "297;469;112", "wc_questions": "45;96;84", "wc_review": "497;837;352", "wc_reply_reviewers": "0;165;35", "wc_reply_authors": "119;1339;44", "reply_reviewers": "0;2;1", "reply_authors": "1;3;1", "rating_avg": [ 4.333333333333333, 0.9428090415820634 ], "confidence_avg": [ 4.333333333333333, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 1.6666666666666667, 0.4714045207910317 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 101.33333333333333, 54.19922098661157 ], "wc_strengths_avg": [ 93.0, 12.027745701779143 ], "wc_weaknesses_avg": [ 292.6666666666667, 145.7768462029855 ], "wc_questions_avg": [ 75.0, 21.77154105707724 ], "wc_review_avg": [ 562.0, 203.26501584548842 ], "wc_reply_reviewers_avg": [ 66.66666666666667, 70.98513146348951 ], "wc_reply_authors_avg": [ 500.6666666666667, 593.58140881339 ], "reply_reviewers_avg": [ 1.0, 0.816496580927726 ], "reply_authors_avg": [ 1.6666666666666667, 0.9428090415820634 ], "replies_avg": [ 17, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.9999999999999997, "gs_citation": -1, "gs_cited_by_link": "", "gs_version_total": -1, "aff_unique_index": "0;1;1;0", "aff_unique_norm": "RWTH Aachen University;King Abdullah University of Science and Technology", "aff_unique_dep": ";", "aff_unique_url": 
"https://www.rwth-aachen.de;https://www.kast.kau.edu.sa", "aff_unique_abbr": "RWTH;KAUST", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Aachen;", "aff_country_unique_index": "0;1;1;0", "aff_country_unique": "Germany;Saudi Arabia" }, { "id": "BCRZq5nNZu", "title": "Chunking: Forgetting Matters in Continual Learning even without Changing Tasks", "track": "main", "status": "Reject", "tldr": "", "abstract": "Work on continual learning (CL) has largely focused on the problems arising from the dynamically-changing data distribution. However, CL can be decomposed into two sub-problems: (a) shifts in the data distribution, and (b) dealing with the fact that the data is split into chunks and so only a part of the data is available to be trained on at any point in time. In this work, we look at the latter sub-problem---the chunking of data---and note that previous analysis of chunking in the CL literature is sparse. We show that chunking is an important part of CL, accounting for around half of the performance drop from offline learning in our experiments. Furthermore, our results reveal that current CL algorithms do not address the chunking sub-problem, only performing as well as plain SGD training when there is no shift in the data distribution. We analyse why performance drops when learning occurs on chunks of data, and find that forgetting, which is often seen to be a problem due to distribution shift, still arises and is a significant problem. Motivated by an analysis of the linear case, we show that per-chunk weight averaging improves performance in the chunking setting and that this performance transfers to the full CL setting. Hence, we argue that work on chunking can help advance CL in general.", "keywords": "Continual Learning", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "/attachment/c4eb9b6dd0ad9985103367e42348e5ecaebbd7fe.zip", "author": "Thomas L Lee;Amos Storkey", "authorids": "~Thomas_L_Lee1;~Amos_Storkey1", "gender": ";Not Specified", "homepage": "https://tlee43.github.io/;http://homepages.inf.ed.ac.uk/amos/", "dblp": ";", "google_scholar": "pRcPv_cAAAAJ;", "orcid": ";", "linkedin": "thomas-lee-aa27a9176/;", "or_profile": "~Thomas_L_Lee1;~Amos_Storkey1", "aff": "Huawei Technologies Ltd.;University of Edinburgh", "aff_domain": "huawei.com;ed.ac.uk", "position": "Intern;Full Professor", "bibtex": "@misc{\nlee2024chunking,\ntitle={Chunking: Forgetting Matters in Continual Learning even without Changing Tasks},\nauthor={Thomas L Lee and Amos Storkey},\nyear={2024},\nurl={https://openreview.net/forum?id=BCRZq5nNZu}\n}", "github": "", "project": "", "reviewers": "BU9q;4UBT;w2jf;T7s5", "site": "https://openreview.net/forum?id=BCRZq5nNZu", "pdf_size": 845347, "rating": "3;3;3;5", "confidence": "5;4;4;4", "soundness": "2;2;2;2", "contribution": "2;2;3;2", "presentation": "3;2;3;3", "wc_summary": "104;37;94;117", "wc_strengths": "100;1;148;105", "wc_weaknesses": "556;550;326;503", "wc_questions": "10;4;223;29", "wc_review": "770;592;791;754", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "745;947;805;725", "reply_reviewers": "0;0;0;0", "reply_authors": "1;2;1;1", "rating_avg": [ 3.5, 0.8660254037844386 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 2.0, 0.0 ], "contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 88.0, 30.553232234904378 ], "wc_strengths_avg": [ 88.5, 53.85396921304873 ], "wc_weaknesses_avg": [ 483.75, 
93.3605243130093 ], "wc_questions_avg": [ 66.5, 90.82538191496913 ], "wc_review_avg": [ 726.75, 78.89668877715971 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 805.5, 86.83749190297932 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 11, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.3333333333333333, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=3591496541474882982&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 0, "aff_unique_index": "0;1", "aff_unique_norm": "Huawei;University of Edinburgh", "aff_unique_dep": "Huawei Technologies;", "aff_unique_url": "https://www.huawei.com;https://www.ed.ac.uk", "aff_unique_abbr": "Huawei;Edinburgh", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1", "aff_country_unique": "China;United Kingdom" }, { "id": "BCe9ut1s7i", "title": "On the Importance of Backbone to the Adversarial Robustness of Object Detectors", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Object detection is a critical component of various security-sensitive applications, such as autonomous driving and video surveillance. However, existing object detectors are vulnerable to adversarial attacks, which poses a significant challenge to their reliability and safety.\nThrough experiments, first, we found that existing works on improving the adversarial robustness of object detectors give a false sense of security. Second, we found that using adversarially pre-trained backbone networks was essential for enhancing the adversarial robustness of object detectors. We then proposed a simple yet effective recipe for fast adversarial fine-tuning on object detectors with adversarially pre-trained backbones. Without any modifications to the structure of object detectors, our recipe achieved significantly better adversarial robustness than previous works. Finally, we explored the potential of different modern object detectors to improve adversarial robustness using our recipe and demonstrated interesting findings, which inspired us to design several state-of-the-art (SOTA) robust detectors with faster inference speed. Our empirical results set a new milestone for adversarially robust object detection. 
Code and trained checkpoints will be publicly available.", "keywords": "adversarial robustness;object detection", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "Xiao Li;Hang Chen;Xiaolin Hu", "authorids": "~Xiao_Li16;~Hang_Chen4;~Xiaolin_Hu1", "gender": "M;M;M", "homepage": ";;http://www.xlhu.cn/", "dblp": "66/2069-28;;60/6028-1", "google_scholar": "Is24dqwAAAAJ;WZbgD9oAAAAJ;PksdgoUAAAAJ", "orcid": "0000-0001-8992-4944;;0000-0002-4907-7354", "linkedin": ";;", "or_profile": "~Xiao_Li16;~Hang_Chen4;~Xiaolin_Hu1", "aff": "Computer Science, Tsinghua University;Tsinghua University;Tsinghua University", "aff_domain": "mails.tsinghua.edu.cn;tsinghua.edu.cn;tsinghua.edu.cn", "position": "PhD student;PhD student;Associate Professor", "bibtex": "@misc{\nli2024on,\ntitle={On the Importance of Backbone to the Adversarial Robustness of Object Detectors},\nauthor={Xiao Li and Hang Chen and Xiaolin Hu},\nyear={2024},\nurl={https://openreview.net/forum?id=BCe9ut1s7i}\n}", "github": "", "project": "", "reviewers": "xgd4;fyi7;wtFb", "site": "https://openreview.net/forum?id=BCe9ut1s7i", "pdf_size": 1449805, "rating": "3;5;5", "confidence": "5;3;5", "soundness": "2;3;3", "contribution": "1;3;2", "presentation": "2;3;4", "wc_summary": "36;73;59", "wc_strengths": "55;23;74", "wc_weaknesses": "207;233;299", "wc_questions": "105;16;6", "wc_review": "403;345;438", "wc_reply_reviewers": "175;0;0", "wc_reply_authors": "1109;896;1127", "reply_reviewers": "1;0;0", "reply_authors": "2;2;2", "rating_avg": [ 4.333333333333333, 0.9428090415820634 ], "confidence_avg": [ 4.333333333333333, 0.9428090415820634 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.816496580927726 ], "presentation_avg": [ 3.0, 0.816496580927726 ], "wc_summary_avg": [ 56.0, 15.253414918196734 ], "wc_strengths_avg": [ 50.666666666666664, 21.044925490219462 ], "wc_weaknesses_avg": [ 246.33333333333334, 38.72409528388695 ], "wc_questions_avg": [ 42.333333333333336, 44.4996878890428 ], "wc_review_avg": [ 395.3333333333333, 38.35216928530756 ], "wc_reply_reviewers_avg": [ 58.333333333333336, 82.49579113843053 ], "wc_reply_authors_avg": [ 1044.0, 104.90948479522717 ], "reply_reviewers_avg": [ 0.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 2.0, 0.0 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.49999999999999983, "gs_citation": 10, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12470143202775810721&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "aff_unique_index": "0;0;0", "aff_unique_norm": "Tsinghua University", "aff_unique_dep": "Computer Science", "aff_unique_url": "https://www.tsinghua.edu.cn", "aff_unique_abbr": "THU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "China" }, { "id": "BCocsAF7MY", "title": "Fine-tune Language Models to Approximate Unbiased In-context Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "In-context learning (ICL) is an astonishing emergent ability of large language models (LLMs). By presenting a prompt that includes multiple input-output pairs as examples and introducing a new query input, models can generate the corresponding output. However, the performance of models heavily relies on the quality of the input prompt when implementing in-context learning. 
Biased or imbalanced input prompts can significantly degrade the performance of language models. To address this issue, we introduce a reweighted algorithm called RICL (Reweighted In-context Learning). This algorithm fine-tunes language models using an unbiased validation set to determine the optimal weight for each input-output example to approximate unbiased in-context learning. Furthermore, we also introduce a low-cost reweighted algorithm, a linear optimal weight approximation algorithm called LARICL (Linear Approximation of Reweighted In-context Learning). This algorithm requires minimal training cost while providing effective results. We prove the convergence of our algorithm and validate its performance through experiments conducted on a numerical dataset. The experimental findings reveal a substantial improvement in comparison to benchmarks including the performance of casual prompt-based in-context learning and the performance of a classic fine-tuning method.", "keywords": "fine-tune;in-context learning", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/3ab7a88a102f875d28b3b9f90cf192215c15dd4c.pdf", "author": "Timothy Zer-An Chu;Zhao Song;Chiwun Yang", "authorids": "~Timothy_Zer-An_Chu1;~Zhao_Song3;~Chiwun_Yang1", "gender": "M;M;M", "homepage": ";https://www.youtube.com/@zhaosong2031;https://christianyang37.github.io/", "dblp": ";76/4051-2;355/2807", "google_scholar": "https://scholar.google.com/citations?hl=en;yDZct7UAAAAJ;https://scholar.google.com/citations?hl=en", "orcid": ";;", "linkedin": ";;", "or_profile": "~Timothy_Zer-An_Chu1;~Zhao_Song3;~Chiwun_Yang1", "aff": "AAAS;Adobe;SUN YAT-SEN UNIVERSITY", "aff_domain": "aaas.org;adobe.com;sysu.edu.cn", "position": "Researcher;Researcher;Undergrad student", "bibtex": "@misc{\nchu2024finetune,\ntitle={Fine-tune Language Models to Approximate Unbiased In-context Learning},\nauthor={Timothy Zer-An Chu and Zhao Song and Chiwun Yang},\nyear={2024},\nurl={https://openreview.net/forum?id=BCocsAF7MY}\n}", "github": "", "project": "", "reviewers": "NqVg;A8do;sUUz", "site": "https://openreview.net/forum?id=BCocsAF7MY", "pdf_size": 379670, "rating": "3;3;5", "confidence": "3;3;3", "soundness": "2;2;3", "contribution": "2;2;3", "presentation": "2;1;3", "wc_summary": "68;40;58", "wc_strengths": "68;77;59", "wc_weaknesses": "145;220;133", "wc_questions": "75;2;53", "wc_review": "356;339;303", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 3.6666666666666665, 0.9428090415820634 ], "confidence_avg": [ 3.0, 0.0 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 2.0, 0.816496580927726 ], "wc_summary_avg": [ 55.333333333333336, 11.585431464655176 ], "wc_strengths_avg": [ 68.0, 7.3484692283495345 ], "wc_weaknesses_avg": [ 166.0, 38.49675310984031 ], "wc_questions_avg": [ 43.333333333333336, 30.575952787916336 ], "wc_review_avg": [ 332.6666666666667, 22.095751225568733 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 5, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 18, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5893653897567298517&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "aff_unique_index": "0;1;2", "aff_unique_norm": "American Association for the 
Advancement of Science;Adobe;Sun Yat-sen University", "aff_unique_dep": ";Adobe Inc.;", "aff_unique_url": "https://www.aaas.org;https://www.adobe.com;http://www.sysu.edu.cn", "aff_unique_abbr": "AAAS;Adobe;SYSU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;1", "aff_country_unique": "United States;China" }, { "title": "A Unified and General Framework for Continual Learning", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19227", "id": "BE5aK0ETbp", "author_site": "Zhenyi Wang, Yan Li, Li Shen, Heng Huang", "tldr": "", "abstract": "Continual Learning (CL) focuses on learning from dynamic and changing data distributions while retaining previously acquired knowledge. Various methods have been developed to address the challenge of catastrophic forgetting, including regularization-based, Bayesian-based, and memory-replay-based techniques. However, these methods lack a unified framework and common terminology for describing their approaches. This research aims to bridge this gap by introducing a comprehensive and overarching framework that encompasses and reconciles these existing methodologies. Notably, this new framework is capable of encompassing established CL approaches as special instances within a unified and general optimization objective.\nAn intriguing finding is that despite their diverse origins, these methods share common mathematical structures. This observation highlights the compatibility of these seemingly distinct techniques, revealing their interconnectedness through a shared underlying optimization objective. Moreover, the proposed general framework introduces an innovative concept called *refresh learning*, specifically designed to enhance the CL performance. This novel approach draws inspiration from neuroscience, where the human brain often sheds outdated information to improve the retention of crucial knowledge and facilitate the acquisition of new information. In essence, *refresh learning* operates by initially unlearning current data and subsequently relearning it. It serves as a versatile plug-in that seamlessly integrates with existing CL methods, offering an adaptable and effective enhancement to the learning process. 
Extensive experiments on CL benchmarks and theoretical analysis demonstrate the effectiveness of the proposed *refresh learning*.", "keywords": "Continual Learning", "primary_area": "transfer learning, meta learning, and lifelong learning", "supplementary_material": "", "author": "Zhenyi Wang;Yan Li;Li Shen;Heng Huang", "authorids": "~Zhenyi_Wang1;~Yan_Li18;~Li_Shen1;~Heng_Huang1", "gender": ";;M;M", "homepage": ";;https://sites.google.com/site/mathshenli/home;https://www.cs.umd.edu/~heng/", "dblp": ";;91/3680-8;03/281", "google_scholar": ";;yVhgENIAAAAJ;4OqLaDwAAAAJ", "orcid": ";;;", "linkedin": ";;;", "or_profile": "~Zhenyi_Wang1;~Yan_Li18;~Li_Shen1;~Heng_Huang1", "aff": ";;JD Explore Academy;Department of Computer Science, University of Maryland, College Park", "aff_domain": ";;jd.com;cs.umd.edu", "position": ";;Researcher;Full Professor", "bibtex": "@inproceedings{\nwang2024a,\ntitle={A Unified and General Framework for Continual Learning},\nauthor={Zhenyi Wang and Yan Li and Li Shen and Heng Huang},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=BE5aK0ETbp}\n}", "github": "", "project": "", "reviewers": "tVq3;KmRA;Dw6m;ngze", "pdf_size": 389005, "rating": "3;6;6;6", "confidence": "4;3;2;3", "soundness": "1;2;3;3", "contribution": "2;3;3;2", "presentation": "2;3;3;2", "wc_summary": "43;201;45;81", "wc_strengths": "1;109;45;51", "wc_weaknesses": "187;231;70;208", "wc_questions": "5;55;46;49", "wc_review": "236;596;206;389", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "1170;1094;601;1720", "reply_reviewers": "0;0;0;0", "reply_authors": "4;3;2;4", "rating_avg": [ 5.25, 1.299038105676658 ], "confidence_avg": [ 3.0, 0.7071067811865476 ], "soundness_avg": [ 2.25, 0.82915619758885 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 92.5, 64.44183423832689 ], "wc_strengths_avg": [ 51.5, 38.40247387864485 ], "wc_weaknesses_avg": [ 174.0, 62.028219384406 ], "wc_questions_avg": [ 38.75, 19.753164303473 ], "wc_review_avg": [ 356.75, 154.5855345755223 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 1146.25, 396.7936333914646 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 3.25, 0.82915619758885 ], "replies_avg": [ 19, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.816496580927726, "gs_citation": 25, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12568688008196456109&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=BE5aK0ETbp", "pdf": "https://openreview.net/pdf?id=BE5aK0ETbp", "email": ";;jd.com;cs.umd.edu", "author_num": 4, "aff_unique_index": "0;1", "aff_unique_norm": "JD;University of Maryland, College Park", "aff_unique_dep": "JD Explore Academy;Department of Computer Science", "aff_unique_url": ";https://www.umd.edu", "aff_unique_abbr": ";UMD", "aff_campus_unique_index": "1", "aff_campus_unique": ";College Park", "aff_country_unique_index": "1", "aff_country_unique": ";United States" }, { "title": "Pre-training Sequence, Structure, and Surface Features for Comprehensive Protein Representation Learning", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19226", "id": "BEH4mGo7zP", "author_site": "Youhan Lee, Hasun Yu, Jaemyung Lee, Jaehoon Kim", "tldr": "", "abstract": "Proteins can be represented in various ways, including their sequences, 3D structures, and surfaces.
While recent studies have successfully employed sequence- or structure-based representations to address multiple tasks in protein science, there has been significant oversight in incorporating protein surface information, a critical factor for protein function. In this paper, we present a pre-training strategy that incorporates information from protein sequences, 3D structures, and surfaces to improve protein representation learning. Specifically, we utilize Implicit Neural Representations (INRs) for learning surface characteristics, and name it ProteinINR. We confirm that ProteinINR successfully reconstructs protein surfaces, and integrate this surface learning into the existing pre-training strategy of sequences and structures. Our results demonstrate that our approach can enhance performance in various downstream tasks, thereby underscoring the importance of including surface attributes in protein representation learning. These findings underline the importance of understanding protein surfaces for generating effective protein representations.", "keywords": "Protein representation learning;self-supervised learning;implicit neural representation", "primary_area": "applications to physical sciences (physics, chemistry, biology, etc.)", "supplementary_material": "", "author": "Youhan Lee;Hasun Yu;Jaemyung Lee;Jaehoon Kim", "authorids": "~Youhan_Lee1;~Hasun_Yu2;~Jaemyung_Lee1;~Jaehoon_Kim1", "gender": "M;M;M;M", "homepage": ";;https://www.linkedin.com/in/jaemyung-lee-5576b4119/;", "dblp": "190/1819;153/5409.html;;", "google_scholar": "https://scholar.google.co.kr/citations?user=EFNg9UcAAAAJ;https://scholar.google.co.kr/citations?user=CvbGPQYAAAAJ;UNoy5N8AAAAJ;", "orcid": ";;;0000-0001-8598-3429", "linkedin": "youhanlee/;https://kr.linkedin.com/in/hasun-yu-733291119;;", "or_profile": "~Youhan_Lee1;~Hasun_Yu2;~Jaemyung_Lee1;~Jaehoon_Kim1", "aff": "Kakao Brain Corp;Kakao Brain;Kakao Brain Corp;Kakaobrain", "aff_domain": "kakaobrain.com;kakaobrain.com;kakaobrain.com;kakaobrain.com", "position": "Researcher;Researcher;Researcher;Researcher", "bibtex": "@inproceedings{\nlee2024pretraining,\ntitle={Pre-training Sequence, Structure, and Surface Features for Comprehensive Protein Representation Learning},\nauthor={Youhan Lee and Hasun Yu and Jaemyung Lee and Jaehoon Kim},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=BEH4mGo7zP}\n}", "github": "", "project": "", "reviewers": "rs2T;VAn9;AyLE;1KWf", "pdf_size": 1966808, "rating": "5;6;6;6", "confidence": "5;3;2;4", "soundness": "2;3;3;3", "contribution": "3;3;3;3", "presentation": "2;3;2;3", "wc_summary": "64;120;62;61", "wc_strengths": "30;97;60;81", "wc_weaknesses": "376;332;70;39", "wc_questions": "173;75;40;75", "wc_review": "643;624;232;256", "wc_reply_reviewers": "55;182;68;0", "wc_reply_authors": "1387;1198;641;518", "reply_reviewers": "1;1;1;0", "reply_authors": "3;3;2;1", "rating_avg": [ 5.75, 0.4330127018922193 ], "confidence_avg": [ 3.5, 1.118033988749895 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 76.75, 24.993749218554626 ], "wc_strengths_avg": [ 67.0, 25.06990227344335 ], "wc_weaknesses_avg": [ 204.25, 150.95425631627614 ], "wc_questions_avg": [ 90.75, 49.59019560356664 ], "wc_review_avg": [ 438.75, 195.05047423679852 ], "wc_reply_reviewers_avg": [ 76.25, 66.17542973037652 ], "wc_reply_authors_avg": [ 936.0, 365.30603608481476 ], "reply_reviewers_avg": [ 0.75, 
0.4330127018922193 ], "reply_authors_avg": [ 2.25, 0.82915619758885 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.7745966692414834, "gs_citation": 17, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=10063730667276780299&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=BEH4mGo7zP", "pdf": "https://openreview.net/pdf?id=BEH4mGo7zP", "email": "kakaobrain.com;kakaobrain.com;kakaobrain.com;kakaobrain.com", "author_num": 4, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "Kakao Brain", "aff_unique_dep": "Corp", "aff_unique_url": "https://www.kakaobrain.com", "aff_unique_abbr": "Kakao Brain", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "South Korea" }, { "title": "DP-SGD Without Clipping: The Lipschitz Neural Network Way", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19225", "id": "BEyEziZ4R6", "author_site": "Louis B\u00e9thune, Thomas Massena, Thibaut Boissin, Aur\u00e9lien Bellet, Franck Mamalet, Yannick Prudent, Corentin Friedrich, Mathieu Serrurier, David Vigouroux", "tldr": "", "abstract": "State-of-the-art approaches for training Differentially Private (DP) Deep Neural Networks (DNN) face difficulties to estimate tight bounds on the sensitivity of the network's layers, and instead rely on a process of per-sample gradient clipping. This clipping process not only biases the direction of gradients but also proves costly both in memory consumption and in computation. To provide sensitivity bounds and bypass the drawbacks of the clipping process, we propose to rely on Lipschitz constrained networks. Our theoretical analysis reveals an unexplored link between the Lipschitz constant with respect to their input and the one with respect to their parameters. By bounding the Lipschitz constant of each layer with respect to its parameters, we prove that we can train these networks with privacy guarantees. Our analysis not only allows the computation of the aforementioned sensitivities at scale, but also provides guidance on how to maximize the gradient-to-noise ratio for fixed privacy guarantees. 
To facilitate the application of Lipschitz networks and foster robust and certifiable learning under privacy guarantees, we provide a Python package that implements building blocks allowing the construction and private training of such networks.", "keywords": "lipschitz neural networks;dp-sgd;privacy;robustness", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "Louis B\u00e9thune;Thomas Massena;Thibaut Boissin;Aur\u00e9lien Bellet;Franck Mamalet;Yannick Prudent;Corentin Friedrich;Mathieu Serrurier;David Vigouroux", "authorids": "~Louis_B\u00e9thune1;~Thomas_Massena1;~Thibaut_Boissin1;~Aur\u00e9lien_Bellet1;~Franck_Mamalet2;~Yannick_Prudent1;~Corentin_Friedrich1;~Mathieu_Serrurier1;~David_Vigouroux1", "gender": "M;M;M;;M;M;M;M;", "homepage": "https://louis-bethune.fr/;;;http://researchers.lille.inria.fr/abellet/;https://www.researchgate.net/profile/Franck-Mamalet;;;;", "dblp": "270/0797;;;61/8017;15/6625;;258/6442;30/2092;", "google_scholar": "1zvpCDcAAAAJ;n09aacYAAAAJ;zC-MstIAAAAJ;https://scholar.google.fr/citations?user=j8svx3IAAAAJ;https://scholar.google.fr/citations?user=5C5p0osAAAAJ;;;https://scholar.google.com/scholar?scilib=1;", "orcid": "0000-0003-1498-8251;;;0000-0003-3440-1251;;;;;", "linkedin": ";thomas-mass%C3%A9na-9240b5223/;;;franck-mamalet-0453a91b;yannick-prudent/;corentin-friedrich/;;", "or_profile": "~Louis_B\u00e9thune1;~Thomas_Massena1;~Thibaut_Boissin1;~Aur\u00e9lien_Bellet1;~Franck_Mamalet2;~Yannick_Prudent1;~Corentin_Friedrich1;~Mathieu_Serrurier1;~David_Vigouroux1", "aff": "Apple ;IRIT / SNCF DTIPG;IRT Saint exup\u00e9ry;INRIA;IRT Saint Exupery;IRT Saint-Exup\u00e9ry;IRT Saint Exup\u00e9ry;university Paul Sabatier;", "aff_domain": "apple.com;irit.fr;irt-saintexupery.com;inria.fr;irt-saintexupery.com;irt-saintexupery.com;irt-saintexupery.com;irit.fr;", "position": "Researcher;PhD student;Researcher;Tenured researcher;Researcher;Researcher;Researcher;Assistant Professor;", "bibtex": "@inproceedings{\nb{\\'e}thune2024dpsgd,\ntitle={{DP}-{SGD} Without Clipping: The Lipschitz Neural Network Way},\nauthor={Louis B{\\'e}thune and Thomas Massena and Thibaut Boissin and Aur{\\'e}lien Bellet and Franck Mamalet and Yannick Prudent and Corentin Friedrich and Mathieu Serrurier and David Vigouroux},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=BEyEziZ4R6}\n}", "github": "", "project": "", "reviewers": "GMKM;ah9n;L744", "pdf_size": 7397919, "rating": "5;6;8", "confidence": "4;4;3", "soundness": "3;3;3", "contribution": "2;3;3", "presentation": "2;2;4", "wc_summary": "52;24;106", "wc_strengths": "21;27;360", "wc_weaknesses": "323;18;212", "wc_questions": "2;29;311", "wc_review": "398;98;989", "wc_reply_reviewers": "70;0;21", "wc_reply_authors": "844;60;214", "reply_reviewers": "1;0;1", "reply_authors": "3;1;1", "rating_avg": [ 6.333333333333333, 1.247219128924647 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.9428090415820634 ], "wc_summary_avg": [ 60.666666666666664, 34.03266404826725 ], "wc_strengths_avg": [ 136.0, 158.41085821369697 ], "wc_weaknesses_avg": [ 184.33333333333334, 126.04320246998205 ], "wc_questions_avg": [ 114.0, 139.73546436034053 ], "wc_review_avg": [ 495.0, 370.159425113018 ], "wc_reply_reviewers_avg": [ 30.333333333333332, 29.32954520994525 ], 
"wc_reply_authors_avg": [ 372.6666666666667, 339.16105646465695 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 1.6666666666666667, 0.9428090415820634 ], "replies_avg": [ 13, 0 ], "authors#_avg": [ 9, 0 ], "corr_rating_confidence": -0.944911182523068, "gs_citation": 9, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=1811895221198899715&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 32, "openreview": "https://openreview.net/forum?id=BEyEziZ4R6", "pdf": "https://openreview.net/pdf?id=BEyEziZ4R6", "email": "apple.com;irit.fr;irt-saintexupery.com;inria.fr;irt-saintexupery.com;irt-saintexupery.com;irt-saintexupery.com;irit.fr;", "author_num": 9, "aff_unique_index": "0;1;2;3;4;5;2;6", "aff_unique_norm": "Apple;Institut de Recherche en Informatique de Toulouse;IRT Saint Exup\u00e9ry;INRIA;IRT Saint Exupery;IRT Saint-Exup\u00e9ry;Paul Sabatier University", "aff_unique_dep": "Apple Inc.;;;;;;", "aff_unique_url": "https://www.apple.com;https://www.irit.fr;;https://www.inria.fr;;https://www.irt-saintexupery.com;https://www.univ-toulouse1.fr", "aff_unique_abbr": "Apple;IRIT;;INRIA;;;UT1", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;1;1;1;1;1;1", "aff_country_unique": "United States;France" }, { "title": "A 2-Dimensional State Space Layer for Spatial Inductive Bias", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19224", "id": "BGkqypmGvm", "author_site": "Ethan Baron, Itamar Zimerman, Lior Wolf", "tldr": "", "abstract": "A central objective in computer vision is to design models with appropriate 2-D inductive bias. Desiderata for 2-D inductive bias include two-dimensional position awareness, dynamic spatial locality, and translation and permutation invariance. To address these goals, we leverage an expressive variation of the multidimensional State Space Model (SSM). Our approach introduces efficient parameterization, accelerated computation, and a suitable normalization scheme. Empirically, we observe that incorporating our layer at the beginning of each transformer block of Vision Transformers (ViT), as well as when replacing the Conv2D filters of ConvNeXT with our proposed layers significantly enhances performance for multiple backbones and across multiple datasets. The new layer is effective even with a negligible amount of additional parameters and inference time. Ablation studies and visualizations demonstrate that the layer has a strong 2-D inductive bias. For example, vision transformers equipped with our layer exhibit effective performance even without positional encoding. 
Our code is attached as supplementary.", "keywords": "SSM;Dimensional State Spaces;Spatial Representation", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/0f8c60423e0dd1a58c4d7b84907f5b05bbdf998b.zip", "author": "Ethan Baron;Itamar Zimerman;Lior Wolf", "authorids": "~Ethan_Baron1;~Itamar_Zimerman1;~Lior_Wolf1", "gender": "M;M;M", "homepage": ";;http://www.cs.tau.ac.il/~wolf", "dblp": ";294/8621;83/4103", "google_scholar": "02O0z30AAAAJ;01s_DpwAAAAJ;UbFrXTsAAAAJ", "orcid": ";0000-0001-8321-0609;0000-0001-5578-8892", "linkedin": "ethan-baron-a423a112a/;;", "or_profile": "~Ethan_Baron1;~Itamar_Zimerman1;~Lior_Wolf1", "aff": "Tel Aviv University;International Business Machines;Tel Aviv University", "aff_domain": "tau.ac.il;ibm.com;tau.ac.il", "position": "MS student;Researcher;Full Professor", "bibtex": "@inproceedings{\nbaron2024a,\ntitle={A 2-Dimensional State Space Layer for Spatial Inductive Bias},\nauthor={Ethan Baron and Itamar Zimerman and Lior Wolf},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=BGkqypmGvm}\n}", "github": "", "project": "", "reviewers": "SZ7R;mKTe;ZC1E;CN5B", "pdf_size": 3876440, "rating": "6;6;6;6", "confidence": "2;3;3;2", "soundness": "3;3;4;3", "contribution": "3;3;3;3", "presentation": "2;2;3;3", "wc_summary": "95;55;86;40", "wc_strengths": "56;110;174;40", "wc_weaknesses": "120;427;207;70", "wc_questions": "104;59;5;32", "wc_review": "375;651;472;182", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "559;932;382;358", "reply_reviewers": "0;0;0;0", "reply_authors": "1;2;1;1", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 2.5, 0.5 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 69.0, 22.371857321197094 ], "wc_strengths_avg": [ 95.0, 52.46903848937962 ], "wc_weaknesses_avg": [ 206.0, 136.68760002282576 ], "wc_questions_avg": [ 50.0, 36.55817282086182 ], "wc_review_avg": [ 420.0, 169.3620382494259 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 557.75, 229.59352669446062 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.25, 0.4330127018922193 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 9, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=5637507426116350084&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 0, "openreview": "https://openreview.net/forum?id=BGkqypmGvm", "pdf": "https://openreview.net/pdf?id=BGkqypmGvm", "email": "tau.ac.il;ibm.com;tau.ac.il", "author_num": 3, "aff_unique_index": "0;1;0", "aff_unique_norm": "Tel Aviv University;International Business Machines Corporation", "aff_unique_dep": ";", "aff_unique_url": "https://www.tau.ac.il;https://www.ibm.com", "aff_unique_abbr": "TAU;IBM", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;0", "aff_country_unique": "Israel;United States" }, { "title": "A Multi-Level Framework for Accelerating Training Transformer Models", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19223", "id": "BI1N3lTWtn", "author_site": "Longwei Zou, Han Zhang, Yangdong Deng", "tldr": "", "abstract": "The fast growing capabilities of large-scale deep learning models, such as Bert, GPT and ViT, are revolutionizing the landscape of NLP, CV and many other domains. 
Training such models, however, poses an unprecedented demand for computing power, which incurs exponentially increasing energy cost and carbon dioxide emissions. It is thus critical to develop efficient training solutions to reduce the training costs. Motivated by a set of key observations of inter- and intra-layer similarities among feature maps and attentions that can be identified from typical training processes, we propose a multi-level framework for training acceleration. Specifically, the framework is based on three basic operators, Coalescing, De-coalescing and Interpolation, which can be orchestrated to build a multi-level training framework. The framework consists of a V-cycle training process, which progressively down- and up-scales the model size and projects the parameters between adjacent levels of models via coalescing and de-coalescing. The key idea is that a smaller model can be trained for fast convergence, and the trained parameters provide high-quality intermediate solutions for the next-level larger network. The interpolation operator is designed to break the symmetry of neurons incurred by de-coalescing for better convergence performance. Our experiments on transformer-based language models (e.g. Bert, GPT) as well as a vision model (e.g. DeiT) prove that the proposed framework reduces the computational cost by about 20% on training BERT/GPT-Base models and up to 51.6% on training the BERT-Large model while preserving the performance.", "keywords": "Large Model;Transformer;Multi-Level;Training Acceleration", "primary_area": "optimization", "supplementary_material": "", "author": "Longwei Zou;Han Zhang;Yangdong Deng", "authorids": "~Longwei_Zou1;~Han_Zhang22;~Yangdong_Deng1", "gender": "M;M;M", "homepage": "https://photooon.github.io/;https://github.com/explorerZH;http://www.thss.tsinghua.edu.cn/publish/soften/3131/2014/20140115102144786540201/20140115102144786540201_.html", "dblp": "375/3580;;90/5987", "google_scholar": "TaG_k80AAAAJ/;;", "orcid": ";;", "linkedin": ";;", "or_profile": "~Longwei_Zou1;~Han_Zhang22;~Yangdong_Deng1", "aff": "Tsinghua University;University of Washington;Tsinghua University", "aff_domain": "tsinghua.edu.cn;uw.edu;tsinghua.edu.cn", "position": "MEng student;MS student;Associate Professor", "bibtex": "@inproceedings{\nzou2024a,\ntitle={A Multi-Level Framework for Accelerating Training Transformer Models},\nauthor={Longwei Zou and Han Zhang and Yangdong Deng},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=BI1N3lTWtn}\n}", "github": "", "project": "", "reviewers": "subK;Csxk;d5rc;2jMP", "pdf_size": 653625, "rating": "5;6;6;6", "confidence": "4;5;2;2", "soundness": "3;3;3;3", "contribution": "2;2;3;3", "presentation": "3;3;3;3", "wc_summary": "179;69;155;112", "wc_strengths": "18;215;46;63", "wc_weaknesses": "179;132;54;63", "wc_questions": "247;2;47;31", "wc_review": "623;418;302;269", "wc_reply_reviewers": "121;0;27;0", "wc_reply_authors": "1899;538;269;870", "reply_reviewers": "1;0;1;0", "reply_authors": "3;1;1;2", "rating_avg": [ 5.75, 0.4330127018922193 ], "confidence_avg": [ 3.25, 1.299038105676658 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 128.75, 42.02603359823527 ], "wc_strengths_avg": [ 85.5, 76.4738517403171 ], "wc_weaknesses_avg": [ 107.0, 51.36633138545131 ], "wc_questions_avg": [ 81.75, 96.76098128894725 ], "wc_review_avg": [ 403.0, 138.5478256776338 ],
"wc_reply_reviewers_avg": [ 37.0, 49.73429400323282 ], "wc_reply_authors_avg": [ 894.0, 618.0538002471953 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.75, 0.82915619758885 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.3333333333333333, "gs_citation": 1, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=12765167249535678442&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=BI1N3lTWtn", "pdf": "https://openreview.net/pdf?id=BI1N3lTWtn", "email": "tsinghua.edu.cn;uw.edu;tsinghua.edu.cn", "author_num": 3, "aff_unique_index": "0;1;0", "aff_unique_norm": "Tsinghua University;University of Washington", "aff_unique_dep": ";", "aff_unique_url": "https://www.tsinghua.edu.cn;https://www.washington.edu", "aff_unique_abbr": "THU;UW", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;0", "aff_country_unique": "China;United States" }, { "id": "BIglOUjfXX", "title": "Forked Diffusion for Conditional Graph Generation", "track": "main", "status": "Reject", "tldr": "", "abstract": "We introduce a novel score-based diffusion framework that incorporates forking for conditional generation. In this framework, a single parent diffusion process is associated with a primary variable (e.g., structure), while multiple child diffusion processes are employed, each dedicated to a dependent variable (e.g., property). The parent process guides the co-evolution of its child processes towards segregated representation spaces. This approach allows our models to manage conditional information flow effectively, uncover intricate interactions and dependencies, and ultimately unlock new generative capabilities. Our experimental results demonstrate the significant superiority of our method over contemporary baselines in the context of conditional graph generation, highlighting the potential of forking diffusion for enhancing conditional generation tasks and inverse molecular design tasks.", "keywords": "conditional generative model;graph neural network;score-based diffusion", "primary_area": "generative models", "supplementary_material": "", "author": "Giangiacomo Mercatali;Yogesh Verma;Andre Freitas;Vikas Garg", "authorids": "~Giangiacomo_Mercatali1;~Yogesh_Verma1;~Andre_Freitas1;~Vikas_Garg2", "gender": ";M;;", "homepage": ";https://yoverma.github.io/yoerma.github.io/;http://andrefreitas.org;", "dblp": ";284/2155;47/9409.html;", "google_scholar": ";9W9u4owAAAAJ;ExmHmMoAAAAJ;", "orcid": ";;;", "linkedin": ";yogeshverma1998/;andrefreitas/;", "or_profile": "~Giangiacomo_Mercatali1;~Yogesh_Verma1;~Andre_Freitas1;~Vikas_Garg2", "aff": ";Aalto University;University of Manchester;", "aff_domain": ";aalto.fi;manchester.ac.uk;", "position": ";PhD student;Associate Professor;", "bibtex": "@misc{\nmercatali2024forked,\ntitle={Forked Diffusion for Conditional Graph Generation},\nauthor={Giangiacomo Mercatali and Yogesh Verma and Andre Freitas and Vikas Garg},\nyear={2024},\nurl={https://openreview.net/forum?id=BIglOUjfXX}\n}", "github": "", "project": "", "reviewers": "hTgA;GVsE;qecv;FTyY", "site": "https://openreview.net/forum?id=BIglOUjfXX", "pdf_size": 561353, "rating": "3;3;5;5", "confidence": "4;4;3;3", "soundness": "2;2;3;2", "contribution": "2;1;2;2", "presentation": "1;3;2;2", "wc_summary": "85;70;66;60", "wc_strengths": "27;54;51;10", "wc_weaknesses": "281;208;347;211", "wc_questions": "42;31;52;34", "wc_review": "435;363;516;315", "wc_reply_reviewers": "125;26;0;22", 
"wc_reply_authors": "690;519;643;448", "reply_reviewers": "1;1;0;1", "reply_authors": "1;1;1;1", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.25, 0.4330127018922193 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 2.0, 0.7071067811865476 ], "wc_summary_avg": [ 70.25, 9.229707470987366 ], "wc_strengths_avg": [ 35.5, 18.062391868188442 ], "wc_weaknesses_avg": [ 261.75, 57.23362211148269 ], "wc_questions_avg": [ 39.75, 8.13557004763649 ], "wc_review_avg": [ 407.25, 75.93541663808791 ], "wc_reply_reviewers_avg": [ 43.25, 48.225382320931374 ], "wc_reply_authors_avg": [ 575.0, 96.32497080196806 ], "reply_reviewers_avg": [ 0.75, 0.4330127018922193 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -1.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:5C871pxEaKQJ:scholar.google.com/&scioq=Forked+Diffusion+for+Conditional+Graph+Generation&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1", "aff_unique_norm": "Aalto University;University of Manchester", "aff_unique_dep": ";", "aff_unique_url": "https://www.aalto.fi;https://www.manchester.ac.uk", "aff_unique_abbr": "Aalto;UoM", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1", "aff_country_unique": "Finland;United Kingdom" }, { "title": "Equivariant Scalar Fields for Molecular Docking with Fast Fourier Transforms", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19222", "id": "BIveOmD1Nh", "author_site": "Bowen Jing, Tommi Jaakkola, Bonnie Berger", "tldr": "", "abstract": "Molecular docking is critical to structure-based virtual screening, yet the throughput of such workflows is limited by the expensive optimization of scoring functions involved in most docking algorithms. We explore how machine learning can accelerate this process by learning a scoring function with a functional form that allows for more rapid optimization. Specifically, we define the scoring function to be the cross-correlation of multi-channel ligand and protein scalar fields parameterized by equivariant graph neural networks, enabling rapid optimization over rigid-body degrees of freedom with fast Fourier transforms. The runtime of our approach can be amortized at several levels of abstraction, and is particularly favorable for virtual screening settings with a common binding pocket. We benchmark our scoring functions on two simplified docking-related tasks: decoy pose scoring and rigid conformer docking. Our method attains similar but faster performance on crystal structures compared to the widely-used Vina and Gnina scoring functions, and is more robust on computationally predicted structures. Code is available at https://github.com/bjing2016/scalar-fields.", "keywords": "protein structure;structural biology;drug discovery;molecular docking", "primary_area": "applications to physical sciences (physics, chemistry, biology, etc.)", "supplementary_material": "", "author": "Bowen Jing;Tommi S. 
Jaakkola;Bonnie Berger", "authorids": "~Bowen_Jing1;~Tommi_S._Jaakkola1;~Bonnie_Berger1", "gender": ";;F", "homepage": ";;https://people.csail.mit.edu/bab/", "dblp": ";;b/BonnieBerger", "google_scholar": ";;bYjKaowAAAAJ", "orcid": ";;", "linkedin": ";;", "or_profile": "~Bowen_Jing1;~Tommi_S._Jaakkola1;~Bonnie_Berger1", "aff": ";;Massachusetts Institute of Technology", "aff_domain": ";;mit.edu", "position": ";;Full Professor", "bibtex": "@inproceedings{\njing2024equivariant,\ntitle={Equivariant Scalar Fields for Molecular Docking with Fast Fourier Transforms},\nauthor={Bowen Jing and Tommi S. Jaakkola and Bonnie Berger},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=BIveOmD1Nh}\n}", "github": "", "project": "", "reviewers": "BpA5;ncny;9kCY", "pdf_size": 2238837, "rating": "5;6;8", "confidence": "3;3;4", "soundness": "3;4;4", "contribution": "2;3;4", "presentation": "3;4;4", "wc_summary": "37;109;55", "wc_strengths": "25;126;55", "wc_weaknesses": "39;107;55", "wc_questions": "21;170;61", "wc_review": "122;512;226", "wc_reply_reviewers": "0;50;8", "wc_reply_authors": "1087;815;540", "reply_reviewers": "0;1;1", "reply_authors": "3;3;1", "rating_avg": [ 6.333333333333333, 1.247219128924647 ], "confidence_avg": [ 3.3333333333333335, 0.4714045207910317 ], "soundness_avg": [ 3.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 3.0, 0.816496580927726 ], "presentation_avg": [ 3.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 67.0, 30.59411708155671 ], "wc_strengths_avg": [ 68.66666666666667, 42.35039026450117 ], "wc_weaknesses_avg": [ 67.0, 29.028721409436322 ], "wc_questions_avg": [ 84.0, 62.96559907335645 ], "wc_review_avg": [ 286.6666666666667, 164.89457911715056 ], "wc_reply_reviewers_avg": [ 19.333333333333332, 21.9291789378647 ], "wc_reply_authors_avg": [ 814.0, 223.31293439177827 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 2.3333333333333335, 0.9428090415820634 ], "replies_avg": [ 14, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.944911182523068, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=9739782478513044686&as_sdt=8005&sciodt=0,7&hl=en", "gs_version_total": 8, "openreview": "https://openreview.net/forum?id=BIveOmD1Nh", "pdf": "https://openreview.net/pdf?id=BIveOmD1Nh", "email": ";;mit.edu", "author_num": 3, "aff_unique_index": "0", "aff_unique_norm": "Massachusetts Institute of Technology", "aff_unique_dep": "", "aff_unique_url": "https://web.mit.edu", "aff_unique_abbr": "MIT", "aff_country_unique_index": "0", "aff_country_unique": "United States" }, { "id": "BJ4WgPgFqJ", "title": "PQ-VAE: Learning Hierarchical Discrete Representations with Progressive Quantization", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Variational auto-encoders (VAEs) are widely used in generative modeling and representation learning, with applications ranging from image generation to data compression. However, conventional VAEs face challenges in balancing the tradeoff between compactness and informativeness of the learned latent codes. In this work, we propose Progressive Quantization VAE (PQ-VAE), which aims to learn a progressive sequential structure for data representation that maximizes the mutual information between the latent representations and the original data in a limited description length. 
The resulting representations provide a global, compact, and hierarchical understanding of the data semantics, making it suitable for high-level tasks while achieving high compression rates. The proposed model offers an effective solution for generative modeling and data compression while enabling improved performance in high-level tasks such as image understanding and generation.", "keywords": "representation learning;deep generative models;variational autoencoders;VQ-VAE", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Lun Huang;Qiang Qiu;Guillermo Sapiro", "authorids": "~Lun_Huang1;~Qiang_Qiu1;~Guillermo_Sapiro1", "gender": ";;", "homepage": ";https://web.ics.purdue.edu/~qqiu/;", "dblp": "84/7455;97/360;82/5175", "google_scholar": "https://scholar.google.com/citations?hl=en;jdLtt_YAAAAJ;https://scholar.google.co.il/citations?user=ISRNX3gAAAAJ", "orcid": "0000-0001-5121-0460;;", "linkedin": ";;", "or_profile": "~Lun_Huang1;~Qiang_Qiu1;~Guillermo_Sapiro1", "aff": "Duke University;Purdue University;Duke University", "aff_domain": "duke.edu;purdue.edu;duke.edu", "position": "PhD student;Assistant Professor;Full Professor", "bibtex": "@misc{\nhuang2024pqvae,\ntitle={{PQ}-{VAE}: Learning Hierarchical Discrete Representations with Progressive Quantization},\nauthor={Lun Huang and Qiang Qiu and Guillermo Sapiro},\nyear={2024},\nurl={https://openreview.net/forum?id=BJ4WgPgFqJ}\n}", "github": "", "project": "", "reviewers": "L7SW;JP89;bWca", "site": "https://openreview.net/forum?id=BJ4WgPgFqJ", "pdf_size": 2645559, "rating": "1;3;3", "confidence": "4;4;4", "soundness": "1;2;2", "contribution": "1;2;3", "presentation": "1;2;1", "wc_summary": "49;36;128", "wc_strengths": "1;27;25", "wc_weaknesses": "533;286;87", "wc_questions": "22;2;298", "wc_review": "605;351;538", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 2.3333333333333335, 0.9428090415820634 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 1.6666666666666667, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.816496580927726 ], "presentation_avg": [ 1.3333333333333333, 0.4714045207910317 ], "wc_summary_avg": [ 71.0, 40.65300316909769 ], "wc_strengths_avg": [ 17.666666666666668, 11.8133634311129 ], "wc_weaknesses_avg": [ 302.0, 182.4298952109184 ], "wc_questions_avg": [ 107.33333333333333, 135.06870679604347 ], "wc_review_avg": [ 498.0, 107.48333204114331 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 3, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 2, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=3676146220517968528&as_sdt=5,48&sciodt=0,48&hl=en", "gs_version_total": 5, "aff_unique_index": "0;1;0", "aff_unique_norm": "Duke University;Purdue University", "aff_unique_dep": ";", "aff_unique_url": "https://www.duke.edu;https://www.purdue.edu", "aff_unique_abbr": "Duke;Purdue", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "title": "CellPLM: Pre-training of Cell Language Model Beyond Single Cells", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19221", "id": "BKXvPDekud", "author_site": "Hongzhi Wen, Wenzhuo Tang, Xinnan Dai, Jiayuan Ding, Wei Jin, Yuying Xie, Jiliang Tang", "tldr": 
"", "abstract": "The current state-of-the-art single-cell pre-trained models are greatly inspired by the success of large language models. They trained transformers by treating genes as tokens and cells as sentences. However, three fundamental differences between single-cell data and natural language data are overlooked: (1) scRNA-seq data are presented as bag-of-genes instead of sequences of RNAs; (2) Cell-cell relations are more intricate and important than inter-sentence relations; and (3) The quantity of single-cell data is considerably inferior to text data, and they are very noisy. In light of these characteristics, we propose a new pre-trained model, $\\textit{CellPLM}$, which takes cells as tokens and tissues as sentences. In addition, we leverage spatially-resolved transcriptomic data in pre-training to facilitate learning cell-cell relationships and introduce a Gaussian prior distribution as an additional inductive bias to overcome data limitations. $\\textit{CellPLM}$ is the first single-cell pre-trained transformer that encodes cell-cell relations and it consistently outperforms existing pre-trained and non-pre-trained models in diverse downstream tasks, with 100 times higher inference speed on generating cell embeddings than previous pre-trained models.", "keywords": "Single-cell analysis;Pretrained models;AI for science", "primary_area": "applications to physical sciences (physics, chemistry, biology, etc.)", "supplementary_material": "/attachment/565910ede0800a17a38788810da38efffdc30a34.zip", "author": "Hongzhi Wen;Wenzhuo Tang;Xinnan Dai;Jiayuan Ding;Wei Jin;Yuying Xie;Jiliang Tang", "authorids": "~Hongzhi_Wen1;~Wenzhuo_Tang1;~Xinnan_Dai1;~Jiayuan_Ding1;~Wei_Jin4;~Yuying_Xie1;~Jiliang_Tang1", "gender": "M;M;F;M;;M;M", "homepage": "https://www.cse.msu.edu/~wenhongz/;;;;http://www.cs.emory.edu/~wjin30/;https://cmse.msu.edu/directory/faculty/yuying-xie/;https://www.cse.msu.edu/~tangjili/", "dblp": "179/0477;;;197/1055;66/2173-9;24/2813-1;64/10812", "google_scholar": ";;LGKDd2AAAAAJ;7lwkXGEAAAAJ;eWow24EAAAAJ;https://scholar.google.com/citations?hl=en;WtzKMWAAAAAJ", "orcid": "0000-0003-0775-8538;;;;;0000-0002-1049-2219;0000-0001-7125-3898", "linkedin": ";wenzhuo-tang-66b757207;;jiayuand/;;yuying-xie-b754bb17/;", "or_profile": "~Hongzhi_Wen1;~Wenzhuo_Tang1;~Xinnan_Dai1;~Jiayuan_Ding1;~Wei_Jin4;~Yuying_Xie1;~Jiliang_Tang1", "aff": "Michigan State University;Michigan State University;Michigan State University;Michigan State University;Emory University;Michigan State University;Michigan State University", "aff_domain": "msu.edu;msu.edu;msu.edu;msu.edu;emory.edu;msu.edu;msu.edu", "position": "PhD student;PhD student;PhD student;PhD student;Assistant Professor;Associate Professor;Full Professor", "bibtex": "@inproceedings{\nwen2024cellplm,\ntitle={Cell{PLM}: Pre-training of Cell Language Model Beyond Single Cells},\nauthor={Hongzhi Wen and Wenzhuo Tang and Xinnan Dai and Jiayuan Ding and Wei Jin and Yuying Xie and Jiliang Tang},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=BKXvPDekud}\n}", "github": "", "project": "", "reviewers": "C7dG;1rfQ;QJ4u;3Haz", "pdf_size": 6685800, "rating": "6;6;6;8", "confidence": "2;2;4;4", "soundness": "3;3;3;4", "contribution": "3;3;3;3", "presentation": "3;3;3;4", "wc_summary": "18;70;137;62", "wc_strengths": "33;25;90;69", "wc_weaknesses": "234;72;378;95", "wc_questions": "5;2;3;96", "wc_review": "290;169;608;322", "wc_reply_reviewers": "30;0;0;0", "wc_reply_authors": 
"1175;773;2274;1325", "reply_reviewers": "2;0;0;0", "reply_authors": "4;3;7;3", "rating_avg": [ 6.5, 0.8660254037844386 ], "confidence_avg": [ 3.0, 1.0 ], "soundness_avg": [ 3.25, 0.4330127018922193 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 3.25, 0.4330127018922193 ], "wc_summary_avg": [ 71.75, 42.558048592481306 ], "wc_strengths_avg": [ 54.25, 26.47050245084139 ], "wc_weaknesses_avg": [ 194.75, 122.61601649050584 ], "wc_questions_avg": [ 26.5, 40.1403786728526 ], "wc_review_avg": [ 347.25, 160.9959238614444 ], "wc_reply_reviewers_avg": [ 7.5, 12.99038105676658 ], "wc_reply_authors_avg": [ 1386.75, 550.5798647789437 ], "reply_reviewers_avg": [ 0.5, 0.8660254037844386 ], "reply_authors_avg": [ 4.25, 1.6393596310755 ], "replies_avg": [ 25, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": 0.5773502691896257, "gs_citation": 24, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=15887212670928548591&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=BKXvPDekud", "pdf": "https://openreview.net/pdf?id=BKXvPDekud", "email": "msu.edu;msu.edu;msu.edu;msu.edu;emory.edu;msu.edu;msu.edu", "author_num": 7, "aff_unique_index": "0;0;0;0;1;0;0", "aff_unique_norm": "Michigan State University;Emory University", "aff_unique_dep": ";", "aff_unique_url": "https://www.msu.edu;https://www.emory.edu", "aff_unique_abbr": "MSU;Emory", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "BKinRUoBN9", "title": "Investigating the Impact of Data Distribution Shifts on Cross-Modal Knowledge Distillation", "track": "main", "status": "Reject", "tldr": "", "abstract": "Cross-modal knowledge distillation (KD) has expanded the traditional KD approach to encompass multimodal learning, achieving notable success in various applications. However, in cases where there is a considerable shift in data distribution during cross-modal KD, even a more accurate teacher model may not effectively instruct the student model. In this paper, we conduct a comprehensive analysis and evaluation of the effectiveness of cross-modal KD, focusing on its dependence on the distribution shifts in multimodal data. We initially view cross-modal KD as training a maximum entropy model using pseudo-labels and establish conditions under which it outperforms unimodal KD. Subsequently, we introduced the hypothesis of solution space divergence, which unveils the crucial factor influencing the efficacy of cross-modal KD. Our key observation is that the accuracy of the teacher model is not the primary determinant of the student model's accuracy; instead, the data distribution shifts play a more significant role. We demonstrate that as the data distribution shifts decrease, the effectiveness of cross-modal KD improves, and vice versa. Finally, to address significant data distribution differences, we propose a method called the ``perceptual solution space mask'' to enhance the effectiveness of cross-modal KD. Through experimental results on four multimodal datasets, we validate our assumptions and provide directions for future enhancements in cross-modal knowledge transfer. 
Notably, our enhanced KD method demonstrated an approximate 2\\% improvement in \\emph{mIoU} compared to the Baseline on the SemanticKITTI dataset.", "keywords": "Cross-Modal Knowledge Distillation; Data distribution shifts", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/671da5f37467b3eba247f38a874b6f5c82bb5e95.zip", "author": "Yilong Chen;Zongyi Xu;Xiaoshui Huang;Xinbo Gao", "authorids": "~Yilong_Chen1;~Zongyi_Xu1;~Xiaoshui_Huang1;~Xinbo_Gao5", "gender": "F;Not Specified;M;M", "homepage": ";https://xiaoshuihuang.github.io/;https://faculty.cqupt.edu.cn/gaoxinbo/zh_CN/index.htm;", "dblp": "125/3642;167/9599;;", "google_scholar": "PUseiVAAAAAJ;https://scholar.google.ca/citations?user=rp7mYNsAAAAJ;https://scholar.google.com/citations?hl=zh-CN;DsNNLTwAAAAJ", "orcid": ";;0000-0002-7985-0037;0000-0002-3649-3519", "linkedin": ";;xinbo-gao-151a2224/;", "or_profile": "~Zongyi_Xu1;~Xiaoshui_Huang1;~Xinbo_Gao5;~Elon_Chen1", "aff": "Chongqing University of Post and Telecommunications;Shanghai AI Laboratory;Chongqing University of Post and Telecommunications;Chongqing University of Post and Telecommunications", "aff_domain": "cqupt.edu.cn;pjlab.org.cn;cqupt.edu.cn;cqupt.edu.cn", "position": "Associate Professor;Research Fellow;Full Professor;PhD student", "bibtex": "@misc{\nchen2024investigating,\ntitle={Investigating the Impact of Data Distribution Shifts on Cross-Modal Knowledge Distillation},\nauthor={Yilong Chen and Zongyi Xu and Xiaoshui Huang and Xinbo Gao},\nyear={2024},\nurl={https://openreview.net/forum?id=BKinRUoBN9}\n}", "github": "", "project": "", "reviewers": "Pm6d;voCm;GxY4;NCD3", "site": "https://openreview.net/forum?id=BKinRUoBN9", "pdf_size": 24818612, "rating": "5;5;6;6", "confidence": "4;3;3;3", "soundness": "3;3;3;3", "contribution": "2;3;3;3", "presentation": "2;3;3;3", "wc_summary": "67;60;19;66", "wc_strengths": "46;70;21;104", "wc_weaknesses": "147;52;57;104", "wc_questions": "44;42;49;5", "wc_review": "304;224;146;279", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "554;340;544;367", "reply_reviewers": "0;0;0;0", "reply_authors": "1;1;1;1", "rating_avg": [ 5.5, 0.5 ], "confidence_avg": [ 3.25, 0.4330127018922193 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 53.0, 19.81161275615895 ], "wc_strengths_avg": [ 60.25, 30.629846555280032 ], "wc_weaknesses_avg": [ 90.0, 38.658763560155414 ], "wc_questions_avg": [ 35.0, 17.507141400011598 ], "wc_review_avg": [ 238.25, 60.615076507416866 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 451.25, 98.2786217852082 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 10, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.5773502691896257, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:5Tm2TZStsRkJ:scholar.google.com/&scioq=Investigating+the+Impact+of+Data+Distribution+Shifts+on+Cross-Modal+Knowledge+Distillation&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1;0;0", "aff_unique_norm": "Chongqing University of Post and Telecommunications;Shanghai AI Laboratory", "aff_unique_dep": ";", "aff_unique_url": "http://www.cqupt.edu.cn;https://www.shanghai-ai-lab.com", "aff_unique_abbr": "CQUPT;SAIL", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "China" }, { 
"title": "LogicMP: A Neuro-symbolic Approach for Encoding First-order Logic Constraints", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19220", "id": "BLGQ3oqldb", "author_site": "Weidi Xu, Jingwei Wang, Lele Xie, Jianshan He, Hongting Zhou, Taifeng Wang, Xiaopei Wan, Jingdong Chen, Chao Qu, Wei Chu", "tldr": "", "abstract": "Integrating first-order logic constraints (FOLCs) with neural networks is a crucial but challenging problem since it involves modeling intricate correlations to satisfy the constraints. This paper proposes a novel neural layer, LogicMP, which performs mean-field variational inference over a Markov Logic Network (MLN). It can be plugged into any off-the-shelf neural network to encode FOLCs while retaining modularity and efficiency. By exploiting the structure and symmetries in MLNs, we theoretically demonstrate that our well-designed, efficient mean-field iterations greatly mitigate the difficulty of MLN inference, reducing the inference from sequential calculation to a series of parallel tensor operations. Empirical results in three kinds of tasks over images, graphs, and text show that LogicMP outperforms advanced competitors in both performance and efficiency.", "keywords": "Variational Inference", "primary_area": "probabilistic methods (Bayesian methods, variational inference, sampling, UQ, etc.)", "supplementary_material": "/attachment/78afeaa0ecb9c0bbfd077557c85242e1ea59347b.zip", "author": "Weidi Xu;Jingwei Wang;Lele Xie;Jianshan He;Hongting Zhou;Taifeng Wang;Xiaopei Wan;Jingdong Chen;Chao Qu;Wei Chu", "authorids": "~Weidi_Xu1;~Jingwei_Wang1;~Lele_Xie1;~Jianshan_He1;~Hongting_Zhou1;~Taifeng_Wang2;~Xiaopei_Wan2;~Jingdong_Chen1;~Chao_Qu3;~Wei_Chu1", "gender": "M;;M;M;F;M;M;M;M;M", "homepage": ";;;;https://github.com/Nurikol;https://scholar.google.com/citations?user=aMNBEk0AAAAJ&hl=zh-CN;;;;http://weichu.github.io", "dblp": "00/11534;;214/0068;225/5402;253/0325;01/1483;;33/5656;;", "google_scholar": ";;vH97Cd4AAAAJ;https://scholar.google.com.hk/citations?user=0bq6rAkAAAAJ;;aMNBEk0AAAAJ;zU9TT-AAAAAJ;8SCEv-YAAAAJ;DI2NyPsAAAAJ;3J4zb7gAAAAJ", "orcid": "0000-0002-7279-9339;;;;;;;0000-0002-1872-2592;;", "linkedin": ";;;;%E8%99%B9%E5%BB%B7-%E5%91%A8-6524b6149/;;;;;", "or_profile": "~Weidi_Xu1;~Jingwei_Wang1;~Lele_Xie1;~Jianshan_He1;~Hongting_Zhou1;~Taifeng_Wang2;~Xiaopei_Wan2;~Jingdong_Chen1;~Chao_Qu3;~Wei_Chu1", "aff": "Infly Technology;;Ant Group;Ant Group;Antgroup;BioMap;;Ant Group;Inftech;Inf Tech", "aff_domain": "inftech.ai;;antgroup.com;antgroup.com;antgroup.com;biomap.com;;antgroup.com;inftech.ai;inftech.ai", "position": "Researcher;;Researcher;Researcher;Researcher;Principal Researcher;;Senior Staff Algorithm Engineer;Researcher;Researcher", "bibtex": "@inproceedings{\nxu2024logicmp,\ntitle={Logic{MP}: A Neuro-symbolic Approach for Encoding First-order Logic Constraints},\nauthor={Weidi Xu and Jingwei Wang and Lele Xie and Jianshan He and Hongting Zhou and Taifeng Wang and Xiaopei Wan and Jingdong Chen and Chao Qu and Wei Chu},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=BLGQ3oqldb}\n}", "github": "", "project": "", "reviewers": "RzRh;svJm;9vvz;XeZX", "pdf_size": 2972462, "rating": "5;5;6;8", "confidence": "3;2;4;4", "soundness": "3;2;2;3", "contribution": "1;2;2;3", "presentation": "2;1;3;3", "wc_summary": "35;26;67;94", "wc_strengths": "13;106;37;48", "wc_weaknesses": "133;177;126;154", "wc_questions": "72;2;131;96", "wc_review": 
"253;311;361;392", "wc_reply_reviewers": "0;0;89;4", "wc_reply_authors": "743;1175;1788;649", "reply_reviewers": "0;0;1;1", "reply_authors": "1;2;4;1", "rating_avg": [ 6.0, 1.224744871391589 ], "confidence_avg": [ 3.25, 0.82915619758885 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 2.25, 0.82915619758885 ], "wc_summary_avg": [ 55.5, 26.949025956423732 ], "wc_strengths_avg": [ 51.0, 34.18332927027442 ], "wc_weaknesses_avg": [ 147.5, 19.90602923739438 ], "wc_questions_avg": [ 75.25, 47.20897690058534 ], "wc_review_avg": [ 329.25, 52.661062465544695 ], "wc_reply_reviewers_avg": [ 23.25, 37.995887935406905 ], "wc_reply_authors_avg": [ 1088.75, 449.80905671184524 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 2.0, 1.224744871391589 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 10, 0 ], "corr_rating_confidence": 0.7385489458759963, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:DjV_uspSItUJ:scholar.google.com/&scioq=LogicMP:+A+Neuro-symbolic+Approach+for+Encoding+First-order+Logic+Constraints&hl=en&as_sdt=0,5", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=BLGQ3oqldb", "pdf": "https://openreview.net/pdf?id=BLGQ3oqldb", "email": "inftech.ai;;antgroup.com;antgroup.com;antgroup.com;biomap.com;;antgroup.com;inftech.ai;inftech.ai", "author_num": 10, "aff_unique_index": "0;1;1;2;3;1;4;5", "aff_unique_norm": "Infly Technology;Ant Group;Antgroup;BioMap;Inftech;Information Technology", "aff_unique_dep": ";;;;;", "aff_unique_url": ";https://www.antgroup.com;https://www.antgroup.com;;;", "aff_unique_abbr": ";Ant Group;Antgroup;;;", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "1;1;1;1", "aff_country_unique": ";China" }, { "id": "BMZYh3IyAU", "title": "Provably Doubly Accelerated Federated Learning: The First Theoretically Successful Combination of Local Training and Communication Compression", "track": "main", "status": "Desk Reject", "tldr": "", "abstract": "In federated learning, a large number of users collaborate to learn a global model. They alternate local computations and two-way communication with a distant server. Communication, which can be slow and costly, is the main bottleneck in this setting. To reduce the communication load and therefore accelerate distributed gradient descent, two strategies are popular: 1) communicate less frequently; that is, perform several iterations of local computations between the communication rounds; and 2) communicate compressed information instead of full-dimensional vectors. 
We propose the first algorithm for distributed optimization and federated learning, which harnesses these two strategies jointly and converges linearly to an exact solution in the strongly convex setting, with a doubly accelerated rate: our algorithm benefits from the two acceleration mechanisms provided by local training and compression, namely a better dependency on the condition number of the functions and on the dimension of the model, respectively.", "keywords": "Federated learning;local training;compression;communication;optimization", "primary_area": "optimization", "supplementary_material": "/attachment/8c0d96120d9d802906205931fc08aa1f095fa4d6.zip", "author": "Laurent Condat;Ivan Agarsk\u00fd;Peter Richt\u00e1rik", "authorids": "~Laurent_Condat1;~Ivan_Agarsk\u00fd1;~Peter_Richt\u00e1rik1", "gender": "M;M;M", "homepage": "https://lcondat.github.io/;;https://richtarik.org", "dblp": "88/1335;331/8298;62/8001", "google_scholar": "PixYHyEAAAAJ;534mR8QAAAAJ;https://scholar.google.com/citations?hl=en", "orcid": "0000-0001-7087-1002;0000-0003-2007-881X;0000-0003-4380-5848", "linkedin": "laurent-condat-40291720b/;agarsky/;richtarik/", "or_profile": "~Laurent_Condat1;~Ivan_Agarsk\u00fd1;~Peter_Richtarik1", "aff": "KAUST;Kempelen Institute of Intelligent Technologies;King Abdullah University of Science and Technology (KAUST)", "aff_domain": "kaust.edu.sa;kinit.sk;kaust.edu.sa", "position": "research scientist;PhD student;Full Professor", "bibtex": "@misc{\ncondat2024provably,\ntitle={Provably Doubly Accelerated Federated Learning: The First Theoretically Successful Combination of Local Training and Communication Compression},\nauthor={Laurent Condat and Ivan Agarsk{\\'y} and Peter Richt{\\'a}rik},\nyear={2024},\nurl={https://openreview.net/forum?id=BMZYh3IyAU}\n}", "github": "", "project": "", "reviewers": "Va6u;5itr", "site": "https://openreview.net/forum?id=BMZYh3IyAU", "pdf_size": 1077068, "rating": "6;6", "confidence": "3;3", "soundness": "3;3", "contribution": "3;3", "presentation": "2;4", "wc_summary": "49;56", "wc_strengths": "48;48", "wc_weaknesses": "57;181", "wc_questions": "278;103", "wc_review": "432;388", "wc_reply_reviewers": "0;22", "wc_reply_authors": "965;742", "reply_reviewers": "0;1", "reply_authors": "2;1", "rating_avg": [ 6.0, 0.0 ], "confidence_avg": [ 3.0, 0.0 ], "soundness_avg": [ 3.0, 0.0 ], "contribution_avg": [ 3.0, 0.0 ], "presentation_avg": [ 3.0, 1.0 ], "wc_summary_avg": [ 52.5, 3.5 ], "wc_strengths_avg": [ 48.0, 0.0 ], "wc_weaknesses_avg": [ 119.0, 62.0 ], "wc_questions_avg": [ 190.5, 87.5 ], "wc_review_avg": [ 410.0, 22.0 ], "wc_reply_reviewers_avg": [ 11.0, 11.0 ], "wc_reply_authors_avg": [ 853.5, 111.5 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.5, 0.5 ], "replies_avg": [ 6, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 22, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=7249144093151301792&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 5, "aff_unique_index": "0;1;0", "aff_unique_norm": "King Abdullah University of Science and Technology;Kempelen Institute of Intelligent Technologies", "aff_unique_dep": ";", "aff_unique_url": "https://www.kaust.edu.sa;http://www.kempeleninstitute.com", "aff_unique_abbr": "KAUST;", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;0", "aff_country_unique": "Saudi Arabia;Hungary" }, { "id": "BMw4Cm0gGO", "title": "C-MCTS: Safe Planning with Monte Carlo Tree Search", "track": "main", "status": "Reject", "tldr": "", 
"abstract": "The Constrained Markov Decision Process (CMDP) allows to solve safety-critical decision making tasks that are subject to constraints. \nWhile CMDPs have been extensively studied in the Reinforcement Learning literature, little attention has been given to sampling-based planning algorithms such as MCTS for solving them. Previous approaches perform conservatively with respect to costs as they avoid constraint violations by using Monte Carlo cost estimates that suffer from high variance. We propose Constrained MCTS (C-MCTS), which estimates cost using a safety critic that is trained with Temporal Difference learning in an offline phase prior to agent deployment. The critic limits exploration by pruning unsafe trajectories within MCTS during deployment. C-MCTS satisfies cost constraints but operates closer to the constraint boundary, achieving higher rewards than previous work. As a nice byproduct, the planner is more efficient w.r.t. planning steps. Most importantly, under model mismatch between the planner and the real world, C-MCTS is less susceptible to cost violations than previous work.", "keywords": "Monte Carlo Tree Search;Safety Critic;Safe Reinforcement Learning;Reinforcement Learning;RL", "primary_area": "reinforcement learning", "supplementary_material": "/attachment/e2339d1062b46e11afc46da672c9047490f63e34.zip", "author": "Dinesh Parthasarathy;Georgios Kontes;Axel Plinge;Christopher Mutschler", "authorids": "~Dinesh_Parthasarathy1;~Georgios_Kontes1;~Axel_Plinge1;~Christopher_Mutschler1", "gender": "M;;M;M", "homepage": ";;https://www.iis.fraunhofer.de/;https://www.cmutschler.de", "dblp": ";;36/1064;118/7748", "google_scholar": ";;TLskmTcAAAAJ;https://scholar.google.de/citations?user=gKDSp8YAAAAJ", "orcid": ";;0000-0001-7757-2953;0000-0001-8108-0230", "linkedin": "dineshkumar-93/;;aplinge/;christopher-mutschler-28431576/", "or_profile": "~Dinesh_Parthasarathy1;~Georgios_Kontes1;~Axel_Plinge1;~Christopher_Mutschler1", "aff": "Lawrence Livermore National Labs;;;Fraunhofer IIS", "aff_domain": "llnl.gov;;;fraunhofer.de", "position": "Intern;;;Principal Researcher", "bibtex": "@misc{\nparthasarathy2024cmcts,\ntitle={C-{MCTS}: Safe Planning with Monte Carlo Tree Search},\nauthor={Dinesh Parthasarathy and Georgios Kontes and Axel Plinge and Christopher Mutschler},\nyear={2024},\nurl={https://openreview.net/forum?id=BMw4Cm0gGO}\n}", "github": "", "project": "", "reviewers": "DU49;q4t7;EfYF;q5zX", "site": "https://openreview.net/forum?id=BMw4Cm0gGO", "pdf_size": 483528, "rating": "3;5;5;5", "confidence": "5;3;3;3", "soundness": "2;2;1;3", "contribution": "2;2;2;2", "presentation": "3;3;2;3", "wc_summary": "49;95;41;35", "wc_strengths": "66;59;33;17", "wc_weaknesses": "64;135;178;29", "wc_questions": "88;353;52;226", "wc_review": "267;642;304;307", "wc_reply_reviewers": "17;25;31;17", "wc_reply_authors": "619;2040;1010;1081", "reply_reviewers": "1;1;1;1", "reply_authors": "1;3;2;2", "rating_avg": [ 4.5, 0.8660254037844386 ], "confidence_avg": [ 3.5, 0.8660254037844386 ], "soundness_avg": [ 2.0, 0.7071067811865476 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 55.0, 23.62202362203543 ], "wc_strengths_avg": [ 43.75, 19.74050404624968 ], "wc_weaknesses_avg": [ 101.5, 58.38878316937252 ], "wc_questions_avg": [ 179.75, 119.2610057814372 ], "wc_review_avg": [ 380.0, 152.08385844658204 ], "wc_reply_reviewers_avg": [ 22.5, 5.894913061275798 ], "wc_reply_authors_avg": [ 1187.5, 522.6846563655757 ], "reply_reviewers_avg": [ 1.0, 
0.0 ], "reply_authors_avg": [ 2.0, 0.7071067811865476 ], "replies_avg": [ 18, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -1.0, "gs_citation": 6, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=15509113104036491848&as_sdt=2005&sciodt=0,5&hl=en", "gs_version_total": 3, "aff_unique_index": "0;1", "aff_unique_norm": "Lawrence Livermore National Laboratory;Fraunhofer Institute for Integrated Circuits", "aff_unique_dep": ";", "aff_unique_url": "https://www.llnl.gov;https://www.iis.fraunhofer.de/", "aff_unique_abbr": "LLNL;Fraunhofer IIS", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1", "aff_country_unique": "United States;Germany" }, { "id": "BO3aRwGzq0", "title": "DINAR: Fine-Grained Privacy Preserving Federated Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "Federated Learning (FL) enables collaborative model training among several participants, while keeping local data private at the participants' premises.However, despite its merits, FL remains vulnerable to privacy attacks, and in particular, to membership inference attacks that allow adversaries to deduce confidential information about participants' training data.\nIn this paper, we propose DINAR, a novel privacy-preserving FL method. DINAR follows a fine-grained approach that specifically tackles FL neural network layers that leak more private information than other layers, thus, efficiently protecting the FL model against membership inference attacks in a non-intrusive way. And in order to compensate for any potential loss in the accuracy of the protected model, DINAR combines the proposed fine-grained approach with adaptive gradient descent.The paper presents our extensive empirical evaluation of DINAR, conducted with six widely used datasets, four neural networks, and comparing against three state-of-the-art FL privacy protection mechanisms.The evaluation results show that DINAR reduces the membership inference attack success rate to reach its optimal value, without hurting model accuracy, and without inducing computational overhead. 
In contrast, existing FL defense mechanisms incur an overhead of up to +36% and +3,000% on respectively FL client-side and FL server-side computation times, and up to +168% on memory usage.", "keywords": "Federetad Learning;Privacy;Membership Inference Attacks;Cross-Silo Federated Learning", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "C\u00e9dric BOSCHER;Fatima Elhattab;Sara Bouchenak", "authorids": "~C\u00e9dric_BOSCHER1;~Fatima_Elhattab1;~Sara_Bouchenak1", "gender": "M;F;F", "homepage": "https://liris.cnrs.fr/page-membre/cedric-boscher;https://liris.cnrs.fr/page-membre/fatima-el-hattab;https://perso.liris.cnrs.fr/sara.bouchenak/", "dblp": ";;", "google_scholar": ";;", "orcid": ";;", "linkedin": ";;sara-bouchenak-587bbb24/", "or_profile": "~C\u00e9dric_BOSCHER1;~Fatima_Elhattab1;~Sara_Bouchenak1", "aff": "Institut National des Sciences Appliqu\u00e9es de Lyon;;Institut National des Sciences Appliqu\u00e9es de Lyon", "aff_domain": "insa-lyon.fr;;insa-lyon.fr", "position": "PhD student;;Full Professor", "bibtex": "@misc{\nboscher2024dinar,\ntitle={{DINAR}: Fine-Grained Privacy Preserving Federated Learning},\nauthor={C{\\'e}dric BOSCHER and Fatima Elhattab and Sara Bouchenak},\nyear={2024},\nurl={https://openreview.net/forum?id=BO3aRwGzq0}\n}", "github": "", "project": "", "reviewers": "nS4z;AcVa;uPn1;Y9fY", "site": "https://openreview.net/forum?id=BO3aRwGzq0", "pdf_size": 1213686, "rating": "5;5;5;5", "confidence": "3;4;4;4", "soundness": "2;2;3;3", "contribution": "2;3;2;3", "presentation": "2;3;3;3", "wc_summary": "73;71;120;65", "wc_strengths": "16;42;107;46", "wc_weaknesses": "29;129;702;100", "wc_questions": "175;4;6;110", "wc_review": "293;246;935;321", "wc_reply_reviewers": "88;13;11;0", "wc_reply_authors": "454;519;704;624", "reply_reviewers": "2;1;1;0", "reply_authors": "3;2;2;2", "rating_avg": [ 5.0, 0.0 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 2.5, 0.5 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 82.25, 21.992896580487074 ], "wc_strengths_avg": [ 52.75, 33.37195679009548 ], "wc_weaknesses_avg": [ 240.0, 269.20531198325193 ], "wc_questions_avg": [ 73.75, 72.49267204345554 ], "wc_review_avg": [ 448.75, 282.0127435063884 ], "wc_reply_reviewers_avg": [ 28.0, 34.99285641384538 ], "wc_reply_authors_avg": [ 575.25, 95.94106263743382 ], "reply_reviewers_avg": [ 1.0, 0.7071067811865476 ], "reply_authors_avg": [ 2.25, 0.4330127018922193 ], "replies_avg": [ 21, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:0N-qxFgLJj8J:scholar.google.com/&scioq=DINAR:+Fine-Grained+Privacy+Preserving+Federated+Learning&hl=en&as_sdt=0,48", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "Institut National des Sciences Appliqu\u00e9es", "aff_unique_dep": "", "aff_unique_url": "https://www.insa-lyon.fr", "aff_unique_abbr": "INSA Lyon", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Lyon", "aff_country_unique_index": "0;0", "aff_country_unique": "France" }, { "title": "LMSYS-Chat-1M: A Large-Scale Real-World LLM Conversation Dataset", "status": "Spotlight", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19219", "id": "BOfDKxfwt0", "author_site": "Lianmin Zheng, Wei-Lin Chiang, Ying Sheng, Tianle Li, Siyuan Zhuang, Zhanghao Wu, Yonghao Zhuang, Zhuohan Li, Zi Lin, Eric Xing, Joseph E Gonzalez, Ion Stoica, 
Hao Zhang", "tldr": "", "abstract": "Studying how people interact with large language models (LLMs) in real-world scenarios is increasingly important due to their widespread use in various applications. In this paper, we introduce LMSYS-Chat-1M, a large-scale dataset containing one million real-world conversations with 25 state-of-the-art LLMs. This dataset is collected from 210K unique IP addresses in the wild on our Vicuna demo and Chatbot Arena website. We offer an overview of the dataset's content, including its curation process, basic statistics, and topic distribution, highlighting its diversity, originality, and scale. We demonstrate its versatility through four use cases: developing content moderation models that perform similarly to GPT-4, building a safety benchmark, training instruction-following models that perform similarly to Vicuna, and creating challenging benchmark questions. We believe that this dataset will serve as a valuable resource for understanding and advancing LLM capabilities. The dataset is publicly available at https://huggingface.co/datasets/lmsys/lmsys-chat-1m.", "keywords": "large language models;dataset;conversation;safety;benchmark", "primary_area": "datasets and benchmarks", "supplementary_material": "", "author": "Lianmin Zheng;Wei-Lin Chiang;Ying Sheng;Tianle Li;Siyuan Zhuang;Zhanghao Wu;Yonghao Zhuang;Zhuohan Li;Zi Lin;Eric Xing;Joseph E. Gonzalez;Ion Stoica;Hao Zhang", "authorids": "~Lianmin_Zheng2;~Wei-Lin_Chiang1;~Ying_Sheng1;~Tianle_Li2;~Siyuan_Zhuang1;~Zhanghao_Wu1;~Yonghao_Zhuang1;~Zhuohan_Li1;~Zi_Lin1;~Eric_Xing1;~Joseph_E._Gonzalez1;~Ion_Stoica1;~Hao_Zhang2", "gender": "M;;F;M;M;M;M;M;F;M;M;M;M", "homepage": "http://lmzheng.net/;https://infwinston.github.io/;https://sites.google.com/view/yingsheng;;https://suquark.github.io/;https://zhanghaowu.me;https://zyhowell.github.io/;http://zhuohan.li;https://zi-lin.com/;http://www.cs.cmu.edu/~epxing/;http://eecs.berkeley.edu/~jegonzal;http://people.eecs.berkeley.edu/~istoica/;https://cseweb.ucsd.edu/~haozhang/", "dblp": "211/7027;174/2148;262/6232.html;;;;;;81/2999;36/3855;61/8262;s/IonStoica;55/2270-25", "google_scholar": "_7Q8uIYAAAAJ;https://scholar.google.com/citations?hl=en;xMhGYpgAAAAJ;1M79iLwAAAAJ;KSZmI5EAAAAJ;YfyMDFgAAAAJ;oh297TsAAAAJ;;kgZYttUAAAAJ;https://scholar.google.com.tw/citations?user=5pKTRxEAAAAJ;https://scholar.google.com.tw/citations?user=gM2WW9UAAAAJ;vN-is70AAAAJ;H1d4BS8AAAAJ", "orcid": ";;0000-0002-1883-2126;;0009-0007-3787-0316;;;;;;0000-0003-2921-956X;;", "linkedin": ";;;tianleli/;siyuanzhuang;;;;zi-lin/;;;ionstoica;", "or_profile": "~Lianmin_Zheng2;~Wei-Lin_Chiang1;~Ying_Sheng1;~Tianle_Li2;~Siyuan_Zhuang1;~Zhanghao_Wu1;~Yonghao_Zhuang1;~Zhuohan_Li1;~Zi_Lin1;~Eric_Xing1;~Joseph_E._Gonzalez1;~Ion_Stoica1;~Hao_Zhang2", "aff": "University of California, Berkeley;University of California, Berkeley;Stanford University;University of California, Berkeley;University of California, Berkeley;University of California, Berkeley;Carnegie Mellon University;University of California, Berkeley;University of California, San Diego;School of Computer Science, Carnegie Mellon University;University of California, Berkeley;University of California, Berkeley;Carnegie Mellon University", "aff_domain": "berkeley.edu;berkeley.edu;stanford.edu;berkeley.edu;berkeley.edu;berkeley.edu;andrew.cmu.edu;berkeley.edu;ucsd.edu;cs.cmu.edu;berkeley.edu;berkeley.edu;cmu.edu", "position": "PhD student;PhD student;PhD student;Undergrad student;PhD student;PhD student;PhD student;PhD student;Graduate student;Full 
Professor;Associate Professor;Full Professor;PhD student", "bibtex": "@inproceedings{\nzheng2024lmsyschatm,\ntitle={{LMSYS}-Chat-1M: A Large-Scale Real-World {LLM} Conversation Dataset},\nauthor={Lianmin Zheng and Wei-Lin Chiang and Ying Sheng and Tianle Li and Siyuan Zhuang and Zhanghao Wu and Yonghao Zhuang and Zhuohan Li and Zi Lin and Eric Xing and Joseph E. Gonzalez and Ion Stoica and Hao Zhang},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=BOfDKxfwt0}\n}", "github": "", "project": "", "reviewers": "M7pJ;kFoy;hTkb;D9AT", "pdf_size": 916611, "rating": "6;8;8;8", "confidence": "4;4;4;4", "soundness": "2;3;4;3", "contribution": "4;4;3;4", "presentation": "3;3;3;3", "wc_summary": "55;47;69;45", "wc_strengths": "94;110;94;81", "wc_weaknesses": "61;70;141;26", "wc_questions": "2;10;2;32", "wc_review": "212;237;306;184", "wc_reply_reviewers": "0;0;10;10", "wc_reply_authors": "196;163;331;178", "reply_reviewers": "0;0;1;1", "reply_authors": "1;1;1;1", "rating_avg": [ 7.5, 0.8660254037844386 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 3.0, 0.7071067811865476 ], "contribution_avg": [ 3.75, 0.4330127018922193 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 54.0, 9.433981132056603 ], "wc_strengths_avg": [ 94.75, 10.280442597476044 ], "wc_weaknesses_avg": [ 74.5, 41.76421913552317 ], "wc_questions_avg": [ 11.5, 12.278029157808675 ], "wc_review_avg": [ 234.75, 45.20716204319842 ], "wc_reply_reviewers_avg": [ 5.0, 5.0 ], "wc_reply_authors_avg": [ 217.0, 66.84683986547158 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 1.0, 0.0 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 13, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 160, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=1730324882341676130&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 5, "openreview": "https://openreview.net/forum?id=BOfDKxfwt0", "pdf": "https://openreview.net/pdf?id=BOfDKxfwt0", "email": "berkeley.edu;berkeley.edu;stanford.edu;berkeley.edu;berkeley.edu;berkeley.edu;andrew.cmu.edu;berkeley.edu;ucsd.edu;cs.cmu.edu;berkeley.edu;berkeley.edu;cmu.edu", "author_num": 13, "aff_unique_index": "0;0;1;0;0;0;2;0;3;2;0;0;2", "aff_unique_norm": "University of California, Berkeley;Stanford University;Carnegie Mellon University;University of California, San Diego", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.berkeley.edu;https://www.stanford.edu;https://www.cmu.edu;https://www.ucsd.edu", "aff_unique_abbr": "UC Berkeley;Stanford;CMU;UCSD", "aff_campus_unique_index": "0;0;1;0;0;0;0;3;4;0;0", "aff_campus_unique": "Berkeley;Stanford;;San Diego;Pittsburgh", "aff_country_unique_index": "0;0;0;0;0;0;0;0;0;0;0;0;0", "aff_country_unique": "United States" }, { "id": "BOm1RYdHHu", "title": "SAFHE: Defending Against Backdoor and Gradient Inversion Attacks in Federated Learning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Federated learning (FL) is an increasingly popular approach in machine learning that enables a set of clients to jointly train a global model without ever sharing their private data, using a central server to aggregate clients' local weight updates. 
However, previous work has shown that the distributed nature of federated learning makes it susceptible to two major attacks: backdoor attacks, where malicious clients submit large weights that incorrectly change model behavior, and gradient inversion attacks, where a malicious eavesdropper is able to reconstruct the clients' training data by viewing the weight updates sent by clients to the central server. Although various solutions have been proposed in the literature that defend against these two attacks separately, present approaches remain largely incompatible, creating a trade-off between defending against the two types of attacks. This poses a major challenge in deploying FL in privacy-sensitive ML applications.\n\nWe present SAFHE (Secure Aggregation with Fully Homomorphic Encryption), a novel scheme to defend against both backdoor attacks and gradient inversion attacks. Our secure aggregation method combines the use of fully homomorphic encryption (FHE) and the gradient norm clipping defense to defend against large malicious client updates, by pre-weighting client updates using a function that can be evaluated in the encrypted domain. This allows the server to reject large-magnitude updates without seeing their cleartext values. We demonstrate that Chebyshev approximations of a product of sigmoids work for this purpose, and perform simulations suggesting that such a scheme can defend against backdoor attacks without significantly impacting model accuracy. Additionally, we show that these approximations can be accurately and efficiently computed in the encrypted domain.", "keywords": "federated learning;fully homomorphic encryption;backdoor attacks;gradient inversion attacks", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "", "author": "Jordan Barkin;Ratip Emin Berker;S\u00edlvia Casacuberta;Janet Li", "authorids": "~Jordan_Barkin1;~Ratip_Emin_Berker1;~S\u00edlvia_Casacuberta1;~Janet_Li1", "gender": "M;M;;F", "homepage": ";;;", "dblp": ";315/8807.html;;", "google_scholar": ";HxaUFCkAAAAJ;;", "orcid": ";;;", "linkedin": "jordan-barkin/;;;janetli19/", "or_profile": "~Jordan_Barkin1;~Ratip_Emin_Berker1;~S\u00edlvia_Casacuberta1;~Janet_Li1", "aff": ";Carnegie Mellon University;;Harvard University", "aff_domain": ";cs.cmu.edu;;harvard.edu", "position": ";PhD student;;Undergrad student", "bibtex": "@misc{\nbarkin2024safhe,\ntitle={{SAFHE}: Defending Against Backdoor and Gradient Inversion Attacks in Federated Learning},\nauthor={Jordan Barkin and Ratip Emin Berker and S{\\'\\i}lvia Casacuberta and Janet Li},\nyear={2024},\nurl={https://openreview.net/forum?id=BOm1RYdHHu}\n}", "github": "", "project": "", "reviewers": "wYb4;uyJ6;cV7D", "site": "https://openreview.net/forum?id=BOm1RYdHHu", "pdf_size": 922413, "rating": "1;5;6", "confidence": "5;5;2", "soundness": "1;2;3", "contribution": "1;2;3", "presentation": "2;3;3", "wc_summary": "88;48;70", "wc_strengths": "13;40;84", "wc_weaknesses": "528;29;62", "wc_questions": "340;8;138", "wc_review": "969;125;354", "wc_reply_reviewers": "680;101;71", "wc_reply_authors": "2094;778;1398", "reply_reviewers": "1;1;1", "reply_authors": "3;1;2", "rating_avg": [ 4.0, 2.160246899469287 ], "confidence_avg": [ 4.0, 1.4142135623730951 ], "soundness_avg": [ 2.0, 0.816496580927726 ], "contribution_avg": [ 2.0, 0.816496580927726 ], "presentation_avg": [ 2.6666666666666665, 0.4714045207910317 ], "wc_summary_avg": [ 68.66666666666667, 16.35712552851373 ], "wc_strengths_avg": [ 45.666666666666664, 
29.261275129806325 ], "wc_weaknesses_avg": [ 206.33333333333334, 227.85131604233104 ], "wc_questions_avg": [ 162.0, 136.59673007311218 ], "wc_review_avg": [ 482.6666666666667, 356.3709054092691 ], "wc_reply_reviewers_avg": [ 284.0, 280.28200084914477 ], "wc_reply_authors_avg": [ 1423.3333333333333, 537.5533048503706 ], "reply_reviewers_avg": [ 1.0, 0.0 ], "reply_authors_avg": [ 2.0, 0.816496580927726 ], "replies_avg": [ 12, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": -0.6546536707079772, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:WGcafUPoGVUJ:scholar.google.com/&scioq=SAFHE:+Defending+Against+Backdoor+and+Gradient+Inversion+Attacks+in+Federated+Learning&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;1", "aff_unique_norm": "Carnegie Mellon University;Harvard University", "aff_unique_dep": ";", "aff_unique_url": "https://www.cmu.edu;https://www.harvard.edu", "aff_unique_abbr": "CMU;Harvard", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "United States" }, { "title": "Demystifying Poisoning Backdoor Attacks from a Statistical Perspective", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19218", "id": "BPHcEpGvF8", "author_site": "Ganghua Wang, Xun Xian, Ashish Kundu, Jayanth Srinivasa, Xuan Bi, Mingyi Hong, Jie Ding", "tldr": "", "abstract": "Backdoor attacks pose a significant security risk to machine learning applications due to their stealthy nature and potentially serious consequences. Such attacks involve embedding triggers within a learning model with the intention of causing malicious behavior when an active trigger is present while maintaining regular functionality without it. This paper derives a fundamental understanding of backdoor attacks that applies to both discriminative and generative models, including diffusion models and large language models. We evaluate the effectiveness of any backdoor attack incorporating a constant trigger, by establishing tight lower and upper boundaries for the performance of the compromised model on both clean and backdoor test data. The developed theory answers a series of fundamental but previously underexplored problems, including (1) what are the determining factors for a backdoor attack's success, (2) what is the direction of the most effective backdoor attack, and (3) when will a human-imperceptible trigger succeed. We demonstrate the theory by conducting experiments using benchmark datasets and state-of-the-art backdoor attack scenarios. 
Our code is available \\href{https://github.com/KeyWgh/DemystifyBackdoor}{here}.", "keywords": "backdoor attack;machine learning safety;asymptotic;statistical risk", "primary_area": "societal considerations including fairness, safety, privacy", "supplementary_material": "/attachment/d1d4f7b70b114eb7ce8739d1ff6e5ea4fa6435a9.zip", "author": "Ganghua Wang;Xun Xian;Ashish Kundu;Jayanth Srinivasa;Xuan Bi;Mingyi Hong;Jie Ding", "authorids": "~Ganghua_Wang1;~Xun_Xian1;~Ashish_Kundu1;~Jayanth_Srinivasa1;~Xuan_Bi1;~Mingyi_Hong1;~Jie_Ding2", "gender": "M;M;;M;;M;M", "homepage": "https://gwang.umn.edu;https://jeremyxianx.github.io/;;;;http://people.ece.umn.edu/~mhong/mingyi.html;http://jding.org", "dblp": "200/9632;262/3278;;285/5006;;57/8053;94/1825-2", "google_scholar": ";https://scholar.google.com/citations?hl=en;;HtNfeKYAAAAJ;F3eRk9MAAAAJ;qRnP-p0AAAAJ;ZyqvoqcAAAAJ", "orcid": "0000-0002-0888-167X;;;;;;", "linkedin": ";;;;;;", "or_profile": "~Ganghua_Wang1;~Xun_Xian1;~Ashish_Kundu1;~Jayanth_Srinivasa1;~Xuan_Bi1;~Mingyi_Hong1;~Jie_Ding2", "aff": "University of Minnesota, Minneapolis;University of Minnesota, Minneapolis;;Cisco;University of Minnesota - Twin Cities;University of Minnesota, Minneapolis;University of Minnesota - Twin Cities", "aff_domain": "umn.edu;umn.edu;;cisco.com;umn.edu;umn.edu;umn.edu", "position": "PhD student;PhD student;;Researcher;Assistant Professor;Associate Professor;Associate Professor", "bibtex": "@inproceedings{\nwang2024demystifying,\ntitle={Demystifying Poisoning Backdoor Attacks from a Statistical Perspective},\nauthor={Ganghua Wang and Xun Xian and Ashish Kundu and Jayanth Srinivasa and Xuan Bi and Mingyi Hong and Jie Ding},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=BPHcEpGvF8}\n}", "github": "", "project": "", "reviewers": "DhoY;76rk;DvbB;bWko", "pdf_size": 1750496, "rating": "3;6;6;8", "confidence": "5;3;3;4", "soundness": "2;3;3;3", "contribution": "1;2;3;4", "presentation": "2;3;2;3", "wc_summary": "137;95;118;48", "wc_strengths": "20;33;76;63", "wc_weaknesses": "184;155;253;118", "wc_questions": "6;3;1;15", "wc_review": "347;286;448;244", "wc_reply_reviewers": "745;42;65;0", "wc_reply_authors": "1596;806;836;421", "reply_reviewers": "3;1;1;0", "reply_authors": "4;3;3;2", "rating_avg": [ 5.75, 1.7853571071357126 ], "confidence_avg": [ 3.75, 0.82915619758885 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.5, 1.118033988749895 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 99.5, 33.24530041975858 ], "wc_strengths_avg": [ 48.0, 22.4610774452162 ], "wc_weaknesses_avg": [ 177.5, 49.46968768852296 ], "wc_questions_avg": [ 6.25, 5.356071321407137 ], "wc_review_avg": [ 331.25, 76.71171683647812 ], "wc_reply_reviewers_avg": [ 213.0, 308.03327742307323 ], "wc_reply_authors_avg": [ 914.75, 426.0043280296575 ], "reply_reviewers_avg": [ 1.25, 1.0897247358851685 ], "reply_authors_avg": [ 3.0, 0.7071067811865476 ], "replies_avg": [ 23, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.5488604301969737, "gs_citation": 6, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=2162895515699683008&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 6, "openreview": "https://openreview.net/forum?id=BPHcEpGvF8", "pdf": "https://openreview.net/pdf?id=BPHcEpGvF8", "email": "umn.edu;umn.edu;;cisco.com;umn.edu;umn.edu;umn.edu", "author_num": 7, "aff_unique_index": "0;0;1;0;0;0", "aff_unique_norm": "University of Minnesota;Cisco Systems", 
"aff_unique_dep": ";", "aff_unique_url": "https://www.minnesota.edu;https://www.cisco.com", "aff_unique_abbr": "UMN;Cisco", "aff_campus_unique_index": "0;0;2;0;2", "aff_campus_unique": "Minneapolis;;Twin Cities", "aff_country_unique_index": "0;0;0;0;0;0", "aff_country_unique": "United States" }, { "title": "FreeReg: Image-to-Point Cloud Registration Leveraging Pretrained Diffusion Models and Monocular Depth Estimators", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19217", "id": "BPb5AhT2Vf", "author_site": "Haiping Wang, Yuan Liu, Bing WANG, YUJING SUN, Zhen Dong, Wenping Wang, Bisheng Yang", "tldr": "", "abstract": "Matching cross-modality features between images and point clouds is a fundamental problem for image-to-point cloud registration. However, due to the modality difference between images and points, it is difficult to learn robust and discriminative cross-modality features by existing metric learning methods for feature matching. Instead of applying metric learning on cross-modality data, we propose to unify the modality between images and point clouds by pretrained large-scale models first, and then establish robust correspondence within the same modality. We show that the intermediate features, called diffusion features, extracted by depth-to-image diffusion models are semantically consistent between images and point clouds, which enables the building of coarse but robust cross-modality correspondences. We further extract geometric features on depth maps produced by the monocular depth estimator. By matching such geometric features, we significantly improve the accuracy of the coarse correspondences produced by diffusion features. Extensive experiments demonstrate that without any task-specific training, direct utilization of both features produces accurate image-to-point cloud registration. On three public indoor and outdoor benchmarks, the proposed method averagely achieves a 20.6 percent improvement in Inlier Ratio, a $3.0\\times$ higher Inlier Number, and a 48.6 percent improvement in Registration Recall than existing state-of-the-arts. 
The code and additional results are available at \\url{https://whu-usi3dv.github.io/FreeReg/}.", "keywords": "Image-to-point cloud registration;cross-modality feature extraction;diffusion models", "primary_area": "visualization or interpretation of learned representations", "supplementary_material": "", "author": "Haiping Wang;Yuan Liu;Bing WANG;YUJING SUN;Zhen Dong;Wenping Wang;Bisheng Yang", "authorids": "~Haiping_Wang1;~Yuan_Liu3;~Bing_WANG8;~YUJING_SUN2;~Zhen_Dong4;~Wenping_Wang1;~Bisheng_Yang1", "gender": "M;M;M;;M;M;M", "homepage": "https://hpwang-whu.github.io/;https://liuyuan-pal.github.io/;http://www.cs.ox.ac.uk/people/bing.wang/;https://yujingsun.github.io/;https://dongzhenwhu.github.io/index.html;https://engineering.tamu.edu/cse/profiles/Wang-Wenping.html;", "dblp": ";87/2948-25;06/1909-13;64/8656-1;;;", "google_scholar": "https://scholar.google.com.hk/citations?user=YAdDCr0AAAAJ;yRAHVcgAAAAJ;W7QhPeUAAAAJ;https://scholar.google.com.hk/citations?user=AC9Ky6AAAAAJ;https://scholar.google.com/citations?hl=zh-CN;28shvv0AAAAJ;TJkm8igAAAAJ", "orcid": ";;0000-0003-0977-0426;0000-0003-0819-296X;;0000-0002-2284-3952;", "linkedin": ";;;;;;", "or_profile": "~Haiping_Wang1;~Yuan_Liu3;~Bing_WANG8;~YUJING_SUN2;~Zhen_Dong4;~Wenping_Wang1;~Bisheng_Yang1", "aff": "Wuhan University;The University of Hong Kong;Hong Kong Polytechnic University;the University of Hong Kong, University of Hong Kong;Wuhan University;Texas A&M University - College Station;Wuhan University", "aff_domain": "whu.edu.cn;hku.hk;polyu.edu.hk;cs.hku.hk;whu.edu;tamu.edu;whu.edu.cn", "position": "PhD student;PhD student;Assistant Professor;Research Assistant Professor;Full Professor;Full Professor;Full Professor", "bibtex": "@inproceedings{\nwang2024freereg,\ntitle={FreeReg: Image-to-Point Cloud Registration Leveraging Pretrained Diffusion Models and Monocular Depth Estimators},\nauthor={Haiping Wang and Yuan Liu and Bing WANG and YUJING SUN and Zhen Dong and Wenping Wang and Bisheng Yang},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=BPb5AhT2Vf}\n}", "github": "", "project": "", "reviewers": "fhKS;BaLi;zNJ2", "pdf_size": 21920377, "rating": "6;6;8", "confidence": "3;4;2", "soundness": "2;2;3", "contribution": "3;2;3", "presentation": "3;3;3", "wc_summary": "24;88;127", "wc_strengths": "24;55;60", "wc_weaknesses": "220;89;92", "wc_questions": "4;27;102", "wc_review": "272;259;381", "wc_reply_reviewers": "213;0;18", "wc_reply_authors": "1352;428;724", "reply_reviewers": "2;0;1", "reply_authors": "4;1;2", "rating_avg": [ 6.666666666666667, 0.9428090415820634 ], "confidence_avg": [ 3.0, 0.816496580927726 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 3.0, 0.0 ], "wc_summary_avg": [ 79.66666666666667, 42.460439103816256 ], "wc_strengths_avg": [ 46.333333333333336, 15.923427883328248 ], "wc_weaknesses_avg": [ 133.66666666666666, 61.05916984550496 ], "wc_questions_avg": [ 44.333333333333336, 41.84362423223984 ], "wc_review_avg": [ 304.0, 54.705270922157645 ], "wc_reply_reviewers_avg": [ 77.0, 96.44687656943589 ], "wc_reply_authors_avg": [ 834.6666666666666, 385.2525866954764 ], "reply_reviewers_avg": [ 1.0, 0.816496580927726 ], "reply_authors_avg": [ 2.3333333333333335, 1.247219128924647 ], "replies_avg": [ 16, 0 ], "authors#_avg": [ 7, 0 ], "corr_rating_confidence": -0.8660254037844385, "gs_citation": 10, "gs_cited_by_link": 
"https://scholar.google.com/scholar?cites=11736741740449634379&as_sdt=40005&sciodt=0,10&hl=en", "gs_version_total": 3, "openreview": "https://openreview.net/forum?id=BPb5AhT2Vf", "pdf": "https://openreview.net/pdf?id=BPb5AhT2Vf", "email": "whu.edu.cn;hku.hk;polyu.edu.hk;cs.hku.hk;whu.edu;tamu.edu;whu.edu.cn", "author_num": 7, "aff_unique_index": "0;1;2;1;0;3;0", "aff_unique_norm": "Wuhan University;University of Hong Kong;Hong Kong Polytechnic University;Texas A&M University", "aff_unique_dep": ";;;", "aff_unique_url": "http://www.whu.edu.cn/;https://www.hku.hk;https://www.polyu.edu.hk;https://www.tamu.edu", "aff_unique_abbr": "WHU;HKU;PolyU;TAMU", "aff_campus_unique_index": "1;1;1;2", "aff_campus_unique": ";Hong Kong SAR;College Station", "aff_country_unique_index": "0;0;0;0;0;1;0", "aff_country_unique": "China;United States" }, { "id": "BPdagk1mV7", "title": "Implicit Semi-auto-regressive Image-to-Video Diffusion", "track": "main", "status": "Reject", "tldr": "", "abstract": "Diffusion models have demonstrated exceptional performance in various generative domains, particularly in the context of image and video generation. Despite their remarkable success, image-to-video (I2V) generation still remains a formidable challenge for most existing methods. Prior research has primarily concentrated on temporally modeling the entire video sequence, resulting in semantic correspondence but often lacking consistency with the initial image input in detail. In this paper, we present a novel temporal recurrent look-back approach for modeling video dynamics, leveraging prior information from the first frame (provided as a given image) as an implicit semi-auto-regressive process. Conditioned solely on preceding frames, our approach achieves enhanced consistency with the initial frame, thus avoiding unexpected generation results. Furthermore, we introduce a hybrid input initialization strategy to enhance the propagation of information within the look-back module. 
Our extensive experiments demonstrate that our approach is able to generate video clips with greater detail consistency relative to the provided image.", "keywords": "video generation;diffusion model", "primary_area": "generative models", "supplementary_material": "/attachment/7ac911870a6944b6c3b08f1335f53fcfee3a2407.zip", "author": "Tianyi Li;Kai Wang;Ziheng Qin;David Junhao Zhang;Tianle Zhang;Junbo Zhao;Mike Zheng Shou;Yang You", "authorids": "~Tianyi_Li5;~Kai_Wang8;~Ziheng_Qin1;~David_Junhao_Zhang1;~Tianle_Zhang4;~Junbo_Zhao1;~Mike_Zheng_Shou1;~Yang_You1", "gender": "M;M;M;M;M;M;M;", "homepage": "https://scholar.google.com/citations?user=pHXKrL0AAAAJ;https://kaiwang960112.github.io/;;;http://jakezhao.net/;https://www.comp.nus.edu.sg/~youy/;https://scholar.google.com/citations?user=6dCcnNEAAAAJ&hl=en;http://www.columbia.edu/~zs2262/", "dblp": ";78/2022-36;342/2679;;191/6665;33/8167-1.html;307/3295;284/0807", "google_scholar": ";i2II0XIAAAAJ;I04VhPMAAAAJ;;8ipao8MAAAAJ;jF4dPZwAAAAJ;6dCcnNEAAAAJ;h1-3lSoAAAAJ", "orcid": ";0000-0002-1154-5175;0009-0001-8571-1228;0000-0003-1502-9730;;;;", "linkedin": ";;ziheng-qin-635551184/;;;yang-you-0b92914b/;;", "or_profile": "~Tianyi_Li5;~Kai_Wang8;~Ziheng_Qin1;~Tianle_Zhang4;~Junbo_Zhao1;~Yang_You1;~Junhao_Zhang1;~Zheng_Shou1", "aff": "Zhejiang University;National University of Singapore;ByteDance Inc.;University of Electronic Science and Technology of China;Zhejiang University;National University of Singapore;National University of Singapore;National University of Singapore", "aff_domain": "zju.edu.cn;u.nus.edu;bytedance.com;cn.edu;zju.edu.cn;nus.edu.sg;nus.edu;nus.edu.sg", "position": "Undergrad student;PhD student;Intern;Undergrad student;Assistant Professor;Professor;PhD student;Assistant Professor", "bibtex": "@misc{\nli2024implicit,\ntitle={Implicit Semi-auto-regressive Image-to-Video Diffusion},\nauthor={Tianyi Li and Kai Wang and Ziheng Qin and David Junhao Zhang and Tianle Zhang and Junbo Zhao and Mike Zheng Shou and Yang You},\nyear={2024},\nurl={https://openreview.net/forum?id=BPdagk1mV7}\n}", "github": "", "project": "", "reviewers": "sTJV;hgs2;PWSR;7B9z", "site": "https://openreview.net/forum?id=BPdagk1mV7", "pdf_size": 3654334, "rating": "3;5;5;5", "confidence": "5;4;4;3", "soundness": "1;2;3;2", "contribution": "2;2;2;2", "presentation": "2;3;2;3", "wc_summary": "83;59;110;66", "wc_strengths": "30;6;69;75", "wc_weaknesses": "138;175;431;124", "wc_questions": "7;27;10;89", "wc_review": "258;267;620;354", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.5, 0.8660254037844386 ], "confidence_avg": [ 4.0, 0.7071067811865476 ], "soundness_avg": [ 2.0, 0.7071067811865476 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.5, 0.5 ], "wc_summary_avg": [ 79.5, 19.653244007033546 ], "wc_strengths_avg": [ 45.0, 28.38133189263675 ], "wc_weaknesses_avg": [ 217.0, 124.949989995998 ], "wc_questions_avg": [ 33.25, 33.07850510527947 ], "wc_review_avg": [ 374.75, 146.47418714572203 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 6, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": -0.816496580927726, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:ElPuD3lKsgEJ:scholar.google.com/&scioq=Implicit+Semi-auto-regressive+Image-to-Video+Diffusion&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": 
"0;1;2;3;0;1;1;1", "aff_unique_norm": "Zhejiang University;National University of Singapore;ByteDance;University of Electronic Science and Technology of China", "aff_unique_dep": ";;;", "aff_unique_url": "https://www.zju.edu.cn;https://www.nus.edu.sg;https://www.bytedance.com;https://www.uestc.edu.cn", "aff_unique_abbr": "ZJU;NUS;ByteDance;UESTC", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;0;0;0;1;1;1", "aff_country_unique": "China;Singapore" }, { "id": "BQvbL2sFQx", "title": "Model-Agnostic Shift-Equivariant Downsampling", "track": "main", "status": "Reject", "tldr": "", "abstract": "The performance of convolutional neural networks (CNNs) are thought to be insensitive to image shifts. However, recent studies have revealed that downsampling layers in CNNs result in inconsistent outputs for shifted input images. In this\nstudy, we present an approach for performing downsampling that ensures absolute shift equivariance. By employing model-agnostic downsampling method that leverages origin selection functions obtained from coordinate-independent statistics of the feature map, we can achieve perfect shift equivariance, while still adhering to the conventional downsampling procedures. Our method allows CNNs to exhibit both improved accuracy and perfect shift invariance for image classification, while also achieving shift equivariance in semantic segmentation benchmarks. Furthermore, we introduce a methodology for achieving shift equivariance without the need for any additional training process. This is accomplished by transferring pretrained weights and replacing existing layers with shift-equivariant\ncounterparts. Additionaly, we show that fine-tuning of the modified CNNs leads superior performance compared to previously proposed models.", "keywords": "Shift equivariance;Shift invariance;Downsampling;Convolutional neural networks", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "", "author": "Myungjoon Kim;Arthur Baucour;Jonghwa Shin", "authorids": "~Myungjoon_Kim1;~Arthur_Baucour1;~Jonghwa_Shin1", "gender": "M;M;M", "homepage": "https://github.com/myungjoon;;https://apmd.kaist.ac.kr", "dblp": ";;", "google_scholar": "https://scholar.google.co.kr/citations?user=dEDl6yQAAAAJ;HQLRKVkAAAAJ;O_qshZoAAAAJ", "orcid": ";0000-0002-8251-5504;0000-0003-0712-464X", "linkedin": ";arthur-baucour/?locale=en_US;", "or_profile": "~Myungjoon_Kim1;~Arthur_Baucour1;~Jonghwa_Shin1", "aff": "Korea Advanced Institute of Science & Technology;;Korea Advanced Institute of Science & Technology", "aff_domain": "kaist.ac.kr;;kaist.ac.kr", "position": "Postdoc;;Associate Professor", "bibtex": "@misc{\nkim2024modelagnostic,\ntitle={Model-Agnostic Shift-Equivariant Downsampling},\nauthor={Myungjoon Kim and Arthur Baucour and Jonghwa Shin},\nyear={2024},\nurl={https://openreview.net/forum?id=BQvbL2sFQx}\n}", "github": "", "project": "", "reviewers": "1mgo;pcfU;1rzF;QNhG;gzfx", "site": "https://openreview.net/forum?id=BQvbL2sFQx", "pdf_size": 1113970, "rating": "3;3;3;6;8", "confidence": "4;4;4;4;4", "soundness": "2;3;2;4;4", "contribution": "2;3;2;3;3", "presentation": "1;3;2;3;2", "wc_summary": "78;48;15;73;63", "wc_strengths": "52;31;59;63;28", "wc_weaknesses": "527;64;463;302;92", "wc_questions": "10;124;29;42;45", "wc_review": "667;267;566;480;228", "wc_reply_reviewers": "20;0;0;0;0", "wc_reply_authors": "0;0;0;0;0", "reply_reviewers": "1;0;0;0;0", "reply_authors": "0;0;0;0;0", "rating_avg": [ 
4.6, 2.0591260281974 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 3.0, 0.8944271909999159 ], "contribution_avg": [ 2.6, 0.4898979485566356 ], "presentation_avg": [ 2.2, 0.7483314773547882 ], "wc_summary_avg": [ 55.4, 22.650386310171402 ], "wc_strengths_avg": [ 46.6, 14.430523206037957 ], "wc_weaknesses_avg": [ 289.6, 187.89422556321418 ], "wc_questions_avg": [ 50.0, 39.00256401827962 ], "wc_review_avg": [ 441.6, 169.62617722509697 ], "wc_reply_reviewers_avg": [ 4.0, 8.0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0.2, 0.4000000000000001 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 8, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:V2OEY6K8ONgJ:scholar.google.com/&scioq=Model-Agnostic+Shift-Equivariant+Downsampling&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "Korea Advanced Institute of Science and Technology", "aff_unique_dep": "", "aff_unique_url": "https://www.kaist.ac.kr", "aff_unique_abbr": "KAIST", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "South Korea" }, { "id": "BRO4PfCiwb", "title": "OS-net: Orbitally Stable Neural Networks", "track": "main", "status": "Reject", "tldr": "", "abstract": "We introduce OS-net (Orbitally Stable neural NETworks), a new family of neural network architectures specifically designed for periodic dynamical data. OS-net is a special case of Neural Ordinary Differential Equations (NODEs) and takes fully advantage of the adjoint method based backpropagation method. Utilizing ODE theory, we derive conditions on the network weights to ensure stability of the resulting dynamics. We demonstrate the efficacy of our approach by applying OS-net to discover the dynamics underlying the R\\\"{o}ssler and Sprott's systems, two dynamical systems known for their period doubling attractors and chaotic behavior.", "keywords": "neural networks;dynamical systems;chaotic systems;periodic attractor;stable attractors", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/d4e728fe850257d5cf3e0cfdecc4d512a9f6bd73.pdf", "author": "Marieme Ngom;Carlo Graziani", "authorids": "~Marieme_Ngom1;~Carlo_Graziani1", "gender": ";M", "homepage": ";https://www.anl.gov/profile/carlo-j-graziani", "dblp": ";", "google_scholar": ";V6g20IgAAAAJ", "orcid": ";", "linkedin": ";", "or_profile": "~Marieme_Ngom1;~Carlo_Graziani1", "aff": ";Argonne National Laboratory", "aff_domain": ";anl.gov", "position": ";Researcher", "bibtex": "@misc{\nngom2024osnet,\ntitle={{OS}-net: Orbitally Stable Neural Networks},\nauthor={Marieme Ngom and Carlo Graziani},\nyear={2024},\nurl={https://openreview.net/forum?id=BRO4PfCiwb}\n}", "github": "", "project": "", "reviewers": "Yjdz;xpia;2Hj6;YZQH", "site": "https://openreview.net/forum?id=BRO4PfCiwb", "pdf_size": 8640581, "rating": "3;3;3;5", "confidence": "2;2;4;2", "soundness": "2;2;2;2", "contribution": "2;2;2;3", "presentation": "1;2;1;2", "wc_summary": "34;42;71;103", "wc_strengths": "9;15;48;37", "wc_weaknesses": "403;247;342;83", "wc_questions": "2;5;136;17", "wc_review": "448;309;597;240", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 3.5, 0.8660254037844386 ], "confidence_avg": [ 2.5, 0.8660254037844386 ], "soundness_avg": [ 2.0, 0.0 ], 
"contribution_avg": [ 2.25, 0.4330127018922193 ], "presentation_avg": [ 1.5, 0.5 ], "wc_summary_avg": [ 62.5, 27.13392710243027 ], "wc_strengths_avg": [ 27.25, 15.880412463157246 ], "wc_weaknesses_avg": [ 268.75, 120.79398784707789 ], "wc_questions_avg": [ 40.0, 55.70906568952669 ], "wc_review_avg": [ 398.5, 136.91694562763223 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 6, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": -0.3333333333333333, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:ferq88qgI6cJ:scholar.google.com/&scioq=OS-net:+Orbitally+Stable+Neural+Networks&hl=en&as_sdt=0,5", "gs_version_total": 3, "aff_unique_index": "0", "aff_unique_norm": "Argonne National Laboratory", "aff_unique_dep": "", "aff_unique_url": "https://www.anl.gov", "aff_unique_abbr": "ANL", "aff_country_unique_index": "0", "aff_country_unique": "United States" }, { "id": "BRTyPCq4wL", "title": "Cascaded Contrastive Medical Language-Image Pretraining on Radiology Images", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Due to the concise design and the wonderful generalization performance, contrastive language-image pre-training (CLIP) has been investigated in the medical domain for medical image understanding. However, few studies have been done on CLIP for multilevel medical information alignment. In this paper, we proposed cascaded CLIP (casCLIP) where contrastive alignment is performed on multilevel information. In addition, we propose aligning the report with the entire image series and employ a multi-layer transformer to integrate the image embeddings from a study into a single embedding of image series. Moreover, we introduce support alignment opposition de-alignment method to enhance higher-level alignment. In this study, casCLIP was pre-trained on a dataset of chest X-ray images with reports and the high level disease information extracted from the reports. 
Experimental results on multiple public benchmarks demonstrate the effectiveness of our model for zero-shot classification.", "keywords": "Contrastive learning; medical imaging; multi-modality; clinical language model", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/d2b0dd4a9473a5369c5c84545cbb79023a43fdca.zip", "author": "Chengsheng Mao;Hanyin Wang;Yuan Luo", "authorids": "~Chengsheng_Mao1;~Hanyin_Wang1;~Yuan_Luo3", "gender": "M;F;M", "homepage": ";;https://www.feinberg.northwestern.edu/faculty-profiles/az/profile.html?xid=33821", "dblp": ";;90/6959-4", "google_scholar": "https://scholar.google.com/citations?hl=en;YfIObrUAAAAJ;txsHQx4AAAAJ", "orcid": ";0000-0001-9884-9683;", "linkedin": ";hanyinwang2022/;yuan-luo-16797137/", "or_profile": "~Chengsheng_Mao1;~Hanyin_Wang1;~Yuan_Luo3", "aff": "Northwestern University;Northwestern University, Northwestern University;Northwestern University", "aff_domain": "northwestern.edu;u.northwestern.edu;northwestern.edu", "position": "Assistant Professor;PhD student;Full Professor", "bibtex": "@misc{\nmao2024cascaded,\ntitle={Cascaded Contrastive Medical Language-Image Pretraining on Radiology Images},\nauthor={Chengsheng Mao and Hanyin Wang and Yuan Luo},\nyear={2024},\nurl={https://openreview.net/forum?id=BRTyPCq4wL}\n}", "github": "", "project": "", "reviewers": "V3gc;WmZb;6KtK;cZSY", "site": "https://openreview.net/forum?id=BRTyPCq4wL", "pdf_size": 789886, "rating": "3;3;5;5", "confidence": "3;4;4;4", "soundness": "2;1;2;2", "contribution": "2;1;2;3", "presentation": "3;1;3;2", "wc_summary": "130;49;75;86", "wc_strengths": "87;22;77;90", "wc_weaknesses": "193;400;682;276", "wc_questions": "27;2;169;89", "wc_review": "437;473;1003;541", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 1.75, 0.4330127018922193 ], "contribution_avg": [ 2.0, 0.7071067811865476 ], "presentation_avg": [ 2.25, 0.82915619758885 ], "wc_summary_avg": [ 85.0, 29.248931604419333 ], "wc_strengths_avg": [ 69.0, 27.55902755904134 ], "wc_weaknesses_avg": [ 387.75, 185.16799804501858 ], "wc_questions_avg": [ 71.75, 64.46462208064203 ], "wc_review_avg": [ 613.5, 227.9577811788841 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.5773502691896257, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:t3x3WoH87FAJ:scholar.google.com/&scioq=Cascaded+Contrastive+Medical+Language-Image+Pretraining+on+Radiology+Images&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;0;0", "aff_unique_norm": "Northwestern University", "aff_unique_dep": "", "aff_unique_url": "https://www.northwestern.edu", "aff_unique_abbr": "NU", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "title": "DAFA: Distance-Aware Fair Adversarial Training", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19216", "id": "BRdEBlwUW6", "author_site": "Hyungyu Lee, Saehyung Lee, Hyemi Jang, Junsung Park, Ho Bae, Sungroh Yoon", "tldr": "", "abstract": "The disparity in accuracy between classes in standard training is amplified during adversarial 
training, a phenomenon termed the robust fairness problem. Existing methodologies aimed to enhance robust fairness by sacrificing the model's performance on easier classes in order to improve its performance on harder ones. However, we observe that under adversarial attacks, the majority of the model's predictions for samples from the worst class are biased towards classes similar to the worst class, rather than towards the easy classes. Through theoretical and empirical analysis, we demonstrate that robust fairness deteriorates as the distance between classes decreases. Motivated by these insights, we introduce the Distance-Aware Fair Adversarial Training (DAFA) methodology, which addresses robust fairness by taking into account the similarities between classes. Specifically, our method assigns distinct adversarial margins and loss weights to each class and adjusts them to encourage a trade-off in robustness among similar classes. Experimental results across various datasets demonstrate that our method not only maintains average robust accuracy but also significantly improves the worst robust accuracy, indicating a marked improvement in robust fairness compared to existing methods.", "keywords": "adversarial robustness;robust fairness;adversarial examples;adversarial training", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "", "author": "Hyungyu Lee;Saehyung Lee;Hyemi Jang;Junsung Park;Ho Bae;Sungroh Yoon", "authorids": "~Hyungyu_Lee1;~Saehyung_Lee1;~Hyemi_Jang1;~Junsung_Park1;~Ho_Bae1;~Sungroh_Yoon1", "gender": "M;;M;M;;M", "homepage": ";http://data.snu.ac.kr;http://data.snu.ac.kr/;https://www.spai.co.kr;http://ailab.snu.ac.kr;https://snu.ac.kr", "dblp": "260/0442;224/0270;;199/1782;99/1474;", "google_scholar": "nS24h74AAAAJ;;;https://scholar.google.com/citations?hl=en;Bphl_fIAAAAJ;", "orcid": ";0000-0002-7736-0528;;0000-0002-5238-3547;0000-0002-2367-197X;", "linkedin": ";;;;;", "or_profile": "~Saehyung_Lee1;~Hyemi_Jang1;~Junsung_Park1;~Ho_Bae1;~Sungroh_Yoon1;~Hyungyu_Lee2", "aff": "Adobe Systems;Seoul National University;Seoul National University;Ewha Womans University;Seoul National University;Seoul National University", "aff_domain": "adobe.com;snu.ac.kr;snu.ac.kr;ewha.ac.kr;snu.ac.kr;snu.ac.kr", "position": "Intern;PhD student;PhD student;Assistant Professor;Full Professor;PhD student", "bibtex": "@inproceedings{\nlee2024dafa,\ntitle={{DAFA}: Distance-Aware Fair Adversarial Training},\nauthor={Hyungyu Lee and Saehyung Lee and Hyemi Jang and Junsung Park and Ho Bae and Sungroh Yoon},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=BRdEBlwUW6}\n}", "github": "", "project": "", "reviewers": "nK3C;Wxgz;n9NT;73vn", "pdf_size": 3202744, "rating": "5;6;6;8", "confidence": "3;4;4;4", "soundness": "2;3;3;3", "contribution": "2;3;3;3", "presentation": "2;3;3;3", "wc_summary": "193;120;107;50", "wc_strengths": "30;12;75;93", "wc_weaknesses": "74;45;97;455", "wc_questions": "92;2;68;56", "wc_review": "389;179;347;654", "wc_reply_reviewers": "0;0;81;125", "wc_reply_authors": "1824;1448;2026;3162", "reply_reviewers": "0;0;1;2", "reply_authors": "3;3;4;6", "rating_avg": [ 6.25, 1.0897247358851685 ], "confidence_avg": [ 3.75, 0.4330127018922193 ], "soundness_avg": [ 2.75, 0.4330127018922193 ], "contribution_avg": [ 2.75, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 117.5, 
50.92396292512986 ], "wc_strengths_avg": [ 52.5, 32.76049450176233 ], "wc_weaknesses_avg": [ 167.75, 166.86427868180775 ], "wc_questions_avg": [ 54.5, 32.96589146375386 ], "wc_review_avg": [ 392.25, 170.3281758840856 ], "wc_reply_reviewers_avg": [ 51.5, 53.79823417176441 ], "wc_reply_authors_avg": [ 2115.0, 639.0813719707373 ], "reply_reviewers_avg": [ 0.75, 0.82915619758885 ], "reply_authors_avg": [ 4.0, 1.224744871391589 ], "replies_avg": [ 25, 0 ], "authors#_avg": [ 6, 0 ], "corr_rating_confidence": 0.6622661785325219, "gs_citation": 8, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=17394704892862092861&as_sdt=5,33&sciodt=0,33&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=BRdEBlwUW6", "pdf": "https://openreview.net/pdf?id=BRdEBlwUW6", "email": "adobe.com;snu.ac.kr;snu.ac.kr;ewha.ac.kr;snu.ac.kr;snu.ac.kr", "author_num": 6, "aff_unique_index": "0;1;1;2;1;1", "aff_unique_norm": "Adobe;Seoul National University;Ewha Womans University", "aff_unique_dep": "Adobe Systems Incorporated;;", "aff_unique_url": "https://www.adobe.com;https://www.snu.ac.kr;http://www.ewha.ac.kr", "aff_unique_abbr": "Adobe;SNU;Ewha", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;1;1;1;1;1", "aff_country_unique": "United States;South Korea" }, { "id": "BRoBig6ov1", "title": "High-Order Tensor Recovery with A Tensor $U_1$ Norm", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Recently, numerous tensor SVD (t-SVD)-based tensor recovery methods have emerged, showing promise in processing visual data. However, these methods often suffer from performance degradation when confronted with high-order tensor data exhibiting non-smooth changes (possibly caused by random slice permutation), commonly observed in real-world scenarios but ignored by the traditional t-SVD-based methods. Our objective in this study is to provide an effective tensor recovery technique for handling non-smooth changes in tensor data and efficiently exploring the correlations of high-order tensor data across its various dimensions. To this end, we introduce a new tensor decomposition and a new tensor norm called the Tensor U1 norm. An optimization algorithm is proposed to solve the resulting tensor completion model iteratively by combining the proximal algorithm with the Alternating Direction Method of Multipliers. Theoretical analysis showed the convergence of the algorithm to the Karush\u2013Kuhn\u2013Tucker (KKT) point of the optimization problem. Numerical experiments demonstrated the effectiveness of the proposed method in high-order tensor completion, especially for tensor data with non-smooth changes. 
This study fills a critical gap in the t-SVD-based tensor recovery by providing a practical and effective solution that enables the exploration of correlations in high-order tensor data across its different dimensions, even in the presence of non-smooth changes.", "keywords": "Tensor SVD; High Order Tensor Recovery; Tensor Completion", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "/attachment/d3e668c152a215584fe8a3bd3cd6287c65eff290.pdf", "author": "Jingjing Zheng;Wenzhe Wang;Xiaoqin Zhang;Yankai Cao;Xianta Jiang", "authorids": "~Jingjing_Zheng3;~Wenzhe_Wang2;~Xiaoqin_Zhang4;~Yankai_Cao1;~Xianta_Jiang2", "gender": "F;M;;M;", "homepage": "https://jzheng20.github.io/;;;https://optimal.chbe.ubc.ca;", "dblp": ";;;155/9335;", "google_scholar": "https://scholar.google.com/citations?hl=en;https://scholar.google.com/citations?view_op=list_works;;M-s3mjAAAAAJ;", "orcid": "0000-0003-1955-5308;;;0000-0001-9014-2552;", "linkedin": "jingjing-zheng-978303263/?originalSubdomain=ca;;;;", "or_profile": "~Jingjing_Zheng3;~Wenzhe_Wang2;~Xiaoqin_Zhang4;~Yankai_Cao1;~Xianta_Jiang2", "aff": "The University of British Columbia;;;University of British Columbia;", "aff_domain": "math.ubc.ca;;;ubc.ca;", "position": "PhD student;;;Associate Professor;", "bibtex": "@misc{\nanonymous2024highorder,\ntitle={High-Order Tensor Recovery with A Tensor \\$U\\_1\\$ Norm},\nauthor={Anonymous},\nyear={2024},\nurl={https://openreview.net/forum?id=BRoBig6ov1}\n}", "github": "", "project": "", "reviewers": "Yoac;w1M5;1gNF", "site": "https://openreview.net/forum?id=BRoBig6ov1", "pdf_size": 448595, "rating": "3;5;5", "confidence": "4;3;4", "soundness": "2;2;3", "contribution": "1;2;2", "presentation": "2;2;2", "wc_summary": "125;93;59", "wc_strengths": "132;44;24", "wc_weaknesses": "278;193;193", "wc_questions": "107;135;45", "wc_review": "642;465;321", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "770;779;598", "reply_reviewers": "0;0;0", "reply_authors": "2;2;1", "rating_avg": [ 4.333333333333333, 0.9428090415820634 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 1.6666666666666667, 0.4714045207910317 ], "presentation_avg": [ 2.0, 0.0 ], "wc_summary_avg": [ 92.33333333333333, 26.948510575210314 ], "wc_strengths_avg": [ 66.66666666666667, 46.91363222869115 ], "wc_weaknesses_avg": [ 221.33333333333334, 40.069384267237695 ], "wc_questions_avg": [ 95.66666666666667, 37.60614606978788 ], "wc_review_avg": [ 476.0, 131.27833027579229 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 715.6666666666666, 83.28398538868215 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 1.6666666666666667, 0.4714045207910317 ], "replies_avg": [ 8, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.49999999999999983, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:9kQQ67QQUGAJ:scholar.google.com/&scioq=High-Order+Tensor+Recovery+with+A+Tensor+%24U_1%24+Norm&hl=en&as_sdt=0,5", "gs_version_total": 2, "aff_unique_index": "0;0", "aff_unique_norm": "University of British Columbia", "aff_unique_dep": "", "aff_unique_url": "https://www.ubc.ca", "aff_unique_abbr": "UBC", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "Canada" }, { "id": "BSePKWwTUj", "title": "Multiobjective Stochastic Linear Bandits under Lexicographic Ordering", "track": "main", "status": "Reject", "tldr": "", 
"abstract": "This paper studies the multiobjective stochastic linear bandit (MOSLB) model under lexicographic ordering, where the agent aims to simultaneously maximize $m$ objectives in a hierarchical manner. This model has various real-world scenarios, including water resource planning and radiation treatment for cancer patients. However, there is no effort on the general MOSLB model except a special case called multiobjective multi-armed bandits. Previous literature provided a suboptimal algorithm for this special case, which enjoys a regret bound of $\\widetilde{O}(T^{2/3})$ under a priority-based regret measure. In this paper, we propose an algorithm achieving the almost optimal regret bound $\\widetilde{O}(d\\sqrt{T})$ for the MOSLB model, and its metric is the general regret. Here, $d$ is the dimension of arm vector and $T$ is the time horizon. The major novelties of our algorithm include a new arm filter and a multiple trade-off approach for exploration and exploitation. Experiments confirm the merits of our algorithms and provide compelling evidence to support our analysis.", "keywords": "multiobjective;bandits;lexicographic ordering", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Bo Xue;Xi Lin;Xiaoyuan Zhang;Qingfu Zhang", "authorids": "~Bo_Xue1;~Xi_Lin2;~Xiaoyuan_Zhang2;~Qingfu_Zhang1", "gender": "M;M;M;M", "homepage": "https://xueb1996.github.io/;https://xi-l.github.io/;;https://www.cs.cityu.edu.hk/~qzhan7/index.html", "dblp": "122/2421-4;43/489-1;;98/1240.html", "google_scholar": "1D4gVmIAAAAJ;QB_MUboAAAAJ;KQj18L8AAAAJ;https://scholar.google.co.uk/citations?user=nhL9PHwAAAAJ", "orcid": "0000-0002-7295-4853;;0000-0002-3852-645X;", "linkedin": ";;;", "or_profile": "~Bo_Xue1;~Xi_Lin2;~Xiaoyuan_Zhang2;~Qingfu_Zhang1", "aff": "City University of Hong Kong;City University of Hong Kong;City University of Hong Kong;City University of Hong Kong", "aff_domain": "cityu.edu.hk;cityu.edu.hk;cityu.edu.hk;cityu.edu.hk", "position": "PhD student;Postdoc;PhD student;Full Professor", "bibtex": "@misc{\nxue2024multiobjective,\ntitle={Multiobjective Stochastic Linear Bandits under Lexicographic Ordering},\nauthor={Bo Xue and Xi Lin and Xiaoyuan Zhang and Qingfu Zhang},\nyear={2024},\nurl={https://openreview.net/forum?id=BSePKWwTUj}\n}", "github": "", "project": "", "reviewers": "1R9s;1nFM;vLB6;chLG", "site": "https://openreview.net/forum?id=BSePKWwTUj", "pdf_size": 442112, "rating": "3;3;5;5", "confidence": "4;4;3;3", "soundness": "1;2;3;3", "contribution": "2;2;2;2", "presentation": "2;2;3;4", "wc_summary": "95;63;69;76", "wc_strengths": "111;22;66;81", "wc_weaknesses": "625;256;352;266", "wc_questions": "10;19;108;27", "wc_review": "841;360;595;450", "wc_reply_reviewers": "0;27;33;0", "wc_reply_authors": "1168;1071;1566;667", "reply_reviewers": "0;1;1;0", "reply_authors": "3;4;4;2", "rating_avg": [ 4.0, 1.0 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.25, 0.82915619758885 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.75, 0.82915619758885 ], "wc_summary_avg": [ 75.75, 12.028611723719408 ], "wc_strengths_avg": [ 70.0, 32.101401838549044 ], "wc_weaknesses_avg": [ 374.75, 149.22361575836447 ], "wc_questions_avg": [ 41.0, 39.147158262126766 ], "wc_review_avg": [ 561.5, 181.84952570738258 ], "wc_reply_reviewers_avg": [ 15.0, 15.149257407543116 ], "wc_reply_authors_avg": [ 1118.0, 319.6928213144612 ], "reply_reviewers_avg": [ 0.5, 0.5 ], "reply_authors_avg": [ 3.25, 0.82915619758885 ], "replies_avg": [ 21, 0 ], "authors#_avg": [ 4, 0 ], 
"corr_rating_confidence": -1.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:SZA6_kszl4QJ:scholar.google.com/&scioq=Multiobjective+Stochastic+Linear+Bandits+under+Lexicographic+Ordering&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "City University of Hong Kong", "aff_unique_dep": "", "aff_unique_url": "https://www.cityu.edu.hk", "aff_unique_abbr": "CityU", "aff_campus_unique_index": "0;0;0;0", "aff_campus_unique": "Hong Kong SAR", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "China" }, { "id": "BSqVfAFJWz", "title": "The Distributional Reward Critic Architecture for Reinforcement Learning Under Confusion Matrix Reward Perturbations", "track": "main", "status": "Reject", "tldr": "", "abstract": "We study reinforcement learning in the presence of an unknown reward perturbation. Existing methodologies for this problem make strong assumptions including reward smoothness, known perturbations, and/or perturbations that do not modify the optimal policy. We study the case of unknown arbitrary perturbations that discretize and shuffle reward space, but have the property that the true reward belongs to the most frequently observed class after perturbation. This class of perturbations generalizes existing classes (and, in the limit, all continuous bounded perturbations) and defeats existing methods. We introduce an adaptive distributional reward critic and show theoretically that it can recover the true rewards under technical conditions. Under the targeted perturbation in discrete and continuous control tasks, we win/tie the highest return in 40/57 settings (compared to 16/57 for the best baseline). Even under the untargeted perturbation, we still win an edge over the baseline designed especially for that setting.", "keywords": "Reinforcement Learning;policy gradient;reward perturbation", "primary_area": "reinforcement learning", "supplementary_material": "", "author": "Xi Chen;Zhihui Zhu;Andrew Perrault", "authorids": "~Xi_Chen42;~Zhihui_Zhu1;~Andrew_Perrault1", "gender": "M;M;M", "homepage": "https://engineering.osu.edu/people/chen.10183;https://zhihuizhu.github.io/;https://aperrault.github.io", "dblp": ";71/8081;151/3622", "google_scholar": ";gmSwszcAAAAJ;https://scholar.google.com/citations?hl=en", "orcid": ";;0000-0002-5062-7958", "linkedin": ";;andrew-perrault-2b956733/", "or_profile": "~Xi_Chen42;~Zhihui_Zhu1;~Andrew_Perrault1", "aff": "Ohio State University, Columbus;Ohio State University, Columbus;Ohio State University", "aff_domain": "osu.edu;osu.edu;osu.edu", "position": "PhD student;Assistant Professor;Assistant Professor", "bibtex": "@misc{\nchen2024the,\ntitle={The Distributional Reward Critic Architecture for Reinforcement Learning Under Confusion Matrix Reward Perturbations},\nauthor={Xi Chen and Zhihui Zhu and Andrew Perrault},\nyear={2024},\nurl={https://openreview.net/forum?id=BSqVfAFJWz}\n}", "github": "", "project": "", "reviewers": "Jfuy;XsR2;wJ8T;m2dC", "site": "https://openreview.net/forum?id=BSqVfAFJWz", "pdf_size": 5730338, "rating": "3;5;6;6", "confidence": "4;4;3;3", "soundness": "2;2;3;3", "contribution": "1;2;2;2", "presentation": "2;3;3;3", "wc_summary": "66;99;131;208", "wc_strengths": "29;162;100;93", "wc_weaknesses": "545;401;108;291", "wc_questions": "47;40;48;186", "wc_review": "687;702;387;778", "wc_reply_reviewers": "35;471;230;101", "wc_reply_authors": "2747;2473;1056;2262", "reply_reviewers": "1;3;1;1", "reply_authors": "5;4;3;5", "rating_avg": [ 5.0, 
1.224744871391589 ], "confidence_avg": [ 3.5, 0.5 ], "soundness_avg": [ 2.5, 0.5 ], "contribution_avg": [ 1.75, 0.4330127018922193 ], "presentation_avg": [ 2.75, 0.4330127018922193 ], "wc_summary_avg": [ 126.0, 52.62603918213872 ], "wc_strengths_avg": [ 96.0, 47.090338711884414 ], "wc_weaknesses_avg": [ 336.25, 159.62044825146933 ], "wc_questions_avg": [ 80.25, 61.132540434698114 ], "wc_review_avg": [ 638.5, 149.24560295030471 ], "wc_reply_reviewers_avg": [ 209.25, 166.60188324265727 ], "wc_reply_authors_avg": [ 2134.5, 645.9792953338365 ], "reply_reviewers_avg": [ 1.5, 0.8660254037844386 ], "reply_authors_avg": [ 4.25, 0.82915619758885 ], "replies_avg": [ 29, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": -0.8164965809277259, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:l8lSyEEwV9sJ:scholar.google.com/&scioq=The+Distributional+Reward+Critic+Architecture+for+Reinforcement+Learning+Under+Confusion+Matrix+Reward+Perturbations&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;0;0", "aff_unique_norm": "Ohio State University", "aff_unique_dep": "", "aff_unique_url": "https://www.osu.edu", "aff_unique_abbr": "OSU", "aff_campus_unique_index": "0;0", "aff_campus_unique": "Columbus;", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "title": "What Makes Good Data for Alignment? A Comprehensive Study of Automatic Data Selection in Instruction Tuning", "status": "Poster", "track": "main", "site": "https://iclr.cc/virtual/2024/poster/19215", "id": "BTKAeLqLMw", "author_site": "Wei Liu, Weihao Zeng, Keqing He, Yong Jiang, Junxian He", "tldr": "", "abstract": "Instruction tuning is a standard technique employed to align large language models to end tasks and user preferences after the initial pretraining phase. Recent research indicates the critical role of data engineering in instruction tuning -- when appropriately selected, only limited data is necessary to achieve superior performance. However, we still lack a principled understanding of what makes good instruction tuning data for alignment, and how we should select data automatically and effectively. In this work, we delve deeply into automatic data selection strategies for alignment. We start with controlled studies to measure data across three dimensions: complexity, quality, and diversity, along which we examine existing methods and introduce novel techniques for enhanced data measurement. Subsequently, we propose a simple strategy to select data samples based on the measurement. We present Deita (short for Data-Efficient Instruction Tuning for Alignment), a series of models fine-tuned from LLaMA models using data samples automatically selected with our proposed approach. When assessed through both automatic metrics and human evaluation, Deita performs better or on par with the state-of-the-art open-source alignment models such as Vicuna and WizardLM with only 6K training data samples -- 10x less than the data used in the baselines. 
We anticipate this work to provide clear guidelines and tools on automatic data selection, aiding researchers and practitioners in achieving data-efficient alignment.", "keywords": "data selection;instruction tuning;large language models", "primary_area": "general machine learning (i.e., none of the above)", "supplementary_material": "", "author": "Wei Liu;Weihao Zeng;Keqing He;Yong Jiang;Junxian He", "authorids": "~Wei_Liu25;~Weihao_Zeng2;~Keqing_He1;~Yong_Jiang1;~Junxian_He1", "gender": "M;M;;M;M", "homepage": "https://vpeterv.github.io/;https://zeng-wh.github.io/;https://helicqin.github.io/about/index.html;http://jiangyong.site/;https://jxhe.github.io", "dblp": "49/3283-131;174/3836;79/2314;;188/6127.html", "google_scholar": "https://scholar.google.com/citations?hl=zh-CN;;811USNoAAAAJ;sxXZWQQAAAAJ;BIFGeoUAAAAJ", "orcid": "0000-0003-2195-2310;;;;", "linkedin": ";;;;", "or_profile": "~Wei_Liu25;~Weihao_Zeng2;~Keqing_He1;~Yong_Jiang1;~Junxian_He1", "aff": "ShanghaiTech University;Beijing University of Posts and Telecommunications;Meituan Group;Tongyi Lab;Hong Kong University of Science and Technology", "aff_domain": "shanghaitech.edu.cn;bupt.edu.cn;meituan.com;alibaba-inc.com;ust.hk", "position": "MS student;MS student;Researcher;Researcher;Assistant Professor", "bibtex": "@inproceedings{\nliu2024what,\ntitle={What Makes Good Data for Alignment? A Comprehensive Study of Automatic Data Selection in Instruction Tuning},\nauthor={Wei Liu and Weihao Zeng and Keqing He and Yong Jiang and Junxian He},\nbooktitle={The Twelfth International Conference on Learning Representations},\nyear={2024},\nurl={https://openreview.net/forum?id=BTKAeLqLMw}\n}", "github": "", "project": "", "reviewers": "RtKh;zdke;NSy4", "pdf_size": 1834469, "rating": "5;6;8", "confidence": "2;3;4", "soundness": "2;3;2", "contribution": "2;2;3", "presentation": "3;4;3", "wc_summary": "101;57;279", "wc_strengths": "44;66;59", "wc_weaknesses": "265;77;251", "wc_questions": "179;35;95", "wc_review": "589;235;684", "wc_reply_reviewers": "135;26;0", "wc_reply_authors": "1042;728;1297", "reply_reviewers": "1;1;0", "reply_authors": "3;1;3", "rating_avg": [ 6.333333333333333, 1.247219128924647 ], "confidence_avg": [ 3.0, 0.816496580927726 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.3333333333333335, 0.4714045207910317 ], "presentation_avg": [ 3.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 145.66666666666666, 95.97684906036224 ], "wc_strengths_avg": [ 56.333333333333336, 9.177266598624136 ], "wc_weaknesses_avg": [ 197.66666666666666, 85.5154307063286 ], "wc_questions_avg": [ 103.0, 59.0592922409336 ], "wc_review_avg": [ 502.6666666666667, 193.20167931177224 ], "wc_reply_reviewers_avg": [ 53.666666666666664, 58.482665997902515 ], "wc_reply_authors_avg": [ 1022.3333333333334, 232.70916517308802 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 2.3333333333333335, 0.9428090415820634 ], "replies_avg": [ 15, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": 0.9819805060619659, "gs_citation": 169, "gs_cited_by_link": "https://scholar.google.com/scholar?cites=16674966283854801761&as_sdt=5,44&sciodt=0,44&hl=en", "gs_version_total": 4, "openreview": "https://openreview.net/forum?id=BTKAeLqLMw", "pdf": "https://openreview.net/pdf?id=BTKAeLqLMw", "email": "shanghaitech.edu.cn;bupt.edu.cn;meituan.com;alibaba-inc.com;ust.hk", "author_num": 5, "aff_unique_index": "0;1;2;3;4", "aff_unique_norm": "ShanghaiTech University;Beijing University of 
Posts and Telecommunications;Meituan Group;Tongyi Lab;Hong Kong University of Science and Technology", "aff_unique_dep": ";;;;", "aff_unique_url": "https://www.shanghaitech.edu.cn;http://www.bupt.edu.cn/;https://www.meituan.com;;https://www.ust.hk", "aff_unique_abbr": "ShanghaiTech;BUPT;Meituan;;HKUST", "aff_campus_unique_index": "1;2", "aff_campus_unique": ";Beijing;Hong Kong SAR", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "China;" }, { "id": "BTcZwitfgX", "title": "Rethinking The Dependence Between Gradients and The Initial Point in Deep Learning", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Despite the considerable advancements in Deep Neural Networks (DNNs), their intrinsic opacity remains a challenge rooted in their foundational design. In this study, we elucidate a novel phenomenon wherein the representation of cumulative gradients (the aggregate changes in iterative gradients) exhibits a certain independence from the initial computation point of the gradients. This implies that learned gradients can be assigned to other arbitrarily initialized yet well-trained neural networks while retaining a representation comparable to that of the original network. This occurrence is counterintuitive and cannot be well explained by existing optimization theories. Additionally, we observe that the learned model weights can also be reassigned to different neural networks. In essence, these learned gradients can be viewed as a neural network with analogous representations. Furthermore, this reassignment of gradients and model weights can potentially mitigate catastrophic forgetting when learning multiple tasks. We provide a theoretical framework to support this claim. 
Our extensive experiments clearly illustrate this phenomenon and its potential to mitigate catastrophic forgetting.", "keywords": "black-box neural network", "primary_area": "learning theory", "supplementary_material": "", "author": "Hui Xu;Jie Shao", "authorids": "~Hui_Xu2;~Jie_Shao4", "gender": "M;M", "homepage": "http://cfm.uestc.edu.cn/~shaojie/;", "dblp": ";", "google_scholar": "ikbw5okAAAAJ;", "orcid": "0000-0003-2615-1555;0000-0003-2081-555X", "linkedin": ";", "or_profile": "~Jie_Shao4;~Hui.kim_Xu1", "aff": "University of Electronic Science and Technology of China;University of Electronic Science and Technology of China", "aff_domain": "uestc.edu.cn;uestc.edu.cn", "position": "Professor;Associate Professor", "bibtex": "@misc{\nxu2024rethinking,\ntitle={Rethinking The Dependence Between Gradients and The Initial Point in Deep Learning},\nauthor={Hui Xu and Jie Shao},\nyear={2024},\nurl={https://openreview.net/forum?id=BTcZwitfgX}\n}", "github": "", "project": "", "reviewers": "izxw;gRM6;vmiY;gVxp", "site": "https://openreview.net/forum?id=BTcZwitfgX", "pdf_size": 409432, "rating": "1;3;3;3", "confidence": "4;4;4;5", "soundness": "1;2;1;2", "contribution": "1;3;1;1", "presentation": "1;2;1;2", "wc_summary": "76;167;233;80", "wc_strengths": "9;147;24;52", "wc_weaknesses": "359;244;746;252", "wc_questions": "12;99;129;139", "wc_review": "456;657;1132;523", "wc_reply_reviewers": "0;0;0;0", "wc_reply_authors": "0;0;0;0", "reply_reviewers": "0;0;0;0", "reply_authors": "0;0;0;0", "rating_avg": [ 2.5, 0.8660254037844386 ], "confidence_avg": [ 4.25, 0.4330127018922193 ], "soundness_avg": [ 1.5, 0.5 ], "contribution_avg": [ 1.5, 0.8660254037844386 ], "presentation_avg": [ 1.5, 0.5 ], "wc_summary_avg": [ 139.0, 65.32610504231826 ], "wc_strengths_avg": [ 58.0, 53.65165421494476 ], "wc_weaknesses_avg": [ 400.25, 204.71733561181378 ], "wc_questions_avg": [ 94.75, 49.991874339736455 ], "wc_review_avg": [ 692.0, 264.1410607989602 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 4, 0 ], "authors#_avg": [ 2, 0 ], "corr_rating_confidence": 0.3333333333333333, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:TNZ5w7_MWdkJ:scholar.google.com/&scioq=Rethinking+The+Dependence+Between+Gradients+and+The+Initial+Point+in+Deep+Learning&hl=en&as_sdt=0,44", "gs_version_total": 0, "aff_unique_index": "0;0", "aff_unique_norm": "University of Electronic Science and Technology of China", "aff_unique_dep": "", "aff_unique_url": "https://www.uestc.edu.cn", "aff_unique_abbr": "UESTC", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0", "aff_country_unique": "China" }, { "id": "BTd5Tak69u", "title": "Unsupervised Learning of Object-Centric Representation from Multi-Viewpoint Scenes", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Objects in a 2D image are influenced by factors like perspective, illumination, and occlusion in the corresponding 3D scene. This results in the challenge of identifying objects across different viewpoints. Humans can effortlessly identify objects from different viewpoints by recognizing their invariant characteristics in 3D dimensions. Motivated by this observation, we propose an object-centric learning method named Learning Object-centric Representation from Multi-viewpoint (LORM), which learns the representations of objects from multi-viewpoint scenes without any supervision. 
LORM leverages a novel slot attention encoder to decompose the representation of a scene into two distinct components: a viewpoint representation and several object representations. The former encompasses the viewpoint-dependent attributes (i.e., camera position and lighting) of the image observed from each viewpoint, while the latter captures the viewpoint-independent features (i.e., appearance, shape, scale, rotation and position) of the object across various perspectives. We propose a mixture patch decoder to enable LORM to simultaneously handle complex scenes and reconstruct an individual object's 2D appearance and shape at a specific viewpoint through the corresponding object representation and viewpoint representation. Extensive experiments are conducted on three complex simulation datasets, and the results demonstrate that our proposed method outperforms compared methods in individual object reconstruction while achieving comparable performance in scene decomposition.", "keywords": "Object-Centric Learning;Mulit-Viewpoints Learning", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/65b1c01b47c8a3004ec9b64cc8853e82ca0289a8.zip", "author": "Tonglin Chen;Yinxuan Huang;Zhimeng Shen;Jinghao Huang;Lin Zhu;Dakun Yang;Bin Li;Xiangyang Xue", "authorids": "~Tonglin_Chen1;~Yinxuan_Huang1;~Zhimeng_Shen2;~Jinghao_Huang1;~Lin_Zhu11;~Dakun_Yang1;~Bin_Li4;~Xiangyang_Xue2", "gender": "M;;;M;M;;M;M", "homepage": ";;;https://1827406014.github.io/;https://dblp.org/pid/72/527.html;;https://aimpressionist.github.io/publications;http://homepage.fudan.edu.cn//xyxue", "dblp": ";;;;72/527.html;145/5194.html;89/6764-15;84/3791", "google_scholar": "https://scholar.google.com/citations?hl=zh-CN;;;;;;8t97oL8AAAAJ;", "orcid": ";;;;;;0000-0002-9633-0033;0000-0002-4897-9209", "linkedin": ";;;;;;;", "or_profile": "~Tonglin_Chen1;~Yinxuan_Huang1;~Zhimeng_Shen2;~Jinghao_Huang1;~Lin_Zhu11;~Dakun_Yang1;~Bin_Li4;~Xiangyang_Xue2", "aff": "Fudan University;;;Fudan University;;;Fudan University;Fudan University", "aff_domain": "fudan.edu.cn;;;fudan.edu.cn;;;fudan.edu.cn;fudan.edu.cn", "position": "PhD student;;;MS student;;;Full Professor;Full Professor", "bibtex": "@misc{\nchen2024unsupervised,\ntitle={Unsupervised Learning of Object-Centric Representation from Multi-Viewpoint Scenes},\nauthor={Tonglin Chen and Yinxuan Huang and Zhimeng Shen and Jinghao Huang and Lin Zhu and Dakun Yang and Bin Li and Xiangyang Xue},\nyear={2024},\nurl={https://openreview.net/forum?id=BTd5Tak69u}\n}", "github": "", "project": "", "reviewers": "LpCd;AcUg;UJby", "site": "https://openreview.net/forum?id=BTd5Tak69u", "pdf_size": 4390086, "rating": "3;3;5", "confidence": "4;3;4", "soundness": "3;2;3", "contribution": "2;2;2", "presentation": "2;1;3", "wc_summary": "31;59;40", "wc_strengths": "19;42;42", "wc_weaknesses": "246;565;126", "wc_questions": "2;33;10", "wc_review": "298;699;218", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 3.6666666666666665, 0.9428090415820634 ], "confidence_avg": [ 3.6666666666666665, 0.4714045207910317 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.0 ], "presentation_avg": [ 2.0, 0.816496580927726 ], "wc_summary_avg": [ 43.333333333333336, 11.671427600007732 ], "wc_strengths_avg": [ 34.333333333333336, 10.842303978193728 ], "wc_weaknesses_avg": [ 312.3333333333333, 185.25717859835342 ], 
"wc_questions_avg": [ 15.0, 13.140268896284683 ], "wc_review_avg": [ 405.0, 210.43922321341776 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 3, 0 ], "authors#_avg": [ 8, 0 ], "corr_rating_confidence": 0.5, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:Qp5scWleTboJ:scholar.google.com/&scioq=Unsupervised+Learning+of+Object-Centric+Representation+from+Multi-Viewpoint+Scenes&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;0;0;0", "aff_unique_norm": "Fudan University", "aff_unique_dep": "", "aff_unique_url": "https://www.fudan.edu.cn", "aff_unique_abbr": "Fudan", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0;0", "aff_country_unique": "China" }, { "id": "BUDxvMRkc4", "title": "BLG: BALANCED LANGUAGE DISTRIBUTION AS GUIDANCE FOR ROBUST LONG-TAILED VISION CLASSIFICATION", "track": "main", "status": "Reject", "tldr": "", "abstract": "Recently, pre-trained contrastive visual-linguistic models such as CLIP have shown promising multi-modal capabilities in processing various downstream vision tasks. However, their effectiveness in handling the long-tailed vision recognition problem remains under-explored. In this work, we observe that \\textit{textual features from fine-tuned CLIP are relatively balanced and discriminative than the visual features}. Based on this observation, we propose to leverage balanced text features as prototypes to guide disentangled robust representation learning of biased visual features. Specifically, we first fine-tune CLIP via contrastive learning to help the encoders adapt to the target imbalanced dataset. Then we freeze the vision encoder and employ a linear adapter to refine the biased vision representation. For final vision recognition, a linear classifier initialized by fine-tuned textual features is integrated into the framework, where we consider the weights of the classifier as prototypes. For robust vision representation learning, we introduce a principled approach where we minimize the optimal transport distance between refined visual features and prototypes to help disentangle the biased vision features and continuously optimize prototypes moving towards the class center. We also design a supervised contrastive learning loss based on the transport plan to introduce more supervised signals and class-level information for further robust representation learning. 
Extensive experiments on long-tailed vision recognition benchmarks demonstrate the superiority of our method in using vision-language information for imbalanced visual recognition, achieving state-of-the-art (SOTA) performance.", "keywords": "Long-tailed vision recognition;multi-modality;optimal transport", "primary_area": "representation learning for computer vision, audio, language, and other modalities", "supplementary_material": "/attachment/b805fb2185572ba7feeabfb2e6cf778a213f331a.zip", "author": "Zhuo Li;He Zhao;Zhen Li;Dan dan Guo;Xiang Wan", "authorids": "~Zhuo_Li5;~He_Zhao1;~Zhen_Li6;~Dan_dan_Guo1;~Xiang_Wan1", "gender": "M;;;F;M", "homepage": ";;;https://github.com/Dan123dan;http://www.sribd.cn/teacher/28", "dblp": ";;;121/1618;", "google_scholar": "https://scholar.google.com/citations?hl=zh-CN;;;https://scholar.google.com.hk/citations?user=QLOY4JkAAAAJ;", "orcid": "0009-0000-6451-4877;;;;", "linkedin": ";;;;", "or_profile": "~Zhuo_Li5;~He_Zhao1;~Zhen_Li6;~Dan_dan_Guo1;~Xiang_Wan1", "aff": "The Chinese University of Hong Kong, Shenzhen;;;Jilin University;Shenzhen Research Institute of Big Data", "aff_domain": "link.cuhk.edu.cn;;;jlu.edu.cn;sribd.cn", "position": "PhD student;;;Lecturer;Principal Researcher", "bibtex": "@misc{\nli2024blg,\ntitle={{BLG}: {BALANCED} {LANGUAGE} {DISTRIBUTION} {AS} {GUIDANCE} {FOR} {ROBUST} {LONG}-{TAILED} {VISION} {CLASSIFICATION}},\nauthor={Zhuo Li and He Zhao and Zhen Li and Dan dan Guo and Xiang Wan},\nyear={2024},\nurl={https://openreview.net/forum?id=BUDxvMRkc4}\n}", "github": "", "project": "", "reviewers": "pMKo;nBTe;V37f", "site": "https://openreview.net/forum?id=BUDxvMRkc4", "pdf_size": 1696887, "rating": "3;5;6", "confidence": "5;4;2", "soundness": "2;3;3", "contribution": "1;2;3", "presentation": "2;3;2", "wc_summary": "57;105;63", "wc_strengths": "22;33;79", "wc_weaknesses": "221;92;100", "wc_questions": "4;163;70", "wc_review": "304;393;312", "wc_reply_reviewers": "118;264;82", "wc_reply_authors": "2089;2250;1172", "reply_reviewers": "2;1;1", "reply_authors": "6;6;3", "rating_avg": [ 4.666666666666667, 1.247219128924647 ], "confidence_avg": [ 3.6666666666666665, 1.247219128924647 ], "soundness_avg": [ 2.6666666666666665, 0.4714045207910317 ], "contribution_avg": [ 2.0, 0.816496580927726 ], "presentation_avg": [ 2.3333333333333335, 0.4714045207910317 ], "wc_summary_avg": [ 75.0, 21.354156504062622 ], "wc_strengths_avg": [ 44.666666666666664, 24.689178916188272 ], "wc_weaknesses_avg": [ 137.66666666666666, 59.016005362010816 ], "wc_questions_avg": [ 79.0, 65.22269543648132 ], "wc_review_avg": [ 336.3333333333333, 40.20226638166339 ], "wc_reply_reviewers_avg": [ 154.66666666666666, 78.69491018413382 ], "wc_reply_authors_avg": [ 1837.0, 474.7975006954719 ], "reply_reviewers_avg": [ 1.3333333333333333, 0.4714045207910317 ], "reply_authors_avg": [ 5.0, 1.4142135623730951 ], "replies_avg": [ 26, 0 ], "authors#_avg": [ 5, 0 ], "corr_rating_confidence": -0.9285714285714286, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:Zt0xXu-bXz8J:scholar.google.com/&scioq=BLG:+BALANCED+LANGUAGE+DISTRIBUTION+AS+GUIDANCE+FOR+ROBUST+LONG-TAILED+VISION+CLASSIFICATION&hl=en&as_sdt=0,5", "gs_version_total": 0, "aff_unique_index": "0;1;2", "aff_unique_norm": "Chinese University of Hong Kong;Jilin University;Shenzhen Research Institute of Big Data", "aff_unique_dep": ";;", "aff_unique_url": "https://www.cuhk.edu.cn;http://www.jlu.edu.cn;http://www.sribd.cn", "aff_unique_abbr": "CUHK;JLU;", "aff_campus_unique_index": "0", 
"aff_campus_unique": "Shenzhen;", "aff_country_unique_index": "0;0;0", "aff_country_unique": "China" }, { "id": "BUNkXMwfXL", "title": "Why Diffusion Models Are Stable and How to Make Them Faster: An Empirical Investigation and Optimization", "track": "main", "status": "Withdraw", "tldr": "", "abstract": "Diffusion models, a potent generative framework, have garnered considerable attention in recent years. While many posit that the superiority of diffusion models stems from their stable training process compared to Generative Adversarial Networks (GANs), these assertions often rest on intuition and lack empirical substantiation. \nIn this paper, we aim to provide direct evidence to explain why diffusion models exhibit remarkable stability during training. We start by conducting a consistency experiment, where we compare the generation results of models with different hyper-parameters, such as initialization and model structure, under the same sampling conditions. Our results show that diffusion models produce consistent generation results across different hyper-parameters, indicating that they are stable in learning the mapping between noise and data. We then compare the loss landscapes of diffusion models and GANs, and find that diffusion models have much smoother loss landscapes, implying better convergence stability. Based on these analyses, we propose two optimization methods for diffusion models, namely the curriculum learning based timestep schedule (CLTS) and the momentum decay with learning rate compensation (MDLRC), which optimize the sampling probability of timesteps and the momentum selection, respectively, to accelerate convergence. For example, on ImageNet128, our methods achieve a 2.6x speedup in training, demonstrating the effectiveness of our methods.", "keywords": "diffusion model;curriculum learning;momentum decay;loss landscape", "primary_area": "generative models", "supplementary_material": "", "author": "Tianshuo Xu;Peng Mi;Ruilin Wang;Yingcong Chen", "authorids": "~Tianshuo_Xu1;~Peng_Mi1;~Ruilin_Wang1;yingcongchen@hkust-gz.edu.cn", "gender": "M;M;;", "homepage": ";https://www.github.com/Mi-Peng;https://github.com/Wangruiln;", "dblp": "304/1328;;;", "google_scholar": "ZOi14IUAAAAJ;PTM4HCsAAAAJ;;", "orcid": ";;;", "linkedin": ";;;", "or_profile": "~Tianshuo_Xu1;~Peng_Mi1;~Ruilin_Wang1;yingcongchen@hkust-gz.edu.cn", "aff": "Hong Kong University of Science and Technology (Guang Zhou);;Xiamen University;", "aff_domain": "hkust-gz.edu.cn;;xmu.edu.cn;", "position": "PhD student;;MS student;", "bibtex": "@misc{\nxu2024why,\ntitle={Why Diffusion Models Are Stable and How to Make Them Faster: An Empirical Investigation and Optimization},\nauthor={Tianshuo Xu and Peng Mi and Ruilin Wang and Yingcong Chen},\nyear={2024},\nurl={https://openreview.net/forum?id=BUNkXMwfXL}\n}", "github": "", "project": "", "reviewers": "fHcz;bVYL;sw1d", "site": "https://openreview.net/forum?id=BUNkXMwfXL", "pdf_size": 19071151, "rating": "3;3;5", "confidence": "4;4;4", "soundness": "3;1;2", "contribution": "2;1;3", "presentation": "3;3;3", "wc_summary": "53;192;108", "wc_strengths": "30;8;62", "wc_weaknesses": "95;6;152", "wc_questions": "45;289;186", "wc_review": "223;495;508", "wc_reply_reviewers": "0;0;0", "wc_reply_authors": "0;0;0", "reply_reviewers": "0;0;0", "reply_authors": "0;0;0", "rating_avg": [ 3.6666666666666665, 0.9428090415820634 ], "confidence_avg": [ 4.0, 0.0 ], "soundness_avg": [ 2.0, 0.816496580927726 ], "contribution_avg": [ 2.0, 0.816496580927726 ], "presentation_avg": [ 3.0, 
0.0 ], "wc_summary_avg": [ 117.66666666666667, 57.156704671358455 ], "wc_strengths_avg": [ 33.333333333333336, 22.17105219775452 ], "wc_weaknesses_avg": [ 84.33333333333333, 60.07957685899224 ], "wc_questions_avg": [ 173.33333333333334, 100.01444340138522 ], "wc_review_avg": [ 408.6666666666667, 131.39338728498564 ], "wc_reply_reviewers_avg": [ 0, 0 ], "wc_reply_authors_avg": [ 0, 0 ], "reply_reviewers_avg": [ 0, 0 ], "reply_authors_avg": [ 0, 0 ], "replies_avg": [ 3, 0 ], "authors#_avg": [ 4, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:O9sHkLUgSYkJ:scholar.google.com/&scioq=Why+Diffusion+Models+Are+Stable+and+How+to+Make+Them+Faster:+An+Empirical+Investigation+and+Optimization&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;1", "aff_unique_norm": "Hong Kong University of Science and Technology;Xiamen University", "aff_unique_dep": ";", "aff_unique_url": "https://www.ust.hk;https://www.xmu.edu.cn", "aff_unique_abbr": "HKUST;XMU", "aff_campus_unique_index": "0", "aff_campus_unique": "Hong Kong SAR;", "aff_country_unique_index": "0;0", "aff_country_unique": "China" }, { "id": "BURvGotSLz", "title": "Is Training Necessary for Representation Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "The field of neural network-based encoders is currently experiencing rapid growth. However, in the pursuit of higher performance, models are becoming increasingly complex and specialized for specific datasets and tasks, resulting in a loss of generality.\nIn response to this trend, we explore the finite element method (FEM) as a general solution for feature extraction and introduce LagrangeEmbedding, an untrainable encoder with a universal architecture across various types of raw data and recognition tasks. Our experimental results demonstrate its successful application and good performance in diverse domains, including data fitting, computer vision, and natural language processing.\nLagrangeEmbedding is explainable, it adheres to the error-bound formula in FEM, which governs the relationship between mean absolute error (MAE) and the number of model parameters. \nAs the encoder has no trainable parameters, neural networks utilizing it only need to train a linear layer. 
This reduces gradient computation and significantly accelerates training convergence.\nOur research promises to advance machine learning by opening up new avenues for unsupervised representation learning.", "keywords": "unsupervised representation learning;universal encoder;finite element method;multi-scale mesh;multivariate Lagrange interpolation", "primary_area": "unsupervised, self-supervised, semi-supervised, and supervised representation learning", "supplementary_material": "/attachment/ce7a5cb197787a608b6f1bb42a52e03867ce1da0.zip", "author": "Zheng Li;Jerry Cheng;Huanying Gu", "authorids": "~Zheng_Li12;~Jerry_Cheng2;~Huanying_Gu1", "gender": "M;M;F", "homepage": ";https://www.nyit.edu/bio/jcheng18;", "dblp": ";;98/3698", "google_scholar": "https://scholar.google.com.hk/citations?user=JccDEo4AAAAJ;n_uoQ6MAAAAJ;sTEfizUAAAAJ", "orcid": ";;", "linkedin": ";;", "or_profile": "~Zheng_Li12;~Jerry_Cheng2;~Huanying_Gu1", "aff": "New York Institute of Technology;New York Institute of Technology;New York Institute of Technology", "aff_domain": "nyit.edu;nyit.edu;nyit.edu", "position": "PhD student;Assistant Professor;Full Professor", "bibtex": "@misc{\nli2024is,\ntitle={Is Training Necessary for Representation Learning},\nauthor={Zheng Li and Jerry Cheng and Huanying Gu},\nyear={2024},\nurl={https://openreview.net/forum?id=BURvGotSLz}\n}", "github": "", "project": "", "reviewers": "RtZ7;YmUG;P3jk", "site": "https://openreview.net/forum?id=BURvGotSLz", "pdf_size": 5549026, "rating": "5;6;6", "confidence": "3;3;3", "soundness": "2;2;3", "contribution": "2;3;3", "presentation": "2;4;2", "wc_summary": "71;58;88", "wc_strengths": "49;70;22", "wc_weaknesses": "313;524;94", "wc_questions": "14;44;162", "wc_review": "447;696;366", "wc_reply_reviewers": "387;206;0", "wc_reply_authors": "2045;2343;928", "reply_reviewers": "1;1;0", "reply_authors": "5;9;3", "rating_avg": [ 5.666666666666667, 0.4714045207910317 ], "confidence_avg": [ 3.0, 0.0 ], "soundness_avg": [ 2.3333333333333335, 0.4714045207910317 ], "contribution_avg": [ 2.6666666666666665, 0.4714045207910317 ], "presentation_avg": [ 2.6666666666666665, 0.9428090415820634 ], "wc_summary_avg": [ 72.33333333333333, 12.283683848458853 ], "wc_strengths_avg": [ 47.0, 19.6468827043885 ], "wc_weaknesses_avg": [ 310.3333333333333, 175.55689169674378 ], "wc_questions_avg": [ 73.33333333333333, 63.88183535942662 ], "wc_review_avg": [ 503.0, 140.42079618062277 ], "wc_reply_reviewers_avg": [ 197.66666666666666, 158.10193617480533 ], "wc_reply_authors_avg": [ 1772.0, 609.0719716639953 ], "reply_reviewers_avg": [ 0.6666666666666666, 0.4714045207910317 ], "reply_authors_avg": [ 5.666666666666667, 2.494438257849294 ], "replies_avg": [ 25, 0 ], "authors#_avg": [ 3, 0 ], "corr_rating_confidence": 0.0, "gs_citation": 0, "gs_cited_by_link": "https://scholar.google.com/scholar?q=related:fQ5dqJjmjrsJ:scholar.google.com/&scioq=Is+Training+Necessary+for+Representation+Learning&hl=en&as_sdt=0,33", "gs_version_total": 0, "aff_unique_index": "0;0;0", "aff_unique_norm": "New York Institute of Technology", "aff_unique_dep": "", "aff_unique_url": "https://www.nyit.edu", "aff_unique_abbr": "NYIT", "aff_campus_unique_index": "", "aff_campus_unique": "", "aff_country_unique_index": "0;0;0", "aff_country_unique": "United States" }, { "id": "BUSZQWbRaR", "title": "Generalized Convergence Analysis of Tsetlin Machines: A Probabilistic Approach to Concept Learning", "track": "main", "status": "Reject", "tldr": "", "abstract": "Tsetlin Machines (TMs) have garnered increasing interest for 
their ability to learn concepts via propositional formulas and their proven efficiency across various application domains. Despite this, the convergence proof for the TMs, particularly for the AND operator (\\emph{conjunction} of literals), in the generalized case (inputs greater than two bits) remains an open problem. This paper aims to fill this gap by presenting a comprehensive convergence analysis of Tsetlin automaton-based Machine Learning algorithms. We introduce a novel framework, referred to as Probabilistic Concept Learning (PCL), which simplifies the TM structure while incorporating dedicated feedback mechanisms and dedicated inclusion/exclusion probabilities for literals. Given $n$ features, PCL aims to learn a set of conjunction clauses $C_i$ each associated with a distinct inclusion probability $p_i$. Most importantly, we establish a theoretical proof confirming that, for any clause $C_k$, PCL converges to a conjunction of literals when $0.5